2 * Copyright (c) 1989, 1993
3 * The Regents of the University of California. All rights reserved.
5 * This code is derived from software contributed to Berkeley by
6 * Rick Macklem at The University of Guelph.
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. Neither the name of the University nor the names of its contributors
17 * may be used to endorse or promote products derived from this software
18 * without specific prior written permission.
20 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 #include <sys/cdefs.h>
35 __FBSDID("$FreeBSD$");
38 * Rpc op calls, generally called from the vnode op calls or through the
39 * buffer cache, for NFS v2, 3 and 4.
40 * These do not normally make any changes to vnode arguments or use
41 * structures that might change between the VFS variants. The returned
42 * arguments are all at the end, after the NFSPROC_T *p one.
46 #include "opt_inet6.h"
48 #include <fs/nfs/nfsport.h>
49 #include <sys/sysctl.h>
51 SYSCTL_DECL(_vfs_nfs);
/*
 * Read/write sysctl knob vfs.nfs.ignore_eexist (default 0); the
 * description string below states what it controls.
 */
53 static int nfsignore_eexist = 0;
54 SYSCTL_INT(_vfs_nfs, OID_AUTO, ignore_eexist, CTLFLAG_RW,
55 &nfsignore_eexist, 0, "NFS ignore EEXIST replies for mkdir/symlink");
/* Variables that are defined in other files and only referenced here. */
60 extern int nfs_numnfscbd;
61 extern struct timeval nfsboottime;
62 extern u_int32_t newnfs_false, newnfs_true;
63 extern nfstype nfsv34_type[9];
64 extern int nfsrv_useacl;
65 extern char nfsv4_callbackaddr[INET6_ADDRSTRLEN];
66 extern int nfscl_debuglevel;
/* Tunables defined by this file. */
68 int nfstest_outofseq = 0;
/*
 * Non-zero: nfsrpc_openrpc() marks every open as using POSIX lock
 * semantics, even when the server reply lacks NFSV4OPEN_LOCKTYPEPOSIX.
 */
69 int nfscl_assumeposixlocks = 1;
/*
 * Non-zero (together with nfs_numnfscbd > 0): nfsrpc_setclient() puts a
 * real callback address in the SetClientID request.
 */
70 int nfscl_enablecallb = 0;
/* Port encoded into the callback address built by nfsrpc_setclient(). */
71 short nfsv4_cbport = NFSV4_CBPORT;
/*
 * Non-zero: nfsrpc_setattr() also tries to open a regular file that has
 * no stateid when the setattr does not change the size.
 */
72 int nfstest_openallsetattr = 0;
73 #endif /* !APPLEKEXT */
/* Offset of d_name within struct dirent, i.e. the size of the fixed part. */
75 #define DIRHDSIZ offsetof(struct dirent, d_name)
78 * nfscl_getsameserver() can return one of three values:
79 * NFSDSP_USETHISSESSION - Use this session for the DS.
80 * NFSDSP_SEQTHISSESSION - Use the nfsclds_sequence field of this dsp for new
82 * NFSDSP_NOTFOUND - No matching server was found.
85 NFSDSP_USETHISSESSION = 0,
86 NFSDSP_SEQTHISSESSION = 1,
90 static int nfsrpc_setattrrpc(vnode_t , struct vattr *, nfsv4stateid_t *,
91 struct ucred *, NFSPROC_T *, struct nfsvattr *, int *, void *);
92 static int nfsrpc_readrpc(vnode_t , struct uio *, struct ucred *,
93 nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *, void *);
94 static int nfsrpc_writerpc(vnode_t , struct uio *, int *, int *,
95 struct ucred *, nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *,
97 static int nfsrpc_createv23(vnode_t , char *, int, struct vattr *,
98 nfsquad_t, int, struct ucred *, NFSPROC_T *, struct nfsvattr *,
99 struct nfsvattr *, struct nfsfh **, int *, int *, void *);
100 static int nfsrpc_createv4(vnode_t , char *, int, struct vattr *,
101 nfsquad_t, int, struct nfsclowner *, struct nfscldeleg **, struct ucred *,
102 NFSPROC_T *, struct nfsvattr *, struct nfsvattr *, struct nfsfh **, int *,
103 int *, void *, int *);
104 static int nfsrpc_locku(struct nfsrv_descript *, struct nfsmount *,
105 struct nfscllockowner *, u_int64_t, u_int64_t,
106 u_int32_t, struct ucred *, NFSPROC_T *, int);
107 static int nfsrpc_setaclrpc(vnode_t, struct ucred *, NFSPROC_T *,
108 struct acl *, nfsv4stateid_t *, void *);
109 static int nfsrpc_getlayout(struct nfsmount *, vnode_t, struct nfsfh *, int,
110 uint32_t *, nfsv4stateid_t *, uint64_t, struct nfscllayout **,
111 struct ucred *, NFSPROC_T *);
112 static int nfsrpc_fillsa(struct nfsmount *, struct sockaddr_storage *,
113 struct nfsclds **, NFSPROC_T *);
114 static void nfscl_initsessionslots(struct nfsclsession *);
115 static int nfscl_doflayoutio(vnode_t, struct uio *, int *, int *, int *,
116 nfsv4stateid_t *, int, struct nfscldevinfo *, struct nfscllayout *,
117 struct nfsclflayout *, uint64_t, uint64_t, struct ucred *, NFSPROC_T *);
118 static int nfsrpc_readds(vnode_t, struct uio *, nfsv4stateid_t *, int *,
119 struct nfsclds *, uint64_t, int, struct nfsfh *, struct ucred *,
121 static int nfsrpc_writeds(vnode_t, struct uio *, int *, int *,
122 nfsv4stateid_t *, struct nfsclds *, uint64_t, int,
123 struct nfsfh *, int, struct ucred *, NFSPROC_T *);
124 static enum nfsclds_state nfscl_getsameserver(struct nfsmount *,
125 struct nfsclds *, struct nfsclds **);
127 static int nfsrpc_commitds(vnode_t, uint64_t, int, struct nfsclds *,
128 struct nfsfh *, struct ucred *, NFSPROC_T *, void *);
132 * nfs null call from vfs.
/*
 * Send the NFSPROC_NULL RPC for the mount that vp belongs to.
 *   vp   - vnode used to start and issue the request
 *   cred - credentials handed to nfscl_request()
 *   p    - caller context handed to nfscl_request()
 * The result is the nfscl_request() error, or the reply status
 * (nd_repstat) when the request itself succeeded but the reply did not.
 */
135 nfsrpc_null(vnode_t vp, struct ucred *cred, NFSPROC_T *p)
138 struct nfsrv_descript nfsd, *nd = &nfsd;
140 NFSCL_REQSTART(nd, NFSPROC_NULL, vp);
141 error = nfscl_request(nd, vp, p, cred, NULL);
/* Only fall back to the reply status when there is no request error. */
142 if (nd->nd_repstat && !error)
143 error = nd->nd_repstat;
/* The reply mbuf chain is released before returning. */
144 mbuf_freem(nd->nd_mrep);
150 * For nfs version 3 and 4, use the access rpc to check accessibility. If file
151 * modes are changed on the server, accesses might still fail later.
/*
 * Check access to vp by building an NFSACCESS_* bit mask and asking the
 * server through nfsrpc_accessrpc().
 *   acmode    - requested access (NOTE(review): the tests on acmode are
 *               not part of the lines shown here - confirm how each bit
 *               maps onto the NFSACCESS_* flags)
 *   nap       - receives the attributes returned with the reply
 *   attrflagp - receives the attribute-valid flag
 * The mask always starts with NFSACCESS_READ; directories and other
 * vnode types add different bits (LOOKUP versus EXECUTE, and so on).
 */
154 nfsrpc_access(vnode_t vp, int acmode, struct ucred *cred,
155 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp)
158 u_int32_t mode, rmode;
161 mode = NFSACCESS_READ;
/* Directory and non-directory vnodes request different access bits. */
164 if (vnode_vtype(vp) == VDIR) {
166 mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND |
169 mode |= NFSACCESS_LOOKUP;
172 mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND);
174 mode |= NFSACCESS_EXECUTE;
178 * Now, just call nfsrpc_accessrpc() to do the actual RPC.
180 error = nfsrpc_accessrpc(vp, mode, cred, p, nap, attrflagp, &rmode,
184 * The NFS V3 spec does not clarify whether or not
185 * the returned access bits can be a superset of
186 * the ones requested, so...
/*
 * Every requested bit must be present in the granted mask; extra granted
 * bits are tolerated. NOTE(review): the statement executed when a bit is
 * missing is not shown here - presumably an access error is set.
 */
188 if (!error && (rmode & mode) != mode)
194 * The actual rpc, separated out for Darwin.
/*
 * Issue the ACCESS RPC for vp.
 *   mode      - NFSACCESS_* bits being asked for
 *   nap       - receives the post-op attributes
 *   attrflagp - receives the attribute-valid flag
 *   rmodep    - NOTE(review): presumably receives the granted bits decoded
 *               into rmode; the store is not among the lines shown
 * For NFSv4 a Getattr op is appended to the compound so attributes come
 * back with the access result.
 */
197 nfsrpc_accessrpc(vnode_t vp, u_int32_t mode, struct ucred *cred,
198 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, u_int32_t *rmodep,
202 u_int32_t supported, rmode;
204 struct nfsrv_descript nfsd, *nd = &nfsd;
205 nfsattrbit_t attrbits;
/* Request body: a single XDR word holding the requested access mask. */
209 NFSCL_REQSTART(nd, NFSPROC_ACCESS, vp);
210 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
211 *tl = txdr_unsigned(mode);
212 if (nd->nd_flag & ND_NFSV4) {
214 * And do a Getattr op.
216 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
217 *tl = txdr_unsigned(NFSV4OP_GETATTR);
218 NFSGETATTR_ATTRBIT(&attrbits);
219 (void) nfsrv_putattrbit(nd, &attrbits);
221 error = nfscl_request(nd, vp, p, cred, stuff);
/* NFSv3 places the post-op attributes ahead of the access word. */
224 if (nd->nd_flag & ND_NFSV3) {
225 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
/*
 * On success an NFSv4 reply holds two words (supported, then access),
 * while the other dissect below reads a single access word. For NFSv4
 * the attributes follow the access result.
 */
229 if (!nd->nd_repstat) {
230 if (nd->nd_flag & ND_NFSV4) {
231 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
232 supported = fxdr_unsigned(u_int32_t, *tl++);
234 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
236 rmode = fxdr_unsigned(u_int32_t, *tl);
237 if (nd->nd_flag & ND_NFSV4)
238 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
241 * It's not obvious what should be done about
242 * unsupported access modes. For now, be paranoid
243 * and clear the unsupported ones.
248 error = nd->nd_repstat;
250 mbuf_freem(nd->nd_mrep);
/*
 * NFSv4 open of vp on behalf of a local open.
 *   amode - local open mode, translated into NFSV4OPEN_ACCESSREAD and/or
 *           NFSV4OPEN_ACCESSWRITE (the tests on amode are not shown here)
 * Only regular files are opened on the server. Each pass of the loop
 * obtains an open structure from nfscl_open(), performs the Open RPC when
 * nfscl_open() asks for one (NFSCLOPEN_DOOPEN) and releases the structure
 * again. Transient server errors are retried after a nap; expired or bad
 * stateid errors are retried a bounded number of times.
 */
258 nfsrpc_open(vnode_t vp, int amode, struct ucred *cred, NFSPROC_T *p)
260 struct nfsclopen *op;
261 struct nfscldeleg *dp;
263 struct nfsnode *np = VTONFS(vp);
264 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
265 u_int32_t mode, clidrev;
266 int ret, newone, error, expireret = 0, retrycnt;
269 * For NFSv4, Open Ops are only done on Regular Files.
271 if (vnode_vtype(vp) != VREG)
275 mode |= NFSV4OPEN_ACCESSREAD;
277 mode |= NFSV4OPEN_ACCESSWRITE;
/* Debug-only trace of the file name and one file handle byte. */
282 { char name[100]; int namel;
283 namel = (np->n_v4->n4_namelen < 100) ? np->n_v4->n4_namelen : 99;
284 bcopy(NFS4NODENAME(np->n_v4), name, namel);
286 printf("rpcopen p=0x%x name=%s",p->p_pid,name);
287 if (nfhp->nfh_len > 0) printf(" fh=0x%x\n",nfhp->nfh_fh[12]);
288 else printf(" fhl=0\n");
293 error = nfscl_open(vp, nfhp->nfh_fh, nfhp->nfh_len, mode, 1,
294 cred, p, NULL, &op, &newone, &ret, 1);
/* Remember the clientid revision so expiry can be detected later. */
298 if (nmp->nm_clp != NULL)
299 clidrev = nmp->nm_clp->nfsc_clientidrev;
/*
 * The Open RPC uses the directory file handle and name saved in n_v4,
 * plus the file handle of the file itself.
 */
302 if (ret == NFSCLOPEN_DOOPEN) {
303 if (np->n_v4 != NULL) {
304 error = nfsrpc_openrpc(nmp, vp, np->n_v4->n4_data,
305 np->n_v4->n4_fhlen, np->n_fhp->nfh_fh,
306 np->n_fhp->nfh_len, mode, op,
307 NFS4NODENAME(np->n_v4), np->n_v4->n4_namelen, &dp,
308 0, 0x0, cred, p, 0, 0);
/* Two platform variants of clearing NDELEGMOD in the node flags. */
311 OSBitAndAtomic((int32_t)~NDELEGMOD, (UInt32 *)&np->n_flag);
314 np->n_flag &= ~NDELEGMOD;
316 * Invalidate the attribute cache, so that
317 * attributes that pre-date the issue of a
318 * delegation are not cached, since the
319 * cached attributes will remain valid while
320 * the delegation is held.
322 NFSINVALATTRCACHE(np);
/* Hand any delegation returned by the Open to the state code. */
325 (void) nfscl_deleg(nmp->nm_mountp,
326 op->nfso_own->nfsow_clp,
327 nfhp->nfh_fh, nfhp->nfh_len, cred, p, &dp);
332 newnfs_copyincred(cred, &op->nfso_cred);
333 } else if (ret == NFSCLOPEN_SETCRED)
335 * This is a new local open on a delegation. It needs
336 * to have credentials so that an open can be done
337 * against the server during recovery.
339 newnfs_copyincred(cred, &op->nfso_cred);
342 * nfso_opencnt is the count of how many VOP_OPEN()s have
343 * been done on this Open successfully and a VOP_CLOSE()
344 * is expected for each of these.
345 * If error is non-zero, don't increment it, since the Open
346 * hasn't succeeded yet.
350 nfscl_openrelease(nmp, op, error, newone);
/*
 * Transient errors: nap, then the loop condition below retries.
 * Expired/bad stateid: ask the state code whether the client expired.
 */
351 if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
352 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
353 error == NFSERR_BADSESSION) {
354 (void) nfs_catnap(PZERO, error, "nfs_open");
355 } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
357 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
/* Expired/bad stateid retries are capped by retrycnt < 4. */
360 } while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
361 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
362 error == NFSERR_BADSESSION ||
363 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
364 expireret == 0 && clidrev != 0 && retrycnt < 4));
365 if (error && retrycnt >= 4)
371 * the actual open rpc
/*
 * Build and send the NFSv4 Open RPC and decode its reply.
 *   nfhp/fhlen       - file handle the request is started on
 *   newfhp/newfhlen  - file handle of the file being opened; copied into
 *                      any delegation structure allocated here and passed
 *                      to nfsrpc_openconfirm()
 *   mode             - access bits in the low part, deny bits above
 *                      NFSLCK_SHIFT
 *   op               - open structure; its stateid is overwritten from a
 *                      successful reply and its owner seqid is advanced
 *   name/namelen     - component name sent after the claim type
 *   dpp              - delegation in/out (NOTE(review): the lines that
 *                      read and write *dpp are not all shown - confirm)
 *   reclaim          - when zero, an OpenConfirm is done if the server
 *                      asks for one (NOTE(review): presumably non-zero
 *                      selects the CLAIMPREVIOUS form - confirm)
 *   delegtype        - delegation type sent with the CLAIMPREVIOUS form
 *   recursed         - non-zero on the nested call made below, which
 *                      prevents a further nested retry
 */
374 nfsrpc_openrpc(struct nfsmount *nmp, vnode_t vp, u_int8_t *nfhp, int fhlen,
375 u_int8_t *newfhp, int newfhlen, u_int32_t mode, struct nfsclopen *op,
376 u_int8_t *name, int namelen, struct nfscldeleg **dpp,
377 int reclaim, u_int32_t delegtype, struct ucred *cred, NFSPROC_T *p,
378 int syscred, int recursed)
381 struct nfsrv_descript nfsd, *nd = &nfsd;
382 struct nfscldeleg *dp, *ndp = NULL;
383 struct nfsvattr nfsva;
384 u_int32_t rflags, deleg;
385 nfsattrbit_t attrbits;
386 int error, ret, acesize, limitby;
387 struct nfsclsession *tsep;
/* Open arguments: owner seqid, share access, share deny, clientid. */
391 nfscl_reqstart(nd, NFSPROC_OPEN, nmp, nfhp, fhlen, NULL, NULL);
392 NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
393 *tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
394 *tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
395 *tl++ = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
396 tsep = nfsmnt_mdssession(nmp);
397 *tl++ = tsep->nfsess_clientid.lval[0];
398 *tl = tsep->nfsess_clientid.lval[1];
399 (void) nfsm_strtom(nd, op->nfso_own->nfsow_owner, NFSV4CL_LOCKNAMELEN);
/* No create; then one of three claim types is encoded. */
400 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
401 *tl++ = txdr_unsigned(NFSV4OPEN_NOCREATE);
403 *tl = txdr_unsigned(NFSV4OPEN_CLAIMPREVIOUS);
404 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
405 *tl = txdr_unsigned(delegtype);
/* Claim against a held delegation: its stateid is sent. */
408 *tl = txdr_unsigned(NFSV4OPEN_CLAIMDELEGATECUR);
409 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
410 if (NFSHASNFSV4N(nmp))
413 *tl++ = dp->nfsdl_stateid.seqid;
414 *tl++ = dp->nfsdl_stateid.other[0];
415 *tl++ = dp->nfsdl_stateid.other[1];
416 *tl = dp->nfsdl_stateid.other[2];
418 *tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
420 (void) nfsm_strtom(nd, name, namelen);
/* Append a Getattr for the change and modify-time attributes. */
422 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
423 *tl = txdr_unsigned(NFSV4OP_GETATTR);
424 NFSZERO_ATTRBIT(&attrbits);
425 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_CHANGE);
426 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TIMEMODIFY);
427 (void) nfsrv_putattrbit(nd, &attrbits);
429 nd->nd_flag |= ND_USEGSSNAME;
430 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
431 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
434 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
/* Successful reply: new open stateid, result flags, attribute bits. */
435 if (!nd->nd_repstat) {
436 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
438 op->nfso_stateid.seqid = *tl++;
439 op->nfso_stateid.other[0] = *tl++;
440 op->nfso_stateid.other[1] = *tl++;
441 op->nfso_stateid.other[2] = *tl;
442 rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
443 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
/* Delegation type word; read and write delegations are decoded below. */
446 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
447 deleg = fxdr_unsigned(u_int32_t, *tl);
448 if (deleg == NFSV4OPEN_DELEGATEREAD ||
449 deleg == NFSV4OPEN_DELEGATEWRITE) {
450 if (!(op->nfso_own->nfsow_clp->nfsc_flags &
451 NFSCLFLAGS_FIRSTDELEG))
452 op->nfso_own->nfsow_clp->nfsc_flags |=
453 (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
/* The delegation structure is allocated with room for the file handle. */
454 MALLOC(ndp, struct nfscldeleg *,
455 sizeof (struct nfscldeleg) + newfhlen,
456 M_NFSCLDELEG, M_WAITOK);
457 LIST_INIT(&ndp->nfsdl_owner);
458 LIST_INIT(&ndp->nfsdl_lock);
459 ndp->nfsdl_clp = op->nfso_own->nfsow_clp;
460 ndp->nfsdl_fhlen = newfhlen;
461 NFSBCOPY(newfhp, ndp->nfsdl_fh, newfhlen);
462 newnfs_copyincred(cred, &ndp->nfsdl_cred);
463 nfscl_lockinit(&ndp->nfsdl_rwlock);
464 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
466 ndp->nfsdl_stateid.seqid = *tl++;
467 ndp->nfsdl_stateid.other[0] = *tl++;
468 ndp->nfsdl_stateid.other[1] = *tl++;
469 ndp->nfsdl_stateid.other[2] = *tl++;
470 ret = fxdr_unsigned(int, *tl);
471 if (deleg == NFSV4OPEN_DELEGATEWRITE) {
472 ndp->nfsdl_flags = NFSCLDL_WRITE;
474 * Indicates how much the file can grow.
476 NFSM_DISSECT(tl, u_int32_t *,
478 limitby = fxdr_unsigned(int, *tl++);
/* Size limit is either a byte count or a count multiplied by a unit. */
480 case NFSV4OPEN_LIMITSIZE:
481 ndp->nfsdl_sizelimit = fxdr_hyper(tl);
483 case NFSV4OPEN_LIMITBLOCKS:
484 ndp->nfsdl_sizelimit =
485 fxdr_unsigned(u_int64_t, *tl++);
486 ndp->nfsdl_sizelimit *=
487 fxdr_unsigned(u_int64_t, *tl);
490 error = NFSERR_BADXDR;
494 ndp->nfsdl_flags = NFSCLDL_READ;
497 ndp->nfsdl_flags |= NFSCLDL_RECALL;
498 error = nfsrv_dissectace(nd, &ndp->nfsdl_ace, &ret,
/* Any other delegation type value is a malformed reply. */
502 } else if (deleg != NFSV4OPEN_DELEGATENONE) {
503 error = NFSERR_BADXDR;
/* Attributes from the appended Getattr are recorded in the delegation. */
506 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
507 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
508 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
509 NULL, NULL, NULL, p, cred);
513 ndp->nfsdl_change = nfsva.na_filerev;
514 ndp->nfsdl_modtime = nfsva.na_mtime;
515 ndp->nfsdl_flags |= NFSCLDL_MODTIMESET;
/* OpenConfirm when the server asks for it; NFSERR_DELAY is retried. */
517 if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM)) {
519 ret = nfsrpc_openconfirm(vp, newfhp, newfhlen, op,
521 if (ret == NFSERR_DELAY)
522 (void) nfs_catnap(PZERO, ret, "nfs_open");
523 } while (ret == NFSERR_DELAY);
526 if ((rflags & NFSV4OPEN_LOCKTYPEPOSIX) ||
527 nfscl_assumeposixlocks)
528 op->nfso_posixlock = 1;
530 op->nfso_posixlock = 0;
533 * If the server is handing out delegations, but we didn't
534 * get one because an OpenConfirm was required, try the
535 * Open again, to get a delegation. This is a harmless no-op,
536 * from a server's point of view.
538 if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM) &&
539 (op->nfso_own->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG)
540 && !error && dp == NULL && ndp == NULL && !recursed) {
/* Nested call passes recursed = 1 so it cannot recurse again. */
542 ret = nfsrpc_openrpc(nmp, vp, nfhp, fhlen, newfhp,
543 newfhlen, mode, op, name, namelen, &ndp, 0, 0x0,
544 cred, p, syscred, 1);
545 if (ret == NFSERR_DELAY)
546 (void) nfs_catnap(PZERO, ret, "nfs_open2");
547 } while (ret == NFSERR_DELAY);
550 FREE((caddr_t)ndp, M_NFSCLDELEG);
553 if (ret == NFSERR_STALECLIENTID ||
554 ret == NFSERR_STALEDONTRECOVER ||
555 ret == NFSERR_BADSESSION)
/* Reply status becomes the error when nothing else failed. */
560 if (nd->nd_repstat != 0 && error == 0)
561 error = nd->nd_repstat;
562 if (error == NFSERR_STALECLIENTID)
563 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
567 else if (ndp != NULL)
568 FREE((caddr_t)ndp, M_NFSCLDELEG);
569 mbuf_freem(nd->nd_mrep);
/*
 * Send the NFSv4 OpenDowngrade RPC for the open described by op.
 *   mode - new access bits in the low part, deny bits above NFSLCK_SHIFT
 *   op   - open whose stateid is sent and, on success, replaced by the
 *          stateid in the reply; the owner seqid is advanced
 * A stale stateid error starts client recovery.
 */
577 nfsrpc_opendowngrade(vnode_t vp, u_int32_t mode, struct nfsclopen *op,
578 struct ucred *cred, NFSPROC_T *p)
581 struct nfsrv_descript nfsd, *nd = &nfsd;
584 NFSCL_REQSTART(nd, NFSPROC_OPENDOWNGRADE, vp);
/* Arguments: stateid, owner seqid, share access, share deny. */
585 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 3 * NFSX_UNSIGNED);
/* NOTE(review): the NFSv4.1 branch body is not shown here. */
586 if (NFSHASNFSV4N(VFSTONFS(vnode_mount(vp))))
589 *tl++ = op->nfso_stateid.seqid;
590 *tl++ = op->nfso_stateid.other[0];
591 *tl++ = op->nfso_stateid.other[1];
592 *tl++ = op->nfso_stateid.other[2];
593 *tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
594 *tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
595 *tl = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
596 error = nfscl_request(nd, vp, p, cred, NULL);
599 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
/* On success the reply carries the updated open stateid. */
600 if (!nd->nd_repstat) {
601 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
602 op->nfso_stateid.seqid = *tl++;
603 op->nfso_stateid.other[0] = *tl++;
604 op->nfso_stateid.other[1] = *tl++;
605 op->nfso_stateid.other[2] = *tl;
607 if (nd->nd_repstat && error == 0)
608 error = nd->nd_repstat;
609 if (error == NFSERR_STALESTATEID)
610 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
612 mbuf_freem(nd->nd_mrep);
617 * V4 Close operation.
/*
 * Close handling for vp. Only regular files are processed.
 *   doclose - NOTE(review): presumably selects between nfscl_doclose()
 *             and nfscl_getclose(); the test itself is not shown here
 * The client structure returned through clp is released afterwards.
 */
620 nfsrpc_close(vnode_t vp, int doclose, NFSPROC_T *p)
622 struct nfsclclient *clp;
625 if (vnode_vtype(vp) != VREG)
628 error = nfscl_doclose(vp, &clp, p);
630 error = nfscl_getclose(vp, &clp);
634 nfscl_clientrelease(clp);
/*
 * Release all byte range locks held under the open op, release the lock
 * owners on the server, close the open and free the local state.
 *   nmp - mount the open belongs to
 *   op  - open being closed; freed by this function
 * All RPCs are done with a temporary credential copied from the open.
 */
642 nfsrpc_doclose(struct nfsmount *nmp, struct nfsclopen *op, NFSPROC_T *p)
644 struct nfsrv_descript nfsd, *nd = &nfsd;
645 struct nfscllockowner *lp, *nlp;
646 struct nfscllock *lop, *nlop;
648 u_int64_t off = 0, len = 0;
649 u_int32_t type = NFSV4LOCKT_READ;
650 int error, do_unlock, trycnt;
652 tcred = newnfs_getcred();
653 newnfs_copycred(&op->nfso_cred, tcred);
655 * (Theoretically this could be done in the same
656 * compound as the close, but having multiple
657 * sequenced Ops in the same compound might be
658 * too scary for some servers.)
660 if (op->nfso_posixlock) {
663 type = NFSV4LOCKT_READ;
667 * Since this function is only called from VOP_INACTIVE(), no
668 * other thread will be manipulating this Open. As such, the
669 * lock lists are not being changed by other threads, so it should
670 * be safe to do this without locking.
672 LIST_FOREACH(lp, &op->nfso_lock, nfsl_list) {
674 LIST_FOREACH_SAFE(lop, &lp->nfsl_lock, nfslo_list, nlop) {
/* Without POSIX lock semantics each lock range is unlocked by itself. */
675 if (op->nfso_posixlock == 0) {
676 off = lop->nfslo_first;
677 len = lop->nfslo_end - lop->nfslo_first;
678 if (lop->nfslo_type == F_WRLCK)
679 type = NFSV4LOCKT_WRITE;
681 type = NFSV4LOCKT_READ;
/* The unlock is retried on grace/delay replies, bounded by trycnt. */
686 error = nfsrpc_locku(nd, nmp, lp, off,
687 len, type, tcred, p, 0);
688 if ((nd->nd_repstat == NFSERR_GRACE ||
689 nd->nd_repstat == NFSERR_DELAY) &&
691 (void) nfs_catnap(PZERO,
694 } while ((nd->nd_repstat == NFSERR_GRACE ||
695 nd->nd_repstat == NFSERR_DELAY) &&
696 error == 0 && trycnt++ < 5);
697 if (op->nfso_posixlock)
700 nfscl_freelock(lop, 0);
703 * Do a ReleaseLockOwner.
704 * The lock owner name nfsl_owner may be used by other opens for
705 * other files but the lock_owner4 name that nfsrpc_rellockown()
706 * puts on the wire has the file handle for this file appended
707 * to it, so it can be done now.
709 (void)nfsrpc_rellockown(nmp, lp, lp->nfsl_open->nfso_fh,
710 lp->nfsl_open->nfso_fhlen, tcred, p);
714 * There could be other Opens for different files on the same
715 * OpenOwner, so locking is required.
718 nfscl_lockexcl(&op->nfso_own->nfsow_rwlock, NFSCLSTATEMUTEXPTR);
/* The close is repeated for as long as the server reports grace. */
721 error = nfscl_tryclose(op, tcred, nmp, p);
722 if (error == NFSERR_GRACE)
723 (void) nfs_catnap(PZERO, error, "nfs_close");
724 } while (error == NFSERR_GRACE);
726 nfscl_lockunlock(&op->nfso_own->nfsow_rwlock);
/* Finally drop the local lock owner and open structures. */
728 LIST_FOREACH_SAFE(lp, &op->nfso_lock, nfsl_list, nlp)
729 nfscl_freelockowner(lp, 0);
730 nfscl_freeopen(op, 0);
736 * The actual Close RPC.
/*
 * Build and send the NFSv4 Close RPC for the open op.
 *   nd  - request descriptor supplied by the caller; the reply status is
 *         left in nd->nd_repstat
 *   op  - open being closed; its file handle, owner seqid and stateid
 *         are sent, and the owner seqid is advanced
 * A stale stateid reply starts client recovery.
 */
739 nfsrpc_closerpc(struct nfsrv_descript *nd, struct nfsmount *nmp,
740 struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p,
746 nfscl_reqstart(nd, NFSPROC_CLOSE, nmp, op->nfso_fh,
747 op->nfso_fhlen, NULL, NULL);
/* Arguments: owner seqid followed by the open stateid. */
748 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
749 *tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
/* NOTE(review): the NFSv4.1 branch body is not shown here. */
750 if (NFSHASNFSV4N(nmp))
753 *tl++ = op->nfso_stateid.seqid;
754 *tl++ = op->nfso_stateid.other[0];
755 *tl++ = op->nfso_stateid.other[1];
756 *tl = op->nfso_stateid.other[2];
758 nd->nd_flag |= ND_USEGSSNAME;
759 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
760 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
763 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
/* The returned stateid is stepped over but not stored. */
764 if (nd->nd_repstat == 0)
765 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
766 error = nd->nd_repstat;
767 if (error == NFSERR_STALESTATEID)
768 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
770 mbuf_freem(nd->nd_mrep);
775 * V4 Open Confirm RPC.
/*
 * Send the NFSv4.0 OpenConfirm RPC for the open op.
 *   nfhp/fhlen - file handle the request is started on
 *   op         - open whose stateid is sent and, on success, replaced by
 *                the stateid in the reply; the owner seqid is advanced
 * Returns 0 without any RPC on an NFSv4.1 mount. A stale stateid reply
 * starts client recovery.
 */
778 nfsrpc_openconfirm(vnode_t vp, u_int8_t *nfhp, int fhlen,
779 struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p)
782 struct nfsrv_descript nfsd, *nd = &nfsd;
783 struct nfsmount *nmp;
786 nmp = VFSTONFS(vnode_mount(vp));
787 if (NFSHASNFSV4N(nmp))
788 return (0); /* No confirmation for NFSv4.1. */
789 nfscl_reqstart(nd, NFSPROC_OPENCONFIRM, nmp, nfhp, fhlen, NULL, NULL);
/* Arguments: open stateid followed by the owner seqid. */
790 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
791 *tl++ = op->nfso_stateid.seqid;
792 *tl++ = op->nfso_stateid.other[0];
793 *tl++ = op->nfso_stateid.other[1];
794 *tl++ = op->nfso_stateid.other[2];
795 *tl = txdr_unsigned(op->nfso_own->nfsow_seqid);
796 error = nfscl_request(nd, vp, p, cred, NULL);
799 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
/* On success the reply carries the confirmed open stateid. */
800 if (!nd->nd_repstat) {
801 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
802 op->nfso_stateid.seqid = *tl++;
803 op->nfso_stateid.other[0] = *tl++;
804 op->nfso_stateid.other[1] = *tl++;
805 op->nfso_stateid.other[2] = *tl;
807 error = nd->nd_repstat;
808 if (error == NFSERR_STALESTATEID)
809 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
811 mbuf_freem(nd->nd_mrep);
816 * Do the setclientid and setclientid confirm RPCs. Called from nfs_statfs()
817 * when a mount has just occurred and when the server replies NFSERR_EXPIRED.
/*
 * Establish the client identity with the server.
 *   nmp     - mount being set up
 *   clp     - client structure; its revision, renew and expire times and
 *             clientid revision are updated here
 *   reclaim - on an NFSv4.1 mount a ReclaimComplete is sent after the
 *             session is created only when this is zero
 * NFSv4.1 mounts do ExchangeID followed by CreateSession and link the new
 * session at the head of nmp->nm_sess. NFSv4.0 mounts do SetClientID,
 * SetClientIDConfirm and then a Getattr for the lease time.
 */
820 nfsrpc_setclient(struct nfsmount *nmp, struct nfsclclient *clp, int reclaim,
821 struct ucred *cred, NFSPROC_T *p)
824 struct nfsrv_descript nfsd;
825 struct nfsrv_descript *nd = &nfsd;
826 nfsattrbit_t attrbits;
827 u_int8_t *cp = NULL, *cp2, addr[INET6_ADDRSTRLEN + 9];
829 int error, isinet6 = 0, callblen;
/* Static counter: every call hands the client a new revision number. */
832 static u_int32_t rev = 0;
835 struct nfsclsession *tsep;
837 if (nfsboottime.tv_sec == 0)
838 NFSSETBOOTTIME(nfsboottime);
839 clp->nfsc_rev = rev++;
/* NFSv4.1 path. */
840 if (NFSHASNFSV4N(nmp)) {
842 * Either there was no previous session or the
843 * previous session has failed, so...
844 * do an ExchangeID followed by the CreateSession.
846 error = nfsrpc_exchangeid(nmp, clp, &nmp->nm_sockreq,
847 NFSV4EXCH_USEPNFSMDS | NFSV4EXCH_USENONPNFS, &dsp, cred, p);
848 NFSCL_DEBUG(1, "aft exch=%d\n", error);
850 error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
852 dsp->nfsclds_sess.nfsess_sequenceid, 1, cred, p);
856 * The old sessions cannot be safely free'd
857 * here, since they may still be used by
861 if (TAILQ_FIRST(&nmp->nm_sess) != NULL)
862 tsep = NFSMNT_MDSSESSION(nmp);
863 TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp,
866 * Wake up RPCs waiting for a slot on the
867 * old session. These will then fail with
868 * NFSERR_BADSESSION and be retried with the
869 * new session by nfsv4_setsequence().
870 * Also wakeup() processes waiting for the
874 wakeup(&tsep->nfsess_slots);
875 wakeup(&nmp->nm_sess);
878 nfscl_freenfsclds(dsp);
879 NFSCL_DEBUG(1, "aft createsess=%d\n", error);
880 if (error == 0 && reclaim == 0) {
881 error = nfsrpc_reclaimcomplete(nmp, cred, p);
882 NFSCL_DEBUG(1, "aft reclaimcomp=%d\n", error);
883 if (error == NFSERR_COMPLETEALREADY ||
884 error == NFSERR_NOTSUPP)
885 /* Ignore this error. */
892 * Allocate a single session structure for NFSv4.0, because some of
893 * the fields are used by NFSv4.0 although it doesn't do a session.
895 dsp = malloc(sizeof(struct nfsclds), M_NFSCLDS, M_WAITOK | M_ZERO);
896 mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
897 mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession", NULL, MTX_DEF);
899 TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp, nfsclds_list);
900 tsep = NFSMNT_MDSSESSION(nmp);
/* SetClientID: verifier is boot time plus revision, then the client id. */
903 nfscl_reqstart(nd, NFSPROC_SETCLIENTID, nmp, NULL, 0, NULL, NULL);
904 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
905 *tl++ = txdr_unsigned(nfsboottime.tv_sec);
906 *tl = txdr_unsigned(clp->nfsc_rev);
907 (void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
910 * set up the callback address
912 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
913 *tl = txdr_unsigned(NFS_CALLBCKPROG);
914 callblen = strlen(nfsv4_callbackaddr);
916 cp = nfscl_getmyip(nmp, &a6, &isinet6);
/*
 * A real callback address is only sent when callbacks are enabled, a
 * callback daemon count is positive and an address is available, either
 * configured in nfsv4_callbackaddr or found by nfscl_getmyip().
 */
917 if (nfscl_enablecallb && nfs_numnfscbd > 0 &&
918 (callblen > 0 || cp != NULL)) {
/* The port is appended as its two network-order bytes in decimal. */
919 port = htons(nfsv4_cbport);
920 cp2 = (u_int8_t *)&port;
923 strchr(nfsv4_callbackaddr, ':')) || isinet6) {
924 char ip6buf[INET6_ADDRSTRLEN], *ip6add;
926 (void) nfsm_strtom(nd, "tcp6", 4);
928 ip6_sprintf(ip6buf, (struct in6_addr *)cp);
931 ip6add = nfsv4_callbackaddr;
933 snprintf(addr, INET6_ADDRSTRLEN + 9, "%s.%d.%d",
934 ip6add, cp2[0], cp2[1]);
938 (void) nfsm_strtom(nd, "tcp", 3);
940 snprintf(addr, INET6_ADDRSTRLEN + 9,
941 "%d.%d.%d.%d.%d.%d", cp[0], cp[1],
942 cp[2], cp[3], cp2[0], cp2[1]);
944 snprintf(addr, INET6_ADDRSTRLEN + 9,
945 "%s.%d.%d", nfsv4_callbackaddr,
948 (void) nfsm_strtom(nd, addr, strlen(addr));
/* Otherwise an all-zero tcp address is sent as the callback address. */
950 (void) nfsm_strtom(nd, "tcp", 3);
951 (void) nfsm_strtom(nd, "0.0.0.0.0.0", 11);
953 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
954 *tl = txdr_unsigned(clp->nfsc_cbident);
955 nd->nd_flag |= ND_USEGSSNAME;
956 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
957 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
/* Reply: the clientid is stored in the session, then the confirm verifier. */
960 if (nd->nd_repstat == 0) {
961 NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
962 tsep->nfsess_clientid.lval[0] = *tl++;
963 tsep->nfsess_clientid.lval[1] = *tl++;
964 confirm.lval[0] = *tl++;
965 confirm.lval[1] = *tl;
966 mbuf_freem(nd->nd_mrep);
/* SetClientIDConfirm echoes the clientid and the confirm verifier. */
972 nfscl_reqstart(nd, NFSPROC_SETCLIENTIDCFRM, nmp, NULL, 0, NULL,
974 NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
975 *tl++ = tsep->nfsess_clientid.lval[0];
976 *tl++ = tsep->nfsess_clientid.lval[1];
977 *tl++ = confirm.lval[0];
978 *tl = confirm.lval[1];
979 nd->nd_flag |= ND_USEGSSNAME;
980 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
981 cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
984 mbuf_freem(nd->nd_mrep);
/* After a successful confirm, fetch the lease time of the mount root. */
986 if (nd->nd_repstat == 0) {
987 nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, nmp->nm_fh,
988 nmp->nm_fhsize, NULL, NULL);
989 NFSZERO_ATTRBIT(&attrbits);
990 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
991 (void) nfsrv_putattrbit(nd, &attrbits);
992 nd->nd_flag |= ND_USEGSSNAME;
993 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
994 cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
997 if (nd->nd_repstat == 0) {
998 error = nfsv4_loadattr(nd, NULL, NULL, NULL, NULL, 0, NULL,
999 NULL, NULL, NULL, NULL, 0, NULL, &lease, NULL, p, cred);
/* Renew and expiry times derive from the lease; the revision skips 0. */
1002 clp->nfsc_renew = NFSCL_RENEW(lease);
1003 clp->nfsc_expire = NFSD_MONOSEC + clp->nfsc_renew;
1004 clp->nfsc_clientidrev++;
1005 if (clp->nfsc_clientidrev == 0)
1006 clp->nfsc_clientidrev++;
1010 error = nd->nd_repstat;
1012 mbuf_freem(nd->nd_mrep);
/*
 * Send the Getattr RPC for vp and load the returned attributes into nap.
 *   stuff - opaque argument passed through to nfscl_request()
 * For NFSv4 the standard getattr attribute bitmap is put in the request.
 * On a failed reply the reply status becomes the error.
 */
1020 nfsrpc_getattr(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
1021 struct nfsvattr *nap, void *stuff)
1023 struct nfsrv_descript nfsd, *nd = &nfsd;
1025 nfsattrbit_t attrbits;
1027 NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
1028 if (nd->nd_flag & ND_NFSV4) {
1029 NFSGETATTR_ATTRBIT(&attrbits);
1030 (void) nfsrv_putattrbit(nd, &attrbits);
1032 error = nfscl_request(nd, vp, p, cred, stuff);
/* Attributes are decoded only from a successful reply. */
1035 if (!nd->nd_repstat)
1036 error = nfsm_loadattr(nd, nap);
1038 error = nd->nd_repstat;
1039 mbuf_freem(nd->nd_mrep);
1044 * nfs getattr call with non-vnode arguments.
/*
 * Getattr RPC addressed by mount and file handle instead of by vnode.
 *   nmp, fhp, fhlen - mount and file handle the request is started on
 *   nap             - receives the attributes
 *   xidp            - passed to newnfs_request()
 *   leasep          - for NFSv4, passed to nfsv4_loadattr() together with
 *                     the lease time attribute requested below
 * The RPC version defaults to NFS_VER2 (NOTE(review): the NFSv3 and
 * NFSv4 branches presumably overwrite vers on lines not shown here).
 */
1047 nfsrpc_getattrnovp(struct nfsmount *nmp, u_int8_t *fhp, int fhlen, int syscred,
1048 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, u_int64_t *xidp,
1051 struct nfsrv_descript nfsd, *nd = &nfsd;
1052 int error, vers = NFS_VER2;
1053 nfsattrbit_t attrbits;
1055 nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, fhp, fhlen, NULL, NULL);
/* NFSv4 asks for the standard attributes plus the lease time. */
1056 if (nd->nd_flag & ND_NFSV4) {
1058 NFSGETATTR_ATTRBIT(&attrbits);
1059 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
1060 (void) nfsrv_putattrbit(nd, &attrbits);
1061 } else if (nd->nd_flag & ND_NFSV3) {
1065 nd->nd_flag |= ND_USEGSSNAME;
1066 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
1067 NFS_PROG, vers, NULL, 1, xidp, NULL);
/* NFSv4 replies are decoded by nfsv4_loadattr(), others by nfsm_loadattr(). */
1070 if (nd->nd_repstat == 0) {
1071 if ((nd->nd_flag & ND_NFSV4) != 0)
1072 error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
1073 NULL, NULL, NULL, NULL, NULL, 0, NULL, leasep, NULL,
1076 error = nfsm_loadattr(nd, nap);
1078 error = nd->nd_repstat;
1079 mbuf_freem(nd->nd_mrep);
1084 * Do an nfs setattr operation.
/*
 * Set attributes (or an ACL) on vp, handling NFSv4 stateids and retries.
 *   vap       - attributes to set; a set va_size selects write access for
 *               the stateid lookup, otherwise read access is used
 *   aclp      - ACL handed to nfsrpc_setaclrpc() (NOTE(review): the test
 *               choosing between the attribute and ACL RPC is not shown)
 *   rnap      - receives the attributes returned by the server
 *   attrflagp - receives the attribute-valid flag
 * On an NFSv4 mount a stateid is looked up first; if none exists for a
 * regular file, the file may be opened here and is closed again after
 * the RPC. Transient errors are retried after a nap.
 */
1087 nfsrpc_setattr(vnode_t vp, struct vattr *vap, NFSACL_T *aclp,
1088 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *rnap, int *attrflagp,
1091 int error, expireret = 0, openerr, retrycnt;
1092 u_int32_t clidrev = 0, mode;
1093 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1095 nfsv4stateid_t stateid;
1098 if (nmp->nm_clp != NULL)
1099 clidrev = nmp->nm_clp->nfsc_clientidrev;
/* A size change needs a stateid with write access. */
1100 if (vap != NULL && NFSATTRISSET(u_quad_t, vap, va_size))
1101 mode = NFSV4OPEN_ACCESSWRITE;
1103 mode = NFSV4OPEN_ACCESSREAD;
1108 if (NFSHASNFSV4(nmp)) {
1109 nfhp = VTONFS(vp)->n_fhp;
1110 error = nfscl_getstateid(vp, nfhp->nfh_fh,
1111 nfhp->nfh_len, mode, 0, cred, p, &stateid, &lckp);
/*
 * No stateid for a regular file: open it when write access is needed or
 * when the nfstest_openallsetattr tunable is set, then look up again.
 */
1112 if (error && vnode_vtype(vp) == VREG &&
1113 (mode == NFSV4OPEN_ACCESSWRITE ||
1114 nfstest_openallsetattr)) {
1116 * No Open stateid, so try and open the file
1119 if (mode == NFSV4OPEN_ACCESSWRITE)
1120 openerr = nfsrpc_open(vp, FWRITE, cred,
1123 openerr = nfsrpc_open(vp, FREAD, cred,
1126 (void) nfscl_getstateid(vp,
1127 nfhp->nfh_fh, nfhp->nfh_len,
1128 mode, 0, cred, p, &stateid, &lckp);
1132 error = nfsrpc_setattrrpc(vp, vap, &stateid, cred, p,
1133 rnap, attrflagp, stuff);
1135 error = nfsrpc_setaclrpc(vp, cred, p, aclp, &stateid,
/* An open-mode error with a read stateid is recorded in the mount state. */
1137 if (error == NFSERR_OPENMODE && mode == NFSV4OPEN_ACCESSREAD) {
1139 nmp->nm_state |= NFSSTA_OPENMODE;
1142 if (error == NFSERR_STALESTATEID)
1143 nfscl_initiate_recovery(nmp->nm_clp);
1145 nfscl_lockderef(lckp);
1147 (void) nfsrpc_close(vp, 0, p);
/* Transient errors nap before the retry decided by the loop condition. */
1148 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1149 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1150 error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1151 (void) nfs_catnap(PZERO, error, "nfs_setattr");
1152 } else if ((error == NFSERR_EXPIRED ||
1153 error == NFSERR_BADSTATEID) && clidrev != 0) {
1154 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
/* Old-stateid retries stop at 20 tries, expired/bad-stateid ones at 4. */
1157 } while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1158 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1159 error == NFSERR_BADSESSION ||
1160 (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1161 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1162 expireret == 0 && clidrev != 0 && retrycnt < 4) ||
1163 (error == NFSERR_OPENMODE && mode == NFSV4OPEN_ACCESSREAD &&
1165 if (error && retrycnt >= 4)
/*
 * Build and send one Setattr RPC for vp and parse the reply.
 *   vp              - vnode whose attributes are being set
 *   vap             - attributes to set; va_type is overwritten below with
 *                     the vnode type before the attributes are marshalled
 *   stateidp        - stateid put into the request (NFSv4 only)
 *   cred, p, stuff  - handed through to nfscl_request()
 *   rnap, attrflagp - receive the attributes parsed from the reply
 * On the way out, error holds the first parse error or, when parsing went
 * fine, the reply status from nd->nd_repstat (presumably the return value;
 * the return statement is not part of the visible lines).
 */
1171 nfsrpc_setattrrpc(vnode_t vp, struct vattr *vap,
1172 nfsv4stateid_t *stateidp, struct ucred *cred, NFSPROC_T *p,
1173 struct nfsvattr *rnap, int *attrflagp, void *stuff)
1176 struct nfsrv_descript nfsd, *nd = &nfsd;
1178 nfsattrbit_t attrbits;
1181 NFSCL_REQSTART(nd, NFSPROC_SETATTR, vp);
/* Only NFSv4 requests carry a stateid. */
1182 if (nd->nd_flag & ND_NFSV4)
1183 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1184 vap->va_type = vnode_vtype(vp);
1185 nfscl_fillsattr(nd, vap, vp, NFSSATTR_FULL, 0);
/*
 * NFSv3 appends one more word after the attributes (its value is set on a
 * line not visible here); NFSv4 appends a Getattr op to the compound.
 */
1186 if (nd->nd_flag & ND_NFSV3) {
1187 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1189 } else if (nd->nd_flag & ND_NFSV4) {
1190 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1191 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1192 NFSGETATTR_ATTRBIT(&attrbits);
1193 (void) nfsrv_putattrbit(nd, &attrbits);
1195 error = nfscl_request(nd, vp, p, cred, stuff);
1198 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1199 error = nfscl_wcc_data(nd, vp, rnap, attrflagp, NULL, stuff);
/* NFSv4 with reply data still left: consume the attribute bitmap first. */
1200 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4 && !error)
1201 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
/* NFSv2 and NFSv4 successes carry the new attributes after that. */
1202 if (!(nd->nd_flag & ND_NFSV3) && !nd->nd_repstat && !error)
1203 error = nfscl_postop_attr(nd, rnap, attrflagp, stuff);
1204 mbuf_freem(nd->nd_mrep);
/* A local parse error takes precedence over the server status. */
1205 if (nd->nd_repstat && !error)
1206 error = nd->nd_repstat;
/*
 * Look up a name in directory dvp.
 *   dvp               - directory vnode; a non-VDIR vnode takes an early
 *                       exit (the value returned is not visible here)
 *   name, len         - component to look up; len above NFS_MAXNAMLEN
 *                       yields ENAMETOOLONG before any request is built
 *   dnap, dattrflagp  - receive the directory attributes
 *   nap, attrflagp    - receive the attributes of the object found
 *   nfhpp             - receives the file handle of the object found
 * NFSv4 special cases visible in the code:
 *   - a one-character name (the rest of that test is not visible) gets a
 *     freshly allocated copy of the file handle of dvp, with no RPC;
 *   - the two-character name of two dots is sent as NFSPROC_LOOKUPP, and a
 *     NFSERR_NOENT reply to it is answered with a copy of the file handle
 *     of dvp as well.
 * All other cases send NFSPROC_LOOKUP with the name; NFSv4 compounds also
 * get Getfh and Getattr ops appended.
 * The copied file handles come from MALLOC() with type M_NFSFH; how they
 * reach the caller is on lines not visible here (presumably via nfhpp).
 * error ends up as the first parse error or else nd->nd_repstat.
 */
1214 nfsrpc_lookup(vnode_t dvp, char *name, int len, struct ucred *cred,
1215 NFSPROC_T *p, struct nfsvattr *dnap, struct nfsvattr *nap,
1216 struct nfsfh **nfhpp, int *attrflagp, int *dattrflagp, void *stuff)
1219 struct nfsrv_descript nfsd, *nd = &nfsd;
1220 struct nfsmount *nmp;
1223 nfsattrbit_t attrbits;
1224 int error = 0, lookupp = 0;
1228 if (vnode_vtype(dvp) != VDIR)
1230 nmp = VFSTONFS(vnode_mount(dvp));
/* Over-long names are refused before any request is built. */
1231 if (len > NFS_MAXNAMLEN)
1232 return (ENAMETOOLONG);
1233 if (NFSHASNFSV4(nmp) && len == 1 &&
1236 * Just return the current dir's fh.
1239 MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1240 np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1241 nfhp->nfh_len = np->n_fhp->nfh_len;
1242 NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1246 if (NFSHASNFSV4(nmp) && len == 2 &&
1247 name[0] == '.' && name[1] == '.') {
1249 NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, dvp);
1251 NFSCL_REQSTART(nd, NFSPROC_LOOKUP, dvp);
1252 (void) nfsm_strtom(nd, name, len);
1254 if (nd->nd_flag & ND_NFSV4) {
1255 NFSGETATTR_ATTRBIT(&attrbits);
1256 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1257 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
1258 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1259 (void) nfsrv_putattrbit(nd, &attrbits);
1261 error = nfscl_request(nd, dvp, p, cred, stuff);
1264 if (nd->nd_repstat) {
1266 * When an NFSv4 Lookupp returns ENOENT, it means that
1267 * the lookup is at the root of an fs, so return this dir.
1269 if (nd->nd_repstat == NFSERR_NOENT && lookupp) {
1271 MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1272 np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1273 nfhp->nfh_len = np->n_fhp->nfh_len;
1274 NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1276 mbuf_freem(nd->nd_mrep);
1279 if (nd->nd_flag & ND_NFSV3)
1280 error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1281 else if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
1283 /* Load the directory attributes. */
1284 error = nfsm_loadattr(nd, dnap);
1290 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
1291 /* Load the directory attributes. */
1292 error = nfsm_loadattr(nd, dnap);
1296 /* Skip over the Lookup and GetFH operation status values. */
1297 NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
1299 error = nfsm_getfh(nd, nfhpp);
1303 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1304 if ((nd->nd_flag & ND_NFSV3) && !error)
1305 error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1307 mbuf_freem(nd->nd_mrep);
1308 if (!error && nd->nd_repstat)
1309 error = nd->nd_repstat;
1314 * Do a readlink rpc.
/*
 * Read the target of symbolic link vp into uiop.
 *   vp             - the symlink vnode
 *   uiop           - destination for the link text (via nfsm_mbufuio())
 *   cred, p, stuff - handed through to nfscl_request()
 *   nap, attrflagp - receive the attributes of vp parsed from the reply
 * For NFSv4 a Getattr op is appended to the compound. The link length is
 * taken with NFSM_STRSIZ() using NFS_MAXPATHLEN as the limit. A length of
 * exactly NFS_MAXPATHLEN is cross-checked against np->n_size; what is done
 * with the result is on lines not visible here.
 * error ends up as the first parse error or else nd->nd_repstat.
 */
1317 nfsrpc_readlink(vnode_t vp, struct uio *uiop, struct ucred *cred,
1318 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1321 struct nfsrv_descript nfsd, *nd = &nfsd;
1322 struct nfsnode *np = VTONFS(vp);
1323 nfsattrbit_t attrbits;
1324 int error, len, cangetattr = 1;
1327 NFSCL_REQSTART(nd, NFSPROC_READLINK, vp);
1328 if (nd->nd_flag & ND_NFSV4) {
1330 * And do a Getattr op.
1332 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1333 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1334 NFSGETATTR_ATTRBIT(&attrbits);
1335 (void) nfsrv_putattrbit(nd, &attrbits);
1337 error = nfscl_request(nd, vp, p, cred, stuff);
/* NFSv3 puts the post-op attributes ahead of the link data. */
1340 if (nd->nd_flag & ND_NFSV3)
1341 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1342 if (!nd->nd_repstat && !error) {
1343 NFSM_STRSIZ(len, NFS_MAXPATHLEN);
1345 * This seems weird to me, but must have been added to
1346 * FreeBSD for some reason. The only thing I can think of
1347 * is that there was/is some server that replies with
1348 * more link data than it should?
1350 if (len == NFS_MAXPATHLEN) {
1352 if (np->n_size > 0 && np->n_size < NFS_MAXPATHLEN) {
1358 error = nfsm_mbufuio(nd, uiop, len);
/*
 * The NFSv4 Getattr result follows the link data; it is parsed only
 * while cangetattr is still non-zero.
 */
1359 if ((nd->nd_flag & ND_NFSV4) && !error && cangetattr)
1360 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
/* A local parse error takes precedence over the server status. */
1362 if (nd->nd_repstat && !error)
1363 error = nd->nd_repstat;
1365 mbuf_freem(nd->nd_mrep);
/*
 * Read from vp into uiop, with the NFSv4 stateid and retry handling
 * wrapped around nfsrpc_readrpc().
 *   vp, uiop       - file and destination of the read
 *   cred           - caller credentials; NFSv4 mounts work on a copy made
 *                    with NFSNEWCRED() and released with NFSFREECRED()
 *   p, stuff       - handed through to the lower layers
 *   nap, attrflagp - receive the attributes returned with the read
 * Each pass fetches a read stateid (NFSv4 only), issues the read, and
 * then reacts to the error:
 *   - NFSERR_OPENMODE sets NFSSTA_OPENMODE in nmp->nm_state;
 *   - NFSERR_STALESTATEID starts client recovery;
 *   - the wait-and-retry errors call nfs_catnap() (presumably a short
 *     sleep) before looping;
 *   - NFSERR_EXPIRED / NFSERR_BADSTATEID consult nfscl_hasexpired().
 * What follows the final retrycnt >= 4 test is not visible here.
 */
1373 nfsrpc_read(vnode_t vp, struct uio *uiop, struct ucred *cred,
1374 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1376 int error, expireret = 0, retrycnt;
1377 u_int32_t clidrev = 0;
1378 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1379 struct nfsnode *np = VTONFS(vp);
1380 struct ucred *newcred;
1381 struct nfsfh *nfhp = NULL;
1382 nfsv4stateid_t stateid;
/* Snapshot the clientid revision for the nfscl_hasexpired() call below. */
1385 if (nmp->nm_clp != NULL)
1386 clidrev = nmp->nm_clp->nfsc_clientidrev;
1388 if (NFSHASNFSV4(nmp)) {
1390 newcred = NFSNEWCRED(cred);
1395 if (NFSHASNFSV4(nmp))
1396 (void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1397 NFSV4OPEN_ACCESSREAD, 0, newcred, p, &stateid,
1399 error = nfsrpc_readrpc(vp, uiop, newcred, &stateid, p, nap,
1401 if (error == NFSERR_OPENMODE) {
1403 nmp->nm_state |= NFSSTA_OPENMODE;
1406 if (error == NFSERR_STALESTATEID)
1407 nfscl_initiate_recovery(nmp->nm_clp);
1409 nfscl_lockderef(lckp);
1410 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1411 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1412 error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1413 (void) nfs_catnap(PZERO, error, "nfs_read");
1414 } else if ((error == NFSERR_EXPIRED ||
1415 error == NFSERR_BADSTATEID) && clidrev != 0) {
1416 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
/*
 * Retry rules: GRACE, STALESTATEID, STALEDONTRECOVER, DELAY and BADSESSION
 * loop without a retrycnt limit in this condition; OLDSTATEID is limited
 * to retrycnt < 20; EXPIRED/BADSTATEID (only when nfscl_hasexpired()
 * returned 0 and clidrev is set) and OPENMODE are limited to retrycnt < 4.
 */
1419 } while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1420 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1421 error == NFSERR_BADSESSION ||
1422 (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1423 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1424 expireret == 0 && clidrev != 0 && retrycnt < 4) ||
1425 (error == NFSERR_OPENMODE && retrycnt < 4));
1426 if (error && retrycnt >= 4)
1428 if (NFSHASNFSV4(nmp))
1429 NFSFREECRED(newcred);
1434 * The actual read RPC.
/*
 * Issue the Read RPC(s) needed to fill uiop from vp.
 *   vp, uiop       - file and destination; uio_offset and the residual
 *                    count define the range to read
 *   cred, p, stuff - handed through to nfscl_request()
 *   stateidp       - stateid put into NFSv4 requests
 *   nap, attrflagp - receive the attributes returned with the data
 * Each request asks for at most nmp->nm_rsize bytes. A range whose end
 * exceeds nm_maxfilesize, or whose end offset wraps, takes an error branch
 * (the value returned is not visible here).
 * For NFSv3/NFSv4 an eof indication or a zero-length reply triggers the
 * branch at the bottom; for NFSv2 a short reply does (the action taken,
 * presumably ending the transfer, is on lines not visible here).
 */
1437 nfsrpc_readrpc(vnode_t vp, struct uio *uiop, struct ucred *cred,
1438 nfsv4stateid_t *stateidp, NFSPROC_T *p, struct nfsvattr *nap,
1439 int *attrflagp, void *stuff)
1442 int error = 0, len, retlen, tsiz, eof = 0;
1443 struct nfsrv_descript nfsd;
1444 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1445 struct nfsrv_descript *nd = &nfsd;
1450 tsiz = uio_uio_resid(uiop);
1451 tmp_off = uiop->uio_offset + tsiz;
/* The second test catches wraparound of offset + size. */
1453 if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1457 rsize = nmp->nm_rsize;
/* Never ask for more than rsize bytes in one request. */
1462 len = (tsiz > rsize) ? rsize : tsiz;
1463 NFSCL_REQSTART(nd, NFSPROC_READ, vp);
1464 if (nd->nd_flag & ND_NFSV4)
1465 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1466 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED * 3);
/* NFSv2 sends a 32-bit offset; the other versions send a hyper offset. */
1467 if (nd->nd_flag & ND_NFSV2) {
1468 *tl++ = txdr_unsigned(uiop->uio_offset);
1469 *tl++ = txdr_unsigned(len);
1472 txdr_hyper(uiop->uio_offset, tl);
1473 *(tl + 2) = txdr_unsigned(len);
1476 * Since I can't do a Getattr for NFSv4 for Write, there
1477 * doesn't seem any point in doing one here, either.
1478 * (See the comment in nfsrpc_writerpc() for more info.)
1480 error = nfscl_request(nd, vp, p, cred, stuff);
/* NFSv3 always carries post-op attributes; NFSv2 only on success. */
1483 if (nd->nd_flag & ND_NFSV3) {
1484 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1485 } else if (!nd->nd_repstat && (nd->nd_flag & ND_NFSV2)) {
1486 error = nfsm_loadattr(nd, nap);
1490 if (nd->nd_repstat || error) {
1492 error = nd->nd_repstat;
/*
 * NFSv3: two words are dissected and eof is the second one.
 * NFSv4: a single word is dissected and it is eof.
 */
1495 if (nd->nd_flag & ND_NFSV3) {
1496 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1497 eof = fxdr_unsigned(int, *(tl + 1));
1498 } else if (nd->nd_flag & ND_NFSV4) {
1499 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
1500 eof = fxdr_unsigned(int, *tl);
/* The reply data length may not exceed what was asked for. */
1502 NFSM_STRSIZ(retlen, len);
1503 error = nfsm_mbufuio(nd, uiop, retlen);
1506 mbuf_freem(nd->nd_mrep);
1509 if (!(nd->nd_flag & ND_NFSV2)) {
1510 if (eof || retlen == 0)
1512 } else if (retlen < len)
/* Release a reply that is still attached on the way out. */
1517 if (nd->nd_mrep != NULL)
1518 mbuf_freem(nd->nd_mrep);
1523 * nfs write operation
1524 * When called_from_strategy != 0, it should return EIO for an error that
1525 * indicates recovery is in progress, so that the buffer will be left
1526 * dirty and be written back to the server later. If it loops around,
1527 * the recovery thread could get stuck waiting for the buffer and recovery
1528 * will then deadlock.
/*
 * Write uiop to vp, with the NFSv4 stateid and retry handling wrapped
 * around nfsrpc_writerpc().
 *   vp, uiop              - file and source of the write
 *   iomode, must_commit   - handed through to nfsrpc_writerpc()
 *   cred                  - caller credentials; NFSv4 mounts work on a copy
 *                           made with NFSNEWCRED() and released with
 *                           NFSFREECRED()
 *   p, stuff              - handed through to the lower layers
 *   nap, attrflagp        - receive the attributes returned with the write
 *   called_from_strategy  - when non-zero, NFSERR_STALESTATEID,
 *                           NFSERR_BADSESSION and NFSERR_STALEDONTRECOVER
 *                           are not retried by the loop and instead take
 *                           the final error branch
 * Each pass fetches a write stateid (NFSv4 only). A stateid whose three
 * other[] words are all zero is logged through NFSCL_DEBUG(); the handling
 * that follows is on lines not visible here.
 * Retry rules in the loop condition: GRACE and DELAY loop without a
 * retrycnt limit; OLDSTATEID is limited to retrycnt below 20;
 * EXPIRED/BADSTATEID are limited to retrycnt below 4 and also need
 * nfscl_hasexpired() to have returned 0 with clidrev set.
 */
1531 nfsrpc_write(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
1532 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
1533 void *stuff, int called_from_strategy)
1535 int error, expireret = 0, retrycnt, nostateid;
1536 u_int32_t clidrev = 0;
1537 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1538 struct nfsnode *np = VTONFS(vp);
1539 struct ucred *newcred;
1540 struct nfsfh *nfhp = NULL;
1541 nfsv4stateid_t stateid;
/* Snapshot the clientid revision for the nfscl_hasexpired() call below. */
1545 if (nmp->nm_clp != NULL)
1546 clidrev = nmp->nm_clp->nfsc_clientidrev;
1548 if (NFSHASNFSV4(nmp)) {
1549 newcred = NFSNEWCRED(cred);
1556 if (NFSHASNFSV4(nmp)) {
1557 (void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1558 NFSV4OPEN_ACCESSWRITE, 0, newcred, p, &stateid,
/* All-zero other[] words are treated as having no stateid. */
1560 if (stateid.other[0] == 0 && stateid.other[1] == 0 &&
1561 stateid.other[2] == 0) {
1563 NFSCL_DEBUG(1, "stateid0 in write\n");
1568 * If there is no stateid for NFSv4, it means this is an
1569 * extraneous write after close. Basically a poorly
1570 * implemented buffer cache. Just don't do the write.
1575 error = nfsrpc_writerpc(vp, uiop, iomode, must_commit,
1576 newcred, &stateid, p, nap, attrflagp, stuff);
1577 if (error == NFSERR_STALESTATEID)
1578 nfscl_initiate_recovery(nmp->nm_clp);
1580 nfscl_lockderef(lckp);
1581 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1582 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1583 error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1584 (void) nfs_catnap(PZERO, error, "nfs_write");
1585 } else if ((error == NFSERR_EXPIRED ||
1586 error == NFSERR_BADSTATEID) && clidrev != 0) {
1587 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1590 } while (error == NFSERR_GRACE || error == NFSERR_DELAY ||
1591 ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1592 error == NFSERR_STALEDONTRECOVER) && called_from_strategy == 0) ||
1593 (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1594 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1595 expireret == 0 && clidrev != 0 && retrycnt < 4));
1596 if (error != 0 && (retrycnt >= 4 ||
1597 ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1598 error == NFSERR_STALEDONTRECOVER) && called_from_strategy != 0)))
1600 if (NFSHASNFSV4(nmp))
1601 NFSFREECRED(newcred);
1606 * The actual write RPC.
/*
 * Issue the Write RPC(s) needed to push uiop to vp.
 *   vp, uiop        - file and source; exactly one iovec is expected
 *                     (asserted below)
 *   iomode          - in: stability level put into each request;
 *                     out: set to the value of committed at the end
 *   must_commit     - presumably raised when the server write verifier
 *                     changes (the assignment is not visible here)
 *   cred, p, stuff  - handed through to nfscl_request()
 *   stateidp        - stateid put into NFSv4 requests
 *   nap, attrflagp  - receive the attributes returned with the write
 * Each request carries at most nmp->nm_wsize bytes. A range whose end
 * exceeds nm_maxfilesize, or whose end offset wraps, takes an error branch
 * (the value returned is not visible here).
 * When the server reports an error (nd_repstat), the uio fields advanced by
 * nfsm_uiombuf() are rolled back by len; when fewer bytes were written
 * than sent (rlen < len), they are rolled back by the difference.
 * The first write verifier seen is stored in nmp->nm_verf; later replies
 * are compared against it and the stored copy is refreshed on mismatch.
 * error ends up as the first parse error or else nd->nd_repstat.
 */
1609 nfsrpc_writerpc(vnode_t vp, struct uio *uiop, int *iomode,
1610 int *must_commit, struct ucred *cred, nfsv4stateid_t *stateidp,
1611 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1614 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1615 struct nfsnode *np = VTONFS(vp);
1616 int error = 0, len, tsiz, rlen, commit, committed = NFSWRITE_FILESYNC;
1617 int wccflag = 0, wsize;
1619 struct nfsrv_descript nfsd;
1620 struct nfsrv_descript *nd = &nfsd;
1621 nfsattrbit_t attrbits;
1624 KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
1626 tsiz = uio_uio_resid(uiop);
1627 tmp_off = uiop->uio_offset + tsiz;
/* The second test catches wraparound of offset + size. */
1629 if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1633 wsize = nmp->nm_wsize;
1635 nd->nd_mrep = NULL; /* NFSv2 sometimes does a write with */
1636 nd->nd_repstat = 0; /* uio_resid == 0, so the while is not done */
/* Never send more than wsize bytes in one request. */
1639 len = (tsiz > wsize) ? wsize : tsiz;
1640 NFSCL_REQSTART(nd, NFSPROC_WRITE, vp);
/*
 * Argument layout differs per version:
 *   NFSv4: stateid, hyper offset, iomode, length
 *   NFSv3: hyper offset, length, iomode, length
 *   NFSv2: four 32-bit words (see below)
 */
1641 if (nd->nd_flag & ND_NFSV4) {
1642 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1643 NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+2*NFSX_UNSIGNED);
1644 txdr_hyper(uiop->uio_offset, tl);
1646 *tl++ = txdr_unsigned(*iomode);
1647 *tl = txdr_unsigned(len);
1648 } else if (nd->nd_flag & ND_NFSV3) {
1649 NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+3*NFSX_UNSIGNED);
1650 txdr_hyper(uiop->uio_offset, tl);
1652 *tl++ = txdr_unsigned(len);
1653 *tl++ = txdr_unsigned(*iomode);
1654 *tl = txdr_unsigned(len);
1658 NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
1660 * Not sure why someone changed this, since the
1661 * RFC clearly states that "beginoffset" and
1662 * "totalcount" are ignored, but it wouldn't
1663 * surprise me if there's a busted server out there.
1665 /* Set both "begin" and "current" to non-garbage. */
1666 x = txdr_unsigned((u_int32_t)uiop->uio_offset);
1667 *tl++ = x; /* "begin offset" */
1668 *tl++ = x; /* "current offset" */
1669 x = txdr_unsigned(len);
1670 *tl++ = x; /* total to this offset */
1671 *tl = x; /* size of this write */
1674 nfsm_uiombuf(nd, uiop, len);
1676 * Although it is tempting to do a normal Getattr Op in the
1677 * NFSv4 compound, the result can be a nearly hung client
1678 * system if the Getattr asks for Owner and/or OwnerGroup.
1679 * It occurs when the client can't map either the Owner or
1680 * Owner_group name in the Getattr reply to a uid/gid. When
1681 * there is a cache miss, the kernel does an upcall to the
1682 * nfsuserd. Then, it can try and read the local /etc/passwd
1683 * or /etc/group file. It can then block in getnewbuf(),
1684 * waiting for dirty writes to be pushed to the NFS server.
1685 * The only reason this doesn't result in a complete
1686 * deadlock, is that the upcall times out and allows
1687 * the write to complete. However, progress is so slow
1688 * that it might just as well be deadlocked.
1689 * As such, we get the rest of the attributes, but not
1690 * Owner or Owner_group.
1691 * nb: nfscl_loadattrcache() needs to be told that these
1692 * partial attributes from a write rpc are being
1693 * passed in, via a argument flag.
1695 if (nd->nd_flag & ND_NFSV4) {
1696 NFSWRITEGETATTR_ATTRBIT(&attrbits);
1697 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1698 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1699 (void) nfsrv_putattrbit(nd, &attrbits);
1701 error = nfscl_request(nd, vp, p, cred, stuff);
1704 if (nd->nd_repstat) {
1706 * In case the rpc gets retried, roll
1707 * the uio fileds changed by nfsm_uiombuf()
1710 uiop->uio_offset -= len;
1711 uio_uio_resid_add(uiop, len);
1712 uio_iov_base_add(uiop, -len);
1713 uio_iov_len_add(uiop, len);
1715 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1716 error = nfscl_wcc_data(nd, vp, nap, attrflagp,
1721 if (!nd->nd_repstat) {
1722 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1723 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED
1725 rlen = fxdr_unsigned(int, *tl++);
1729 } else if (rlen < len) {
1730 backup = len - rlen;
1731 uio_iov_base_add(uiop, -(backup));
1732 uio_iov_len_add(uiop, backup);
1733 uiop->uio_offset -= backup;
1734 uio_uio_resid_add(uiop, backup);
1737 commit = fxdr_unsigned(int, *tl++);
1740 * Return the lowest commitment level
1741 * obtained by any of the RPCs.
1743 if (committed == NFSWRITE_FILESYNC)
1745 else if (committed == NFSWRITE_DATASYNC &&
1746 commit == NFSWRITE_UNSTABLE)
1749 if (!NFSHASWRITEVERF(nmp)) {
1750 NFSBCOPY((caddr_t)tl,
1751 (caddr_t)&nmp->nm_verf[0],
1753 NFSSETWRITEVERF(nmp);
1754 } else if (NFSBCMP(tl, nmp->nm_verf,
1757 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
1761 if (nd->nd_flag & ND_NFSV4)
1762 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1763 if (nd->nd_flag & (ND_NFSV2 | ND_NFSV4)) {
1764 error = nfsm_loadattr(nd, nap);
1766 *attrflagp = NFS_LATTR_NOSHRINK;
1769 error = nd->nd_repstat;
1773 NFSWRITERPC_SETTIME(wccflag, np, nap, (nd->nd_flag & ND_NFSV4));
1774 mbuf_freem(nd->nd_mrep);
1779 if (nd->nd_mrep != NULL)
1780 mbuf_freem(nd->nd_mrep);
1781 *iomode = committed;
1782 if (nd->nd_repstat && !error)
1783 error = nd->nd_repstat;
1789 * For NFS v2 this is a kludge. Use a create rpc but with the IFMT bits of the
1790 * mode set to specify the file type and the size field for rdev.
/*
 * Create a special file called name in directory dvp.
 *   dvp, name, namelen - parent directory and new name; namelen above
 *                        NFS_MAXNAMLEN yields ENAMETOOLONG
 *   vap                - attributes for the new node
 *   rdev, vtyp         - device number and node type
 *   cred, p, dstuff    - handed through to nfscl_request()
 *   dnap, dattrflagp   - receive the directory attributes
 *   nnap, attrflagp    - receive the attributes of the new node
 *   nfhpp              - receives the file handle of the new node
 * Request layout per version, as built below:
 *   NFSv4: type (plus major/minor for VBLK/VCHR), name, attributes,
 *          then Getfh and Getattr ops
 *   NFSv3: name, type, attributes, then major/minor for VCHR/VBLK
 *   NFSv2: name, then attributes with rdev passed via NFSSATTR_SIZERDEV
 * error ends up as the first parse error or else nd->nd_repstat.
 */
1793 nfsrpc_mknod(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1794 u_int32_t rdev, enum vtype vtyp, struct ucred *cred, NFSPROC_T *p,
1795 struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1796 int *attrflagp, int *dattrflagp, void *dstuff)
1800 struct nfsrv_descript nfsd, *nd = &nfsd;
1801 nfsattrbit_t attrbits;
1806 if (namelen > NFS_MAXNAMLEN)
1807 return (ENAMETOOLONG);
1808 NFSCL_REQSTART(nd, NFSPROC_MKNOD, dvp);
/* NFSv4 puts the type (and device numbers, if any) ahead of the name. */
1809 if (nd->nd_flag & ND_NFSV4) {
1810 if (vtyp == VBLK || vtyp == VCHR) {
1811 NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
1812 *tl++ = vtonfsv34_type(vtyp);
1813 *tl++ = txdr_unsigned(NFSMAJOR(rdev));
1814 *tl = txdr_unsigned(NFSMINOR(rdev));
1816 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1817 *tl = vtonfsv34_type(vtyp);
1820 (void) nfsm_strtom(nd, name, namelen);
/* NFSv3 puts the type after the name. */
1821 if (nd->nd_flag & ND_NFSV3) {
1822 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1823 *tl = vtonfsv34_type(vtyp);
1825 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1826 nfscl_fillsattr(nd, vap, dvp, 0, 0);
/* NFSv3 device numbers follow the attributes. */
1827 if ((nd->nd_flag & ND_NFSV3) &&
1828 (vtyp == VCHR || vtyp == VBLK)) {
1829 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1830 *tl++ = txdr_unsigned(NFSMAJOR(rdev));
1831 *tl = txdr_unsigned(NFSMINOR(rdev));
/* NFSv4: ask for the new file handle and attributes in the same compound. */
1833 if (nd->nd_flag & ND_NFSV4) {
1834 NFSGETATTR_ATTRBIT(&attrbits);
1835 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1836 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
1837 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1838 (void) nfsrv_putattrbit(nd, &attrbits);
/* NFSv2 has no mknod arguments of its own; rdev rides in the attributes. */
1840 if (nd->nd_flag & ND_NFSV2)
1841 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZERDEV, rdev);
1842 error = nfscl_request(nd, dvp, p, cred, dstuff);
/* NFSv4 directory change data is parsed first, NFSv3 data last. */
1845 if (nd->nd_flag & ND_NFSV4)
1846 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1847 if (!nd->nd_repstat) {
1848 if (nd->nd_flag & ND_NFSV4) {
1849 NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
1850 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
1854 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1858 if (nd->nd_flag & ND_NFSV3)
1859 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
/* A local parse error takes precedence over the server status. */
1860 if (!error && nd->nd_repstat)
1861 error = nd->nd_repstat;
1863 mbuf_freem(nd->nd_mrep);
1868 * nfs file create call
1869 * Mostly just call the appropriate routine. (I separated out v4, so that
1870 * error recovery wouldn't be as difficult.)
/*
 * Create a regular file called name in directory dvp.
 *   dvp, name, namelen - parent directory and new name
 *   vap                - attributes for the new file
 *   cverf              - create verifier, handed to the version routines
 *   fmode              - open flags, handed to the version routines
 *   cred, p, dstuff    - handed through to the lower layers
 *   dnap, dattrflagp   - receive the directory attributes
 *   nnap, attrflagp    - receive the attributes of the new file
 *   nfhpp              - receives the file handle of the new file
 * NFSv4 mounts: an open owner is obtained with nfscl_open(), then
 * nfsrpc_createv4() is called; the owner is released with
 * nfscl_ownerrelease() on every pass. A returned delegation is handed to
 * nfscl_deleg() (the condition guarding that call is not visible here).
 * The pass is repeated for GRACE, STALECLIENTID, STALEDONTRECOVER, DELAY
 * and BADSESSION, and for EXPIRED/BADSTATEID while retrycnt is below 4,
 * nfscl_hasexpired() returned 0 and clidrev is set.
 * All other mounts call nfsrpc_createv23() once.
 */
1873 nfsrpc_create(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1874 nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1875 struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1876 int *attrflagp, int *dattrflagp, void *dstuff)
1878 int error = 0, newone, expireret = 0, retrycnt, unlocked;
1879 struct nfsclowner *owp;
1880 struct nfscldeleg *dp;
1881 struct nfsmount *nmp = VFSTONFS(vnode_mount(dvp));
1884 if (NFSHASNFSV4(nmp)) {
/* No file handle exists yet, so only the open owner is requested. */
1888 error = nfscl_open(dvp, NULL, 0, (NFSV4OPEN_ACCESSWRITE |
1889 NFSV4OPEN_ACCESSREAD), 0, cred, p, &owp, NULL, &newone,
/* Snapshot the clientid revision for the nfscl_hasexpired() call below. */
1893 if (nmp->nm_clp != NULL)
1894 clidrev = nmp->nm_clp->nfsc_clientidrev;
1897 error = nfsrpc_createv4(dvp, name, namelen, vap, cverf, fmode,
1898 owp, &dp, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1901 * There is no need to invalidate cached attributes here,
1902 * since new post-delegation issue attributes are always
1903 * returned by nfsrpc_createv4() and these will update the
1907 (void) nfscl_deleg(nmp->nm_mountp, owp->nfsow_clp,
1908 (*nfhpp)->nfh_fh, (*nfhpp)->nfh_len, cred, p, &dp);
1909 nfscl_ownerrelease(nmp, owp, error, newone, unlocked);
1910 if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1911 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1912 error == NFSERR_BADSESSION) {
1913 (void) nfs_catnap(PZERO, error, "nfs_open");
1914 } else if ((error == NFSERR_EXPIRED ||
1915 error == NFSERR_BADSTATEID) && clidrev != 0) {
1916 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1919 } while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1920 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1921 error == NFSERR_BADSESSION ||
1922 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1923 expireret == 0 && clidrev != 0 && retrycnt < 4));
1924 if (error && retrycnt >= 4)
/* NFSv2 and NFSv3 need no open state: a single RPC does the job. */
1927 error = nfsrpc_createv23(dvp, name, namelen, vap, cverf,
1928 fmode, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1935 * The create rpc for v2 and 3.
/*
 * Create RPC for NFSv2 and NFSv3.
 *   dvp, name, namelen - parent directory and new name; namelen above
 *                        NFS_MAXNAMLEN yields ENAMETOOLONG
 *   vap                - attributes for the new file
 *   cverf              - verifier sent with an exclusive NFSv3 create
 *   fmode              - O_EXCL selects the exclusive NFSv3 create
 *   cred, p, dstuff    - handed through to nfscl_request()
 *   dnap, dattrflagp   - receive the directory attributes (NFSv3 only)
 *   nnap, attrflagp    - receive the attributes of the new file
 *   nfhpp              - receives the file handle of the new file
 * error ends up as the first parse error or else nd->nd_repstat.
 */
1938 nfsrpc_createv23(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1939 nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1940 struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1941 int *attrflagp, int *dattrflagp, void *dstuff)
1945 struct nfsrv_descript nfsd, *nd = &nfsd;
1950 if (namelen > NFS_MAXNAMLEN)
1951 return (ENAMETOOLONG);
1952 NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
1953 (void) nfsm_strtom(nd, name, namelen);
/*
 * NFSv3 sends a create mode word: EXCLUSIVE is followed by the verifier,
 * UNCHECKED by the attributes.
 */
1954 if (nd->nd_flag & ND_NFSV3) {
1955 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1956 if (fmode & O_EXCL) {
1957 *tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
1958 NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1959 *tl++ = cverf.lval[0];
1960 *tl = cverf.lval[1];
1962 *tl = txdr_unsigned(NFSCREATE_UNCHECKED);
1963 nfscl_fillsattr(nd, vap, dvp, 0, 0);
/* Presumably the NFSv2 branch: attributes marshalled with NFSSATTR_SIZE0. */
1966 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZE0, 0);
1968 error = nfscl_request(nd, dvp, p, cred, dstuff);
/* The new file handle and attributes are only present on success. */
1971 if (nd->nd_repstat == 0) {
1972 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1976 if (nd->nd_flag & ND_NFSV3)
1977 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
/* A local parse error takes precedence over the server status. */
1978 if (nd->nd_repstat != 0 && error == 0)
1979 error = nd->nd_repstat;
1981 mbuf_freem(nd->nd_mrep);
/*
 * Create RPC for NFSv4, done as an Open op with NFSV4OPEN_CREATE and
 * claim type NFSV4OPEN_CLAIMNULL.
 *   dvp, name, namelen - parent directory and new name; namelen above
 *                        NFS_MAXNAMLEN yields ENAMETOOLONG
 *   vap                - attributes for the new file
 *   cverf              - verifier sent with the exclusive create modes
 *   fmode              - O_EXCL selects a guarded/exclusive create
 *   owp                - open owner; its seqid and owner name go into the
 *                        request
 *   dpp                - presumably receives any delegation granted (the
 *                        assignment is not visible here)
 *   cred, p, dstuff    - handed through to the lower layers
 *   dnap, dattrflagp   - receive the directory attributes
 *   nnap, attrflagp    - receive the attributes of the new file
 *   nfhpp              - receives the file handle of the new file
 *   unlockedp          - not referenced on the visible lines
 * The compound also carries Getfh and Getattr for the new file, then Putfh
 * of the directory and a second Getattr for its post-op attributes.
 * After a successful reply the Open is completed locally via nfscl_open(),
 * confirmed with nfsrpc_openconfirm() when the server asks for it, and
 * released with nfscl_openrelease().
 * error ends up as the first local error or else nd->nd_repstat.
 */
1986 nfsrpc_createv4(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1987 nfsquad_t cverf, int fmode, struct nfsclowner *owp, struct nfscldeleg **dpp,
1988 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
1989 struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
1990 int *dattrflagp, void *dstuff, int *unlockedp)
1993 int error = 0, deleg, newone, ret, acesize, limitby;
1994 struct nfsrv_descript nfsd, *nd = &nfsd;
1995 struct nfsclopen *op;
1996 struct nfscldeleg *dp = NULL;
1999 nfsattrbit_t attrbits;
2000 nfsv4stateid_t stateid;
2002 struct nfsmount *nmp;
2003 struct nfsclsession *tsep;
2005 nmp = VFSTONFS(dvp->v_mount);
2012 if (namelen > NFS_MAXNAMLEN)
2013 return (ENAMETOOLONG);
2014 NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
2016 * For V4, this is actually an Open op.
/* Open arguments: owner seqid, share access, share deny, clientid. */
2018 NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
2019 *tl++ = txdr_unsigned(owp->nfsow_seqid);
2020 *tl++ = txdr_unsigned(NFSV4OPEN_ACCESSWRITE |
2021 NFSV4OPEN_ACCESSREAD);
2022 *tl++ = txdr_unsigned(NFSV4OPEN_DENYNONE);
2023 tsep = nfsmnt_mdssession(nmp);
2024 *tl++ = tsep->nfsess_clientid.lval[0];
2025 *tl = tsep->nfsess_clientid.lval[1];
2026 (void) nfsm_strtom(nd, owp->nfsow_owner, NFSV4CL_LOCKNAMELEN);
2027 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2028 *tl++ = txdr_unsigned(NFSV4OPEN_CREATE);
/*
 * Create mode selection:
 *   O_EXCL on a NFSHASNFSV4N mount (presumably NFSv4.1 or later):
 *     GUARDED plus attributes for persistent sessions, otherwise
 *     EXCLUSIVE41 plus verifier plus attributes;
 *   O_EXCL otherwise: EXCLUSIVE plus verifier;
 *   no O_EXCL: UNCHECKED plus attributes.
 */
2029 if (fmode & O_EXCL) {
2030 if (NFSHASNFSV4N(nmp)) {
2031 if (NFSHASSESSPERSIST(nmp)) {
2032 /* Use GUARDED for persistent sessions. */
2033 *tl = txdr_unsigned(NFSCREATE_GUARDED);
2034 nfscl_fillsattr(nd, vap, dvp, 0, 0);
2036 /* Otherwise, use EXCLUSIVE4_1. */
2037 *tl = txdr_unsigned(NFSCREATE_EXCLUSIVE41);
2038 NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
2039 *tl++ = cverf.lval[0];
2040 *tl = cverf.lval[1];
2041 nfscl_fillsattr(nd, vap, dvp, 0, 0);
2045 *tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
2046 NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
2047 *tl++ = cverf.lval[0];
2048 *tl = cverf.lval[1];
2051 *tl = txdr_unsigned(NFSCREATE_UNCHECKED);
2052 nfscl_fillsattr(nd, vap, dvp, 0, 0);
2054 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2055 *tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
2056 (void) nfsm_strtom(nd, name, namelen);
2057 /* Get the new file's handle and attributes. */
2058 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2059 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
2060 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2061 NFSGETATTR_ATTRBIT(&attrbits);
2062 (void) nfsrv_putattrbit(nd, &attrbits);
2063 /* Get the directory's post-op attributes. */
2064 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2065 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2066 (void) nfsm_fhtom(nd, np->n_fhp->nfh_fh, np->n_fhp->nfh_len, 0);
2067 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2068 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2069 (void) nfsrv_putattrbit(nd, &attrbits);
2070 error = nfscl_request(nd, dvp, p, cred, dstuff);
/* Update the open owner seqid from the reply (macro body not shown here). */
2073 NFSCL_INCRSEQID(owp->nfsow_seqid, nd);
2074 if (nd->nd_repstat == 0) {
2075 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
/* Open stateid, kept in wire form, then the result flags. */
2077 stateid.seqid = *tl++;
2078 stateid.other[0] = *tl++;
2079 stateid.other[1] = *tl++;
2080 stateid.other[2] = *tl;
2081 rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
2082 (void) nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2083 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2084 deleg = fxdr_unsigned(int, *tl);
/* A delegation was granted: build a nfscldeleg record for it. */
2085 if (deleg == NFSV4OPEN_DELEGATEREAD ||
2086 deleg == NFSV4OPEN_DELEGATEWRITE) {
2087 if (!(owp->nfsow_clp->nfsc_flags &
2088 NFSCLFLAGS_FIRSTDELEG))
2089 owp->nfsow_clp->nfsc_flags |=
2090 (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
2091 MALLOC(dp, struct nfscldeleg *,
2092 sizeof (struct nfscldeleg) + NFSX_V4FHMAX,
2093 M_NFSCLDELEG, M_WAITOK);
2094 LIST_INIT(&dp->nfsdl_owner);
2095 LIST_INIT(&dp->nfsdl_lock);
2096 dp->nfsdl_clp = owp->nfsow_clp;
2097 newnfs_copyincred(cred, &dp->nfsdl_cred);
2098 nfscl_lockinit(&dp->nfsdl_rwlock);
2099 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
2101 dp->nfsdl_stateid.seqid = *tl++;
2102 dp->nfsdl_stateid.other[0] = *tl++;
2103 dp->nfsdl_stateid.other[1] = *tl++;
2104 dp->nfsdl_stateid.other[2] = *tl++;
2105 ret = fxdr_unsigned(int, *tl);
2106 if (deleg == NFSV4OPEN_DELEGATEWRITE) {
2107 dp->nfsdl_flags = NFSCLDL_WRITE;
2109 * Indicates how much the file can grow.
2111 NFSM_DISSECT(tl, u_int32_t *,
2113 limitby = fxdr_unsigned(int, *tl++);
/* LIMITSIZE is a byte count; LIMITBLOCKS is the product of two words. */
2115 case NFSV4OPEN_LIMITSIZE:
2116 dp->nfsdl_sizelimit = fxdr_hyper(tl);
2118 case NFSV4OPEN_LIMITBLOCKS:
2119 dp->nfsdl_sizelimit =
2120 fxdr_unsigned(u_int64_t, *tl++);
2121 dp->nfsdl_sizelimit *=
2122 fxdr_unsigned(u_int64_t, *tl);
2125 error = NFSERR_BADXDR;
2129 dp->nfsdl_flags = NFSCLDL_READ;
2132 dp->nfsdl_flags |= NFSCLDL_RECALL;
2133 error = nfsrv_dissectace(nd, &dp->nfsdl_ace, &ret,
/* Any delegation type other than read, write or none is a bad reply. */
2137 } else if (deleg != NFSV4OPEN_DELEGATENONE) {
2138 error = NFSERR_BADXDR;
2141 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2144 /* Get rid of the PutFH and Getattr status values. */
2145 NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
2146 /* Load the directory attributes. */
2147 error = nfsm_loadattr(nd, dnap);
/* Seed the delegation with the change attribute and mtime of the new file. */
2151 if (dp != NULL && *attrflagp) {
2152 dp->nfsdl_change = nnap->na_filerev;
2153 dp->nfsdl_modtime = nnap->na_mtime;
2154 dp->nfsdl_flags |= NFSCLDL_MODTIMESET;
2157 * We can now complete the Open state.
2161 dp->nfsdl_fhlen = nfhp->nfh_len;
2162 NFSBCOPY(nfhp->nfh_fh, dp->nfsdl_fh, nfhp->nfh_len);
2165 * Get an Open structure that will be
2166 * attached to the OpenOwner, acquired already.
2168 error = nfscl_open(dvp, nfhp->nfh_fh, nfhp->nfh_len,
2169 (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), 0,
2170 cred, p, NULL, &op, &newone, NULL, 0);
2173 op->nfso_stateid = stateid;
2174 newnfs_copyincred(cred, &op->nfso_cred);
/* The server wants the Open confirmed; repeat while it says NFSERR_DELAY. */
2175 if ((rflags & NFSV4OPEN_RESULTCONFIRM)) {
2177 ret = nfsrpc_openconfirm(dvp, nfhp->nfh_fh,
2178 nfhp->nfh_len, op, cred, p);
2179 if (ret == NFSERR_DELAY)
2180 (void) nfs_catnap(PZERO, ret, "nfs_create");
2181 } while (ret == NFSERR_DELAY);
2186 * If the server is handing out delegations, but we didn't
2187 * get one because an OpenConfirm was required, try the
2188 * Open again, to get a delegation. This is a harmless no-op,
2189 * from a server's point of view.
2191 if ((rflags & NFSV4OPEN_RESULTCONFIRM) &&
2192 (owp->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG) &&
2193 !error && dp == NULL) {
2195 ret = nfsrpc_openrpc(VFSTONFS(vnode_mount(dvp)), dvp,
2196 np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
2197 nfhp->nfh_fh, nfhp->nfh_len,
2198 (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), op,
2199 name, namelen, &dp, 0, 0x0, cred, p, 0, 1);
2200 if (ret == NFSERR_DELAY)
2201 (void) nfs_catnap(PZERO, ret, "nfs_crt2");
2202 } while (ret == NFSERR_DELAY);
2205 FREE((caddr_t)dp, M_NFSCLDELEG);
2208 if (ret == NFSERR_STALECLIENTID ||
2209 ret == NFSERR_STALEDONTRECOVER ||
2210 ret == NFSERR_BADSESSION)
2214 nfscl_openrelease(nmp, op, error, newone);
/* A local error takes precedence over the server status. */
2217 if (nd->nd_repstat != 0 && error == 0)
2218 error = nd->nd_repstat;
2219 if (error == NFSERR_STALECLIENTID)
2220 nfscl_initiate_recovery(owp->nfsow_clp);
2224 else if (dp != NULL)
2225 FREE((caddr_t)dp, M_NFSCLDELEG);
2226 mbuf_freem(nd->nd_mrep);
/*
 * Remove the entry called name from directory dvp.
 *   dvp, name, namelen - parent directory and name to remove; namelen
 *                        above NFS_MAXNAMLEN yields ENAMETOOLONG
 *   vp                 - vnode of the object being removed; used for the
 *                        NFSv4 delegation lookup
 *   cred, p            - handed through to the lower layers
 *   dnap, dattrflagp   - receive the directory attributes
 * On NFSv4 mounts nfscl_removedeleg() is asked for a delegation stateid
 * for vp. The NFSPROC_RETDELEGREMOVE compound built below carries that
 * stateid, a Putfh of the directory and the Remove op (the condition that
 * selects it over the plain NFSPROC_REMOVE request is not visible here).
 * error ends up as the first parse error or else nd->nd_repstat.
 */
2234 nfsrpc_remove(vnode_t dvp, char *name, int namelen, vnode_t vp,
2235 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp,
2239 struct nfsrv_descript nfsd, *nd = &nfsd;
2241 struct nfsmount *nmp;
2242 nfsv4stateid_t dstateid;
2243 int error, ret = 0, i;
2246 if (namelen > NFS_MAXNAMLEN)
2247 return (ENAMETOOLONG);
2248 nmp = VFSTONFS(vnode_mount(dvp));
/* The ret == 0 test keeps a retry pass from asking for the delegation again. */
2250 if (NFSHASNFSV4(nmp) && ret == 0) {
2251 ret = nfscl_removedeleg(vp, p, &dstateid);
2253 NFSCL_REQSTART(nd, NFSPROC_RETDELEGREMOVE, vp);
2254 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
2256 if (NFSHASNFSV4N(nmp))
/* The delegation stateid is copied in as is, followed by the Putfh op. */
2259 *tl++ = dstateid.seqid;
2260 *tl++ = dstateid.other[0];
2261 *tl++ = dstateid.other[1];
2262 *tl++ = dstateid.other[2];
2263 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2265 (void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2266 np->n_fhp->nfh_len, 0);
2267 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2268 *tl = txdr_unsigned(NFSV4OP_REMOVE);
2274 NFSCL_REQSTART(nd, NFSPROC_REMOVE, dvp);
2275 (void) nfsm_strtom(nd, name, namelen);
2276 error = nfscl_request(nd, dvp, p, cred, dstuff);
2279 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2280 /* For NFSv4, parse out any Delegreturn replies. */
2281 if (ret > 0 && nd->nd_repstat != 0 &&
2282 (nd->nd_flag & ND_NOMOREDATA)) {
2284 * If the Delegreturn failed, try again without
2285 * it. The server will Recall, as required.
2287 mbuf_freem(nd->nd_mrep);
/*
 * Step over the results of the ops placed ahead of the Remove: two words
 * per op, two ops per unit of ret.
 */
2290 for (i = 0; i < (ret * 2); i++) {
2291 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2293 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2295 nd->nd_flag |= ND_NOMOREDATA;
2298 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
/* A local parse error takes precedence over the server status. */
2300 if (nd->nd_repstat && !error)
2301 error = nd->nd_repstat;
2303 mbuf_freem(nd->nd_mrep);
2308 * Do an nfs rename rpc.
/*
 * nfsrpc_rename: build and send the Rename request that moves fnameptr in
 * fdvp to tnameptr in tdvp, then parse the reply.
 *
 * - Fails with ENAMETOOLONG, before any request is started, when either
 *   name length exceeds NFS_MAXNAMLEN.
 * - On NFSv4 mounts nfscl_renamedeleg() is asked for delegation stateids
 *   on fvp and tvp (fdstateid, tdstateid); depending on gotfd and gottd
 *   the request is started as one of the NFSPROC_RETDELEGRENAME procedures
 *   and the stateids are emitted ahead of the Rename operation.
 * - Directory attributes from the reply are loaded through
 *   nfscl_wcc_data() into fnap/fattrflagp and tnap/tattrflagp.
 * - A non-zero nd_repstat is copied into error when no local error was
 *   recorded.
 *
 * NOTE(review): the embedded original line numbers are not contiguous, so
 * braces, else arms and some statements appear to be missing from this
 * listing; confirm exact control flow against the complete file.
 */
2311 nfsrpc_rename(vnode_t fdvp, vnode_t fvp, char *fnameptr, int fnamelen,
2312 vnode_t tdvp, vnode_t tvp, char *tnameptr, int tnamelen, struct ucred *cred,
2313 NFSPROC_T *p, struct nfsvattr *fnap, struct nfsvattr *tnap,
2314 int *fattrflagp, int *tattrflagp, void *fstuff, void *tstuff)
2317 struct nfsrv_descript nfsd, *nd = &nfsd;
2318 struct nfsmount *nmp;
2320 nfsattrbit_t attrbits;
2321 nfsv4stateid_t fdstateid, tdstateid;
2322 int error = 0, ret = 0, gottd = 0, gotfd = 0, i;
2326 nmp = VFSTONFS(vnode_mount(fdvp));
2327 if (fnamelen > NFS_MAXNAMLEN || tnamelen > NFS_MAXNAMLEN)
2328 return (ENAMETOOLONG);
2330 if (NFSHASNFSV4(nmp) && ret == 0) {
2331 ret = nfscl_renamedeleg(fvp, &fdstateid, &gotfd, tvp,
2332 &tdstateid, &gottd, p);
2333 if (gotfd && gottd) {
2334 NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME2, fvp);
2336 NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, fvp);
2338 NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, tvp);
/* Stateid words for the delegation reported through fdstateid. */
2341 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2342 if (NFSHASNFSV4N(nmp))
2345 *tl++ = fdstateid.seqid;
2346 *tl++ = fdstateid.other[0];
2347 *tl++ = fdstateid.other[1];
2348 *tl = fdstateid.other[2];
2350 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2351 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2353 (void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2354 np->n_fhp->nfh_len, 0);
2355 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2356 *tl = txdr_unsigned(NFSV4OP_DELEGRETURN);
/* Stateid words for the delegation reported through tdstateid. */
2360 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2361 if (NFSHASNFSV4N(nmp))
2364 *tl++ = tdstateid.seqid;
2365 *tl++ = tdstateid.other[0];
2366 *tl++ = tdstateid.other[1];
2367 *tl = tdstateid.other[2];
2370 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2371 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2373 (void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2374 np->n_fhp->nfh_len, 0);
2375 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2376 *tl = txdr_unsigned(NFSV4OP_SAVEFH);
2382 NFSCL_REQSTART(nd, NFSPROC_RENAME, fdvp);
/* NFSv4 operations added here: Getattr, PutFH of tdvp, Getattr, Rename. */
2383 if (nd->nd_flag & ND_NFSV4) {
2384 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2385 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2386 NFSWCCATTR_ATTRBIT(&attrbits);
2387 (void) nfsrv_putattrbit(nd, &attrbits);
2388 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2389 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2390 (void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2391 VTONFS(tdvp)->n_fhp->nfh_len, 0);
2392 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2393 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2394 (void) nfsrv_putattrbit(nd, &attrbits);
2395 nd->nd_flag |= ND_V4WCCATTR;
2396 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2397 *tl = txdr_unsigned(NFSV4OP_RENAME);
2399 (void) nfsm_strtom(nd, fnameptr, fnamelen);
/* Non-NFSv4 requests carry the tdvp file handle between the two names. */
2400 if (!(nd->nd_flag & ND_NFSV4))
2401 (void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2402 VTONFS(tdvp)->n_fhp->nfh_len, 0);
2403 (void) nfsm_strtom(nd, tnameptr, tnamelen);
2404 error = nfscl_request(nd, fdvp, p, cred, fstuff);
2407 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2408 /* For NFSv4, parse out any Delegreturn replies. */
2409 if (ret > 0 && nd->nd_repstat != 0 &&
2410 (nd->nd_flag & ND_NOMOREDATA)) {
2412 * If the Delegreturn failed, try again without
2413 * it. The server will Recall, as required.
2415 mbuf_freem(nd->nd_mrep);
/* Two reply words are consumed per iteration, ret * 2 iterations in all. */
2418 for (i = 0; i < (ret * 2); i++) {
2419 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2421 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2423 if (i == 0 && ret > 1) {
2425 * If the Delegreturn failed, try again
2426 * without it. The server will Recall, as
2428 * If ret > 1, the first iteration of this
2429 * loop is the second DelegReturn result.
2431 mbuf_freem(nd->nd_mrep);
2434 nd->nd_flag |= ND_NOMOREDATA;
2439 /* Now, the first wcc attribute reply. */
2440 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2441 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2443 nd->nd_flag |= ND_NOMOREDATA;
2445 error = nfscl_wcc_data(nd, fdvp, fnap, fattrflagp, NULL,
2447 /* and the second wcc attribute reply. */
2448 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4 &&
2450 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2452 nd->nd_flag |= ND_NOMOREDATA;
2455 error = nfscl_wcc_data(nd, tdvp, tnap, tattrflagp,
/* A server status only becomes the result when parsing itself succeeded. */
2458 if (nd->nd_repstat && !error)
2459 error = nd->nd_repstat;
2461 mbuf_freem(nd->nd_mrep);
2466 * nfs hard link create rpc
/*
 * nfsrpc_link: send the Link request that adds name in directory dvp as a
 * hard link to vp, then parse the reply.
 *
 * - Fails with ENAMETOOLONG when namelen exceeds NFS_MAXNAMLEN.
 * - The request is started against vp (NFSPROC_LINK); the file handle of
 *   dvp and the new name follow. NFSv4 additionally emits PutFH, a Getattr
 *   using the WCC attribute bits, and the Link operation code.
 * - NFSv3 replies yield post-op attributes (nap, attrflagp) and wcc data
 *   for dvp (dnap, dattrflagp); NFSv4 replies first consume the PutFH and
 *   Getattr results and then load the wcc data for dvp.
 * - A non-zero nd_repstat is copied into error when no local error was
 *   recorded.
 *
 * NOTE(review): the embedded original line numbers are not contiguous, so
 * braces and some statements appear to be missing from this listing;
 * confirm exact control flow against the complete file.
 */
2469 nfsrpc_link(vnode_t dvp, vnode_t vp, char *name, int namelen,
2470 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2471 struct nfsvattr *nap, int *attrflagp, int *dattrflagp, void *dstuff)
2474 struct nfsrv_descript nfsd, *nd = &nfsd;
2475 nfsattrbit_t attrbits;
2480 if (namelen > NFS_MAXNAMLEN)
2481 return (ENAMETOOLONG);
2482 NFSCL_REQSTART(nd, NFSPROC_LINK, vp);
2483 if (nd->nd_flag & ND_NFSV4) {
2484 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2485 *tl = txdr_unsigned(NFSV4OP_PUTFH);
/* File handle of the directory that receives the new name. */
2487 (void) nfsm_fhtom(nd, VTONFS(dvp)->n_fhp->nfh_fh,
2488 VTONFS(dvp)->n_fhp->nfh_len, 0);
2489 if (nd->nd_flag & ND_NFSV4) {
2490 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2491 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2492 NFSWCCATTR_ATTRBIT(&attrbits);
2493 (void) nfsrv_putattrbit(nd, &attrbits);
2494 nd->nd_flag |= ND_V4WCCATTR;
2495 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2496 *tl = txdr_unsigned(NFSV4OP_LINK);
2498 (void) nfsm_strtom(nd, name, namelen);
2499 error = nfscl_request(nd, vp, p, cred, dstuff);
2502 if (nd->nd_flag & ND_NFSV3) {
2503 error = nfscl_postop_attr(nd, nap, attrflagp, dstuff);
2505 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
2507 } else if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2509 * First, parse out the PutFH and Getattr result.
2511 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2513 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2515 nd->nd_flag |= ND_NOMOREDATA;
2517 * Get the pre-op attributes.
2519 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
/* A server status only becomes the result when parsing itself succeeded. */
2521 if (nd->nd_repstat && !error)
2522 error = nd->nd_repstat;
2524 mbuf_freem(nd->nd_mrep);
2529 * nfs symbolic link create rpc
/*
 * nfsrpc_symlink: send the Symlink request that creates name in dvp
 * pointing at target, then parse the reply.
 *
 * - Fails with ENAMETOOLONG when strlen(target) exceeds NFS_MAXPATHLEN or
 *   namelen exceeds NFS_MAXNAMLEN.
 * - Argument order differs by version: NFSv4 sends the NFLNK type and the
 *   target before the name and attributes; NFSv3 sends name, attributes,
 *   target; NFSv2 sends name, target, then attributes filled with
 *   NFSSATTR_SIZENEG1.
 * - NFSv4 replies load wcc data for dvp (dnap, dattrflagp). NFSv3 replies
 *   go through nfscl_mtofh() (nfhpp, nnap, attrflagp) when nd_repstat is
 *   zero and also load wcc data for dvp.
 * - A non-zero nd_repstat is copied into error when no local error was
 *   recorded.
 * - The trailing test selects EEXIST results when nfsignore_eexist is set
 *   and the mount is either not NFSv4 or has nm_minorvers == 0; the
 *   statement it guards is not visible in this listing.
 *
 * NOTE(review): the embedded original line numbers are not contiguous, so
 * braces and some statements appear to be missing from this listing;
 * confirm exact control flow against the complete file.
 */
2532 nfsrpc_symlink(vnode_t dvp, char *name, int namelen, char *target,
2533 struct vattr *vap, struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2534 struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2535 int *dattrflagp, void *dstuff)
2538 struct nfsrv_descript nfsd, *nd = &nfsd;
2539 struct nfsmount *nmp;
2540 int slen, error = 0;
2545 nmp = VFSTONFS(vnode_mount(dvp));
2546 slen = strlen(target);
2547 if (slen > NFS_MAXPATHLEN || namelen > NFS_MAXNAMLEN)
2548 return (ENAMETOOLONG);
2549 NFSCL_REQSTART(nd, NFSPROC_SYMLINK, dvp);
/* NFSv4 places the object type and link target ahead of the name. */
2550 if (nd->nd_flag & ND_NFSV4) {
2551 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2552 *tl = txdr_unsigned(NFLNK);
2553 (void) nfsm_strtom(nd, target, slen);
2555 (void) nfsm_strtom(nd, name, namelen);
2556 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2557 nfscl_fillsattr(nd, vap, dvp, 0, 0);
/* NFSv2 and NFSv3 place the link target after the name. */
2558 if (!(nd->nd_flag & ND_NFSV4))
2559 (void) nfsm_strtom(nd, target, slen);
2560 if (nd->nd_flag & ND_NFSV2)
2561 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
2562 error = nfscl_request(nd, dvp, p, cred, dstuff);
2565 if (nd->nd_flag & ND_NFSV4)
2566 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2567 if ((nd->nd_flag & ND_NFSV3) && !error) {
2568 if (!nd->nd_repstat)
2569 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2571 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
/* A server status only becomes the result when parsing itself succeeded. */
2574 if (nd->nd_repstat && !error)
2575 error = nd->nd_repstat;
2576 mbuf_freem(nd->nd_mrep);
2578 * Kludge: Map EEXIST => 0 assuming that it is a reply to a retry.
2579 * Only do this if vfs.nfs.ignore_eexist is set.
2580 * Never do this for NFSv4.1 or later minor versions, since sessions
2581 * should guarantee "exactly once" RPC semantics.
2583 if (error == EEXIST && nfsignore_eexist != 0 && (!NFSHASNFSV4(nmp) ||
2584 nmp->nm_minorvers == 0))
/*
 * nfsrpc_mkdir: send the Mkdir request that creates directory name in dvp,
 * then parse the reply.
 *
 * - Fails with ENAMETOOLONG when namelen exceeds NFS_MAXNAMLEN.
 * - The request carries the name and attributes filled by
 *   nfscl_fillsattr() with NFSSATTR_SIZENEG1. NFSv4 prefixes the NFDIR
 *   type and appends GetFH, Getattr, PutFH of the dvp file handle (fhp)
 *   and a second Getattr.
 * - NFSv4 replies load wcc data for dvp first. When nd_repstat and error
 *   are both zero, nfscl_mtofh() fills nfhpp, nnap and attrflagp; NFSv4
 *   then consumes four more words and loads dnap with nfsm_loadattr().
 * - NFSv3 replies load wcc data for dvp (dnap, dattrflagp).
 * - A non-zero nd_repstat is copied into error when no local error was
 *   recorded.
 * - The trailing test selects EEXIST results when nfsignore_eexist is set
 *   and the mount is either not NFSv4 or has nm_minorvers == 0; the
 *   statement it guards is not visible in this listing.
 *
 * NOTE(review): the embedded original line numbers are not contiguous, so
 * braces and some statements appear to be missing from this listing;
 * confirm exact control flow against the complete file.
 */
2593 nfsrpc_mkdir(vnode_t dvp, char *name, int namelen, struct vattr *vap,
2594 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2595 struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2596 int *dattrflagp, void *dstuff)
2599 struct nfsrv_descript nfsd, *nd = &nfsd;
2600 nfsattrbit_t attrbits;
2603 struct nfsmount *nmp;
2608 nmp = VFSTONFS(vnode_mount(dvp));
2609 fhp = VTONFS(dvp)->n_fhp;
2610 if (namelen > NFS_MAXNAMLEN)
2611 return (ENAMETOOLONG);
2612 NFSCL_REQSTART(nd, NFSPROC_MKDIR, dvp);
2613 if (nd->nd_flag & ND_NFSV4) {
2614 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2615 *tl = txdr_unsigned(NFDIR);
2617 (void) nfsm_strtom(nd, name, namelen);
2618 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
/* NFSv4 operations added here: GetFH, Getattr, PutFH of dvp, Getattr. */
2619 if (nd->nd_flag & ND_NFSV4) {
2620 NFSGETATTR_ATTRBIT(&attrbits);
2621 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2622 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
2623 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2624 (void) nfsrv_putattrbit(nd, &attrbits);
2625 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2626 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2627 (void) nfsm_fhtom(nd, fhp->nfh_fh, fhp->nfh_len, 0);
2628 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2629 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2630 (void) nfsrv_putattrbit(nd, &attrbits);
2632 error = nfscl_request(nd, dvp, p, cred, dstuff);
2635 if (nd->nd_flag & ND_NFSV4)
2636 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2637 if (!nd->nd_repstat && !error) {
2638 if (nd->nd_flag & ND_NFSV4) {
2639 NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
2640 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2643 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2644 if (error == 0 && (nd->nd_flag & ND_NFSV4) != 0) {
2645 /* Get rid of the PutFH and Getattr status values. */
2646 NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
2647 /* Load the directory attributes. */
2648 error = nfsm_loadattr(nd, dnap);
2653 if ((nd->nd_flag & ND_NFSV3) && !error)
2654 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
/* A server status only becomes the result when parsing itself succeeded. */
2655 if (nd->nd_repstat && !error)
2656 error = nd->nd_repstat;
2658 mbuf_freem(nd->nd_mrep);
2660 * Kludge: Map EEXIST => 0 assuming that it is a reply to a retry.
2661 * Only do this if vfs.nfs.ignore_eexist is set.
2662 * Never do this for NFSv4.1 or later minor versions, since sessions
2663 * should guarantee "exactly once" RPC semantics.
2665 if (error == EEXIST && nfsignore_eexist != 0 && (!NFSHASNFSV4(nmp) ||
2666 nmp->nm_minorvers == 0))
2672 * nfs remove directory call
/*
 * nfsrpc_rmdir: send the Rmdir request that removes directory name from
 * dvp, then parse the reply.
 *
 * - Fails with ENAMETOOLONG when namelen exceeds NFS_MAXNAMLEN.
 * - The request (NFSPROC_RMDIR, started against dvp) carries only the name.
 * - NFSv3 and NFSv4 replies load wcc data for dvp into dnap/dattrflagp.
 * - A non-zero nd_repstat is copied into error when no local error was
 *   recorded, and the reply mbufs are freed.
 * - The trailing test selects ENOENT results; the statement it guards is
 *   not visible in this listing.
 *
 * NOTE(review): the embedded original line numbers are not contiguous, so
 * braces and some statements appear to be missing from this listing;
 * confirm exact control flow against the complete file.
 */
2675 nfsrpc_rmdir(vnode_t dvp, char *name, int namelen, struct ucred *cred,
2676 NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp, void *dstuff)
2678 struct nfsrv_descript nfsd, *nd = &nfsd;
2682 if (namelen > NFS_MAXNAMLEN)
2683 return (ENAMETOOLONG);
2684 NFSCL_REQSTART(nd, NFSPROC_RMDIR, dvp);
2685 (void) nfsm_strtom(nd, name, namelen);
2686 error = nfscl_request(nd, dvp, p, cred, dstuff);
2689 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2690 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
/* A server status only becomes the result when parsing itself succeeded. */
2691 if (nd->nd_repstat && !error)
2692 error = nd->nd_repstat;
2693 mbuf_freem(nd->nd_mrep);
2695 * Kludge: Map ENOENT => 0 assuming that you have a reply to a retry.
2697 if (error == ENOENT)
2704 * Always returns with either uio_resid unchanged, if you are at the
2705 * end of the directory, or uio_resid == 0, with all DIRBLKSIZ chunks
2707 * I felt this would allow caching of directory blocks more easily
2708 * than returning a partially filled block.
2709 * Directory offset cookies:
2710 * Oh my, what to do with them...
2711 * I can think of three ways to deal with them:
2712 * 1 - have the layer above these RPCs maintain a map between logical
2713 * directory byte offsets and the NFS directory offset cookies
2714 * 2 - pass the opaque directory offset cookies up into userland
2715 * and let the libc functions deal with them, via the system call
2716 * 3 - return them to userland in the "struct dirent", so future versions
2717 * of libc can use them and do whatever is necessary to make things work
2718 * above these rpc calls, in the meantime
2719 * For now, I do #3 by "hiding" the directory offset cookies after the
2720 * d_name field in struct dirent. This is space inside d_reclen that
2721 * will be ignored by anything that doesn't know about them.
2722 * The directory offset cookies are filled in as the last 8 bytes of
2723 * each directory entry, after d_name. Someday, the userland libc
2724 * functions may be able to use these. In the meantime, it satisfies
2725 * OpenBSD's requirements for cookies being returned.
2726 * It expects the directory offset cookie for the read to be in uio_offset
2727 * and returns the one for the next entry after this directory block in
/*
 * nfsrpc_readdir: fill the buffer described by uiop with directory entries
 * obtained through Readdir requests, starting from the cookie in *cookiep.
 *
 * - The KASSERT requires a single iovec and a residual that is a multiple
 *   of DIRBLKSIZ.
 * - readsize starts at nm_readdirsize and is reduced to
 *   uio_resid + DIRBLKSIZ when the caller asked for less.
 * - In the NFSv4 setup section, when uio_offset is 0, a Lookupp request is
 *   issued to obtain file ids and the dot and dot-dot entries are written
 *   by hand ahead of any server entries.
 * - Requests are repeated while more_dirs and bigenough are both set. Each
 *   entry copied out gets its cookie stored after the padded name (via
 *   tl2), and the same cookie is mirrored into *cookiep and cookie.
 * - Entries never straddle a DIRBLKSIZ boundary: when the next entry does
 *   not fit in what is left of the block, the previous d_reclen is grown
 *   by the remainder.
 * - After the request loop, remaining DIRBLKSIZ chunks receive empty
 *   records carrying the last cookie, unless no data was produced at all.
 *
 * NOTE(review): the embedded original line numbers are not contiguous, so
 * braces, labels, else arms, the assignments to *eofp and the return
 * statements are not visible in this listing; confirm exact control flow
 * against the complete file.
 */
2731 nfsrpc_readdir(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
2732 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
2733 int *eofp, void *stuff)
2736 struct dirent *dp = NULL;
2738 nfsquad_t cookie, ncookie;
2739 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
2740 struct nfsnode *dnp = VTONFS(vp);
2741 struct nfsvattr nfsva;
2742 struct nfsrv_descript nfsd, *nd = &nfsd;
2743 int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
2744 int reqsize, tryformoredirs = 1, readsize, eof = 0, gotmnton = 0;
2745 long dotfileid, dotdotfileid = 0;
2746 u_int32_t fakefileno = 0xffffffff, rderr;
2748 nfsattrbit_t attrbits, dattrbits;
2749 u_int32_t *tl2 = NULL;
/* Callers must pass one iovec whose residual is a DIRBLKSIZ multiple. */
2752 KASSERT(uiop->uio_iovcnt == 1 &&
2753 (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
2754 ("nfs readdirrpc bad uio"));
2757 * There is no point in reading a lot more than uio_resid, however
2758 * adding one additional DIRBLKSIZ makes sense. Since uio_resid
2759 * and nm_readdirsize are both exact multiples of DIRBLKSIZ, this
2760 * will never make readsize > nm_readdirsize.
2762 readsize = nmp->nm_readdirsize;
2763 if (readsize > uio_uio_resid(uiop))
2764 readsize = uio_uio_resid(uiop) + DIRBLKSIZ;
/* Starting residual, compared later to detect that nothing was produced. */
2769 tresid = uio_uio_resid(uiop);
2770 cookie.lval[0] = cookiep->nfsuquad[0];
2771 cookie.lval[1] = cookiep->nfsuquad[1];
2775 * For NFSv4, first create the "." and ".." entries.
2777 if (NFSHASNFSV4(nmp)) {
2778 reqsize = 6 * NFSX_UNSIGNED;
2779 NFSGETATTR_ATTRBIT(&dattrbits);
2780 NFSZERO_ATTRBIT(&attrbits);
2781 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
2782 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TYPE);
2783 if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
2784 NFSATTRBIT_MOUNTEDONFILEID)) {
2785 NFSSETBIT_ATTRBIT(&attrbits,
2786 NFSATTRBIT_MOUNTEDONFILEID);
2790 * Must fake it. Use the fileno, except when the
2791 * fsid is != to that of the directory. For that
2792 * case, generate a fake fileno that is not the same.
2794 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
2799 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
2801 if (uiop->uio_offset == 0) {
2802 NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
2803 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2804 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
2805 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2806 (void) nfsrv_putattrbit(nd, &attrbits);
2807 error = nfscl_request(nd, vp, p, cred, stuff);
2810 dotfileid = 0; /* Fake out the compiler. */
2811 if ((nd->nd_flag & ND_NOMOREDATA) == 0) {
2812 error = nfsm_loadattr(nd, &nfsva);
2815 dotfileid = nfsva.na_fileid;
2817 if (nd->nd_repstat == 0) {
2818 NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
2819 len = fxdr_unsigned(int, *(tl + 4));
2820 if (len > 0 && len <= NFSX_V4FHMAX)
2821 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
2825 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2826 nfsva.na_mntonfileno = 0xffffffff;
2827 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
2828 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
2829 NULL, NULL, NULL, p, cred);
2831 dotdotfileid = dotfileid;
2832 } else if (gotmnton) {
2833 if (nfsva.na_mntonfileno != 0xffffffff)
2834 dotdotfileid = nfsva.na_mntonfileno;
2836 dotdotfileid = nfsva.na_fileid;
2837 } else if (nfsva.na_filesid[0] ==
2838 dnp->n_vattr.na_filesid[0] &&
2839 nfsva.na_filesid[1] ==
2840 dnp->n_vattr.na_filesid[1]) {
2841 dotdotfileid = nfsva.na_fileid;
2845 } while (fakefileno ==
2847 dotdotfileid = fakefileno;
2850 } else if (nd->nd_repstat == NFSERR_NOENT) {
2852 * Lookupp returns NFSERR_NOENT when we are
2853 * at the root, so just use the current dir.
2856 dotdotfileid = dotfileid;
2858 error = nd->nd_repstat;
2860 mbuf_freem(nd->nd_mrep);
/* Hand-built dot entry: zeroed 8 byte name area, cookie slot at d_name[8]. */
2864 dp = (struct dirent *)uio_iov_base(uiop);
2866 dp->d_type = DT_DIR;
2867 dp->d_fileno = dotfileid;
2869 *((uint64_t *)dp->d_name) = 0; /* Zero pad it. */
2870 dp->d_name[0] = '.';
2871 dp->d_reclen = _GENERIC_DIRSIZ(dp) + NFSX_HYPER;
2873 * Just make these offset cookie 0.
2875 tl = (u_int32_t *)&dp->d_name[8];
2878 blksiz += dp->d_reclen;
2879 uio_uio_resid_add(uiop, -(dp->d_reclen));
2880 uiop->uio_offset += dp->d_reclen;
2881 uio_iov_base_add(uiop, dp->d_reclen);
2882 uio_iov_len_add(uiop, -(dp->d_reclen));
/* Same layout for the dot-dot entry, using dotdotfileid. */
2883 dp = (struct dirent *)uio_iov_base(uiop);
2885 dp->d_type = DT_DIR;
2886 dp->d_fileno = dotdotfileid;
2888 *((uint64_t *)dp->d_name) = 0;
2889 dp->d_name[0] = '.';
2890 dp->d_name[1] = '.';
2891 dp->d_reclen = _GENERIC_DIRSIZ(dp) + NFSX_HYPER;
2893 * Just make these offset cookie 0.
2895 tl = (u_int32_t *)&dp->d_name[8];
2898 blksiz += dp->d_reclen;
2899 uio_uio_resid_add(uiop, -(dp->d_reclen));
2900 uiop->uio_offset += dp->d_reclen;
2901 uio_iov_base_add(uiop, dp->d_reclen);
2902 uio_iov_len_add(uiop, -(dp->d_reclen));
2904 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_RDATTRERROR);
2906 reqsize = 5 * NFSX_UNSIGNED;
2911 * Loop around doing readdir rpc's of size readsize.
2912 * The stopping criteria is EOF or buffer full.
2914 while (more_dirs && bigenough) {
2916 NFSCL_REQSTART(nd, NFSPROC_READDIR, vp);
2917 if (nd->nd_flag & ND_NFSV2) {
2918 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2919 *tl++ = cookie.lval[1];
2920 *tl = txdr_unsigned(readsize);
2922 NFSM_BUILD(tl, u_int32_t *, reqsize);
2923 *tl++ = cookie.lval[0];
2924 *tl++ = cookie.lval[1];
2925 if (cookie.qval == 0) {
2930 *tl++ = dnp->n_cookieverf.nfsuquad[0];
2931 *tl++ = dnp->n_cookieverf.nfsuquad[1];
2934 if (nd->nd_flag & ND_NFSV4) {
2935 *tl++ = txdr_unsigned(readsize);
2936 *tl = txdr_unsigned(readsize);
2937 (void) nfsrv_putattrbit(nd, &attrbits);
2938 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2939 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2940 (void) nfsrv_putattrbit(nd, &dattrbits);
2942 *tl = txdr_unsigned(readsize);
2945 error = nfscl_request(nd, vp, p, cred, stuff);
2948 if (!(nd->nd_flag & ND_NFSV2)) {
2949 if (nd->nd_flag & ND_NFSV3)
2950 error = nfscl_postop_attr(nd, nap, attrflagp,
2952 if (!nd->nd_repstat && !error) {
2953 NFSM_DISSECT(tl, u_int32_t *, NFSX_HYPER);
2955 dnp->n_cookieverf.nfsuquad[0] = *tl++;
2956 dnp->n_cookieverf.nfsuquad[1] = *tl;
2960 if (nd->nd_repstat || error) {
2962 error = nd->nd_repstat;
2965 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2966 more_dirs = fxdr_unsigned(int, *tl);
2970 /* loop through the dir entries, doctoring them to 4bsd form */
2971 while (more_dirs && bigenough) {
2972 if (nd->nd_flag & ND_NFSV4) {
2973 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2974 ncookie.lval[0] = *tl++;
2975 ncookie.lval[1] = *tl++;
2976 len = fxdr_unsigned(int, *tl);
2977 } else if (nd->nd_flag & ND_NFSV3) {
2978 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2979 nfsva.na_fileid = fxdr_hyper(tl);
2981 len = fxdr_unsigned(int, *tl);
2983 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2985 fxdr_unsigned(long, *tl++);
2986 len = fxdr_unsigned(int, *tl);
2988 if (len <= 0 || len > NFS_MAXNAMLEN) {
2992 tlen = roundup2(len, 8);
2994 tlen += 8; /* To ensure null termination. */
2995 left = DIRBLKSIZ - blksiz;
2996 if (_GENERIC_DIRLEN(len) + NFSX_HYPER > left) {
2997 dp->d_reclen += left;
2998 uio_iov_base_add(uiop, left);
2999 uio_iov_len_add(uiop, -(left));
3000 uio_uio_resid_add(uiop, -(left));
3001 uiop->uio_offset += left;
3004 if (_GENERIC_DIRLEN(len) + NFSX_HYPER >
3005 uio_uio_resid(uiop))
3008 dp = (struct dirent *)uio_iov_base(uiop);
3011 dp->d_reclen = _GENERIC_DIRLEN(len) +
3013 dp->d_type = DT_UNKNOWN;
3014 blksiz += dp->d_reclen;
3015 if (blksiz == DIRBLKSIZ)
3017 uio_uio_resid_add(uiop, -(DIRHDSIZ));
3018 uiop->uio_offset += DIRHDSIZ;
3019 uio_iov_base_add(uiop, DIRHDSIZ);
3020 uio_iov_len_add(uiop, -(DIRHDSIZ));
3021 error = nfsm_mbufuio(nd, uiop, len);
3024 cp = uio_iov_base(uiop);
3026 *cp = '\0'; /* null terminate */
3027 cp += tlen; /* points to cookie storage */
3028 tl2 = (u_int32_t *)cp;
3029 uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
3030 uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
3031 uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
3032 uiop->uio_offset += (tlen + NFSX_HYPER);
3034 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3038 if (nd->nd_flag & ND_NFSV4) {
3040 nfsva.na_mntonfileno = 0xffffffff;
3041 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
3042 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3043 NULL, NULL, &rderr, p, cred);
3046 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3047 } else if (nd->nd_flag & ND_NFSV3) {
3048 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
3049 ncookie.lval[0] = *tl++;
3050 ncookie.lval[1] = *tl++;
3052 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
3053 ncookie.lval[0] = 0;
3054 ncookie.lval[1] = *tl++;
3057 if (nd->nd_flag & ND_NFSV4) {
3062 if (nfsva.na_mntonfileno != 0xffffffff)
3063 dp->d_fileno = nfsva.na_mntonfileno;
3065 dp->d_fileno = nfsva.na_fileid;
3066 } else if (nfsva.na_filesid[0] ==
3067 dnp->n_vattr.na_filesid[0] &&
3068 nfsva.na_filesid[1] ==
3069 dnp->n_vattr.na_filesid[1]) {
3070 dp->d_fileno = nfsva.na_fileid;
3074 } while (fakefileno ==
3076 dp->d_fileno = fakefileno;
3078 dp->d_type = vtonfs_dtype(nfsva.na_type);
3081 dp->d_fileno = nfsva.na_fileid;
3083 *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
3085 *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
3088 more_dirs = fxdr_unsigned(int, *tl);
3091 * If at end of rpc data, get the eof boolean
3094 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3095 eof = fxdr_unsigned(int, *tl);
3098 if (nd->nd_flag & ND_NFSV4) {
3099 error = nfscl_postop_attr(nd, nap, attrflagp,
3105 mbuf_freem(nd->nd_mrep);
3109 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3110 * by increasing d_reclen for the last record.
3113 left = DIRBLKSIZ - blksiz;
3114 dp->d_reclen += left;
3115 uio_iov_base_add(uiop, left);
3116 uio_iov_len_add(uiop, -(left));
3117 uio_uio_resid_add(uiop, -(left));
3118 uiop->uio_offset += left;
3122 * If returning no data, assume end of file.
3123 * If not bigenough, return not end of file, since you aren't
3124 * returning all the data
3125 * Otherwise, return the eof flag from the server.
3128 if (tresid == ((size_t)(uio_uio_resid(uiop))))
3130 else if (!bigenough)
3137 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3139 while (uio_uio_resid(uiop) > 0 && uio_uio_resid(uiop) != tresid) {
3140 dp = (struct dirent *)uio_iov_base(uiop);
3141 dp->d_type = DT_UNKNOWN;
3144 dp->d_name[0] = '\0';
3145 tl = (u_int32_t *)&dp->d_name[4];
3146 *tl++ = cookie.lval[0];
3147 *tl = cookie.lval[1];
3148 dp->d_reclen = DIRBLKSIZ;
3149 uio_iov_base_add(uiop, DIRBLKSIZ);
3150 uio_iov_len_add(uiop, -(DIRBLKSIZ));
3151 uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3152 uiop->uio_offset += DIRBLKSIZ;
3156 if (nd->nd_mrep != NULL)
3157 mbuf_freem(nd->nd_mrep);
3163 * NFS V3 readdir plus RPC. Used in place of nfsrpc_readdir().
3164 * (Also used for NFS V4 when mount flag set.)
3165 * (ditto above w.r.t. multiple of DIRBLKSIZ, etc.)
/*
 * nfsrpc_readdirplus: fill the buffer described by uiop with directory
 * entries obtained through Readdirplus requests, starting from the cookie
 * in *cookiep, and use the per-entry attributes and file handles returned
 * by the server.
 *
 * - The KASSERT requires a single iovec and a residual that is a multiple
 *   of DIRBLKSIZ.
 * - In the NFSv4 setup section, when uio_offset is 0, a Lookupp request is
 *   issued to obtain file ids and the dot and dot-dot entries are written
 *   by hand ahead of any server entries.
 * - Requests of nm_readdirsize are repeated while more_dirs and bigenough
 *   are both set. Each entry copied out gets its cookie stored after the
 *   padded name (via tl2), mirrored into *cookiep and cookie.
 * - For an entry that came with a file handle, the handle is compared with
 *   that of the directory itself, dot-dot is skipped (see the existing
 *   lock-order remarks), and otherwise nfscl_nget() is called; a resulting
 *   vnode has its attributes loaded with nfscl_loadattrcache() and may be
 *   entered in the name cache with cache_enter_time().
 * - After the request loop, remaining DIRBLKSIZ chunks receive empty
 *   records carrying the last cookie, unless no data was produced at all.
 *
 * NOTE(review): the embedded original line numbers are not contiguous, so
 * braces, labels, else arms, the assignments to *eofp and the return
 * statements are not visible in this listing; confirm exact control flow
 * against the complete file.
 */
3168 nfsrpc_readdirplus(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
3169 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
3170 int *eofp, void *stuff)
3173 struct dirent *dp = NULL;
3175 vnode_t newvp = NULLVP;
3176 struct nfsrv_descript nfsd, *nd = &nfsd;
3177 struct nameidata nami, *ndp = &nami;
3178 struct componentname *cnp = &ndp->ni_cnd;
3179 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3180 struct nfsnode *dnp = VTONFS(vp), *np;
3181 struct nfsvattr nfsva;
3183 nfsquad_t cookie, ncookie;
3184 int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
3185 int attrflag, tryformoredirs = 1, eof = 0, gotmnton = 0;
3186 int isdotdot = 0, unlocknewvp = 0;
3187 long dotfileid, dotdotfileid = 0, fileno = 0;
3189 nfsattrbit_t attrbits, dattrbits;
3191 u_int32_t *tl2 = NULL, fakefileno = 0xffffffff, rderr;
3192 struct timespec dctime;
/* Callers must pass one iovec whose residual is a DIRBLKSIZ multiple. */
3194 KASSERT(uiop->uio_iovcnt == 1 &&
3195 (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
3196 ("nfs readdirplusrpc bad uio"));
/* dctime stays cleared until directory attributes supply a ctime. */
3197 timespecclear(&dctime);
3203 cookie.lval[0] = cookiep->nfsuquad[0];
3204 cookie.lval[1] = cookiep->nfsuquad[1];
/* Starting residual, compared later to detect that nothing was produced. */
3205 tresid = uio_uio_resid(uiop);
3208 * For NFSv4, first create the "." and ".." entries.
3210 if (NFSHASNFSV4(nmp)) {
3211 NFSGETATTR_ATTRBIT(&dattrbits);
3212 NFSZERO_ATTRBIT(&attrbits);
3213 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
3214 if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
3215 NFSATTRBIT_MOUNTEDONFILEID)) {
3216 NFSSETBIT_ATTRBIT(&attrbits,
3217 NFSATTRBIT_MOUNTEDONFILEID);
3221 * Must fake it. Use the fileno, except when the
3222 * fsid is != to that of the directory. For that
3223 * case, generate a fake fileno that is not the same.
3225 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
3230 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
3232 if (uiop->uio_offset == 0) {
3233 NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
3234 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
3235 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
3236 *tl = txdr_unsigned(NFSV4OP_GETATTR);
3237 (void) nfsrv_putattrbit(nd, &attrbits);
3238 error = nfscl_request(nd, vp, p, cred, stuff);
3241 dotfileid = 0; /* Fake out the compiler. */
3242 if ((nd->nd_flag & ND_NOMOREDATA) == 0) {
3243 error = nfsm_loadattr(nd, &nfsva);
3246 dctime = nfsva.na_ctime;
3247 dotfileid = nfsva.na_fileid;
3249 if (nd->nd_repstat == 0) {
3250 NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
3251 len = fxdr_unsigned(int, *(tl + 4));
3252 if (len > 0 && len <= NFSX_V4FHMAX)
3253 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3257 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
3258 nfsva.na_mntonfileno = 0xffffffff;
3259 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
3260 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3261 NULL, NULL, NULL, p, cred);
3263 dotdotfileid = dotfileid;
3264 } else if (gotmnton) {
3265 if (nfsva.na_mntonfileno != 0xffffffff)
3266 dotdotfileid = nfsva.na_mntonfileno;
3268 dotdotfileid = nfsva.na_fileid;
3269 } else if (nfsva.na_filesid[0] ==
3270 dnp->n_vattr.na_filesid[0] &&
3271 nfsva.na_filesid[1] ==
3272 dnp->n_vattr.na_filesid[1]) {
3273 dotdotfileid = nfsva.na_fileid;
3277 } while (fakefileno ==
3279 dotdotfileid = fakefileno;
3282 } else if (nd->nd_repstat == NFSERR_NOENT) {
3284 * Lookupp returns NFSERR_NOENT when we are
3285 * at the root, so just use the current dir.
3288 dotdotfileid = dotfileid;
3290 error = nd->nd_repstat;
3292 mbuf_freem(nd->nd_mrep);
/* Hand-built dot entry: zeroed 8 byte name area, cookie slot at d_name[8]. */
3296 dp = (struct dirent *)uio_iov_base(uiop);
3298 dp->d_type = DT_DIR;
3299 dp->d_fileno = dotfileid;
3301 *((uint64_t *)dp->d_name) = 0; /* Zero pad it. */
3302 dp->d_name[0] = '.';
3303 dp->d_reclen = _GENERIC_DIRSIZ(dp) + NFSX_HYPER;
3305 * Just make these offset cookie 0.
3307 tl = (u_int32_t *)&dp->d_name[8];
3310 blksiz += dp->d_reclen;
3311 uio_uio_resid_add(uiop, -(dp->d_reclen));
3312 uiop->uio_offset += dp->d_reclen;
3313 uio_iov_base_add(uiop, dp->d_reclen);
3314 uio_iov_len_add(uiop, -(dp->d_reclen));
/* Same layout for the dot-dot entry, using dotdotfileid. */
3315 dp = (struct dirent *)uio_iov_base(uiop);
3317 dp->d_type = DT_DIR;
3318 dp->d_fileno = dotdotfileid;
3320 *((uint64_t *)dp->d_name) = 0;
3321 dp->d_name[0] = '.';
3322 dp->d_name[1] = '.';
3323 dp->d_reclen = _GENERIC_DIRSIZ(dp) + NFSX_HYPER;
3325 * Just make these offset cookie 0.
3327 tl = (u_int32_t *)&dp->d_name[8];
3330 blksiz += dp->d_reclen;
3331 uio_uio_resid_add(uiop, -(dp->d_reclen));
3332 uiop->uio_offset += dp->d_reclen;
3333 uio_iov_base_add(uiop, dp->d_reclen);
3334 uio_iov_len_add(uiop, -(dp->d_reclen));
/* Attribute set that NFSv4 requests place after the two size words. */
3336 NFSREADDIRPLUS_ATTRBIT(&attrbits);
3338 NFSSETBIT_ATTRBIT(&attrbits,
3339 NFSATTRBIT_MOUNTEDONFILEID);
3343 * Loop around doing readdir rpc's of size nm_readdirsize.
3344 * The stopping criteria is EOF or buffer full.
3346 while (more_dirs && bigenough) {
3348 NFSCL_REQSTART(nd, NFSPROC_READDIRPLUS, vp);
3349 NFSM_BUILD(tl, u_int32_t *, 6 * NFSX_UNSIGNED);
3350 *tl++ = cookie.lval[0];
3351 *tl++ = cookie.lval[1];
3352 if (cookie.qval == 0) {
3357 *tl++ = dnp->n_cookieverf.nfsuquad[0];
3358 *tl++ = dnp->n_cookieverf.nfsuquad[1];
3361 *tl++ = txdr_unsigned(nmp->nm_readdirsize);
3362 *tl = txdr_unsigned(nmp->nm_readdirsize);
3363 if (nd->nd_flag & ND_NFSV4) {
3364 (void) nfsrv_putattrbit(nd, &attrbits);
3365 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3366 *tl = txdr_unsigned(NFSV4OP_GETATTR);
3367 (void) nfsrv_putattrbit(nd, &dattrbits);
3369 error = nfscl_request(nd, vp, p, cred, stuff);
3372 if (nd->nd_flag & ND_NFSV3)
3373 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3374 if (nd->nd_repstat || error) {
3376 error = nd->nd_repstat;
3379 if ((nd->nd_flag & ND_NFSV3) != 0 && *attrflagp != 0)
3380 dctime = nap->na_ctime;
3381 NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3383 dnp->n_cookieverf.nfsuquad[0] = *tl++;
3384 dnp->n_cookieverf.nfsuquad[1] = *tl++;
3386 more_dirs = fxdr_unsigned(int, *tl);
3390 /* loop through the dir entries, doctoring them to 4bsd form */
3391 while (more_dirs && bigenough) {
3392 NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3393 if (nd->nd_flag & ND_NFSV4) {
3394 ncookie.lval[0] = *tl++;
3395 ncookie.lval[1] = *tl++;
3397 fileno = fxdr_unsigned(long, *++tl);
3400 len = fxdr_unsigned(int, *tl);
3401 if (len <= 0 || len > NFS_MAXNAMLEN) {
3405 tlen = roundup2(len, 8);
3407 tlen += 8; /* To ensure null termination. */
3408 left = DIRBLKSIZ - blksiz;
3409 if (_GENERIC_DIRLEN(len) + NFSX_HYPER > left) {
3410 dp->d_reclen += left;
3411 uio_iov_base_add(uiop, left);
3412 uio_iov_len_add(uiop, -(left));
3413 uio_uio_resid_add(uiop, -(left));
3414 uiop->uio_offset += left;
3417 if (_GENERIC_DIRLEN(len) + NFSX_HYPER >
3418 uio_uio_resid(uiop))
3421 dp = (struct dirent *)uio_iov_base(uiop);
3424 dp->d_reclen = _GENERIC_DIRLEN(len) +
3426 dp->d_type = DT_UNKNOWN;
3427 blksiz += dp->d_reclen;
3428 if (blksiz == DIRBLKSIZ)
3430 uio_uio_resid_add(uiop, -(DIRHDSIZ));
3431 uiop->uio_offset += DIRHDSIZ;
3432 uio_iov_base_add(uiop, DIRHDSIZ);
3433 uio_iov_len_add(uiop, -(DIRHDSIZ));
3434 cnp->cn_nameptr = uio_iov_base(uiop);
3435 cnp->cn_namelen = len;
3437 error = nfsm_mbufuio(nd, uiop, len);
3440 cp = uio_iov_base(uiop);
3443 cp += tlen; /* points to cookie storage */
3444 tl2 = (u_int32_t *)cp;
3445 if (len == 2 && cnp->cn_nameptr[0] == '.' &&
3446 cnp->cn_nameptr[1] == '.')
3450 uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
3451 uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
3452 uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
3453 uiop->uio_offset += (tlen + NFSX_HYPER);
3455 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3460 if (nd->nd_flag & ND_NFSV3) {
3461 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
3462 ncookie.lval[0] = *tl++;
3463 ncookie.lval[1] = *tl++;
3464 attrflag = fxdr_unsigned(int, *tl);
3466 error = nfsm_loadattr(nd, &nfsva);
3470 NFSM_DISSECT(tl,u_int32_t *,NFSX_UNSIGNED);
3472 error = nfsm_getfh(nd, &nfhp);
3476 if (!attrflag && nfhp != NULL) {
3477 FREE((caddr_t)nfhp, M_NFSFH);
3482 nfsva.na_mntonfileno = 0xffffffff;
3483 error = nfsv4_loadattr(nd, NULL, &nfsva, &nfhp,
3484 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3485 NULL, NULL, &rderr, p, cred);
3491 if (nd->nd_flag & ND_NFSV4) {
3494 } else if (gotmnton) {
3495 if (nfsva.na_mntonfileno != 0xffffffff)
3496 dp->d_fileno = nfsva.na_mntonfileno;
3498 dp->d_fileno = nfsva.na_fileid;
3499 } else if (nfsva.na_filesid[0] ==
3500 dnp->n_vattr.na_filesid[0] &&
3501 nfsva.na_filesid[1] ==
3502 dnp->n_vattr.na_filesid[1]) {
3503 dp->d_fileno = nfsva.na_fileid;
3507 } while (fakefileno ==
3509 dp->d_fileno = fakefileno;
3512 dp->d_fileno = fileno;
3514 *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
3516 *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
3520 if (NFSRV_CMPFH(nfhp->nfh_fh, nfhp->nfh_len,
3521 dnp->n_fhp->nfh_fh, dnp->n_fhp->nfh_len)) {
3525 FREE((caddr_t)nfhp, M_NFSFH);
3527 } else if (isdotdot != 0) {
3529 * Skip doing a nfscl_nget() call for "..".
3530 * There's a race between acquiring the nfs
3531 * node here and lookups that look for the
3532 * directory being read (in the parent).
3533 * It would try to get a lock on ".." here,
3534 * owning the lock on the directory being
3535 * read. Lookup will hold the lock on ".."
3536 * and try to acquire the lock on the
3537 * directory being read.
3538 * If the directory is unlocked/relocked,
3539 * then there is a LOR with the buflock
3542 free(nfhp, M_NFSFH);
3544 error = nfscl_nget(vnode_mount(vp), vp,
3545 nfhp, cnp, p, &np, NULL, LK_EXCLUSIVE);
3552 if (newvp != NULLVP) {
3553 error = nfscl_loadattrcache(&newvp,
3554 &nfsva, NULL, NULL, 0, 0);
3563 vtonfs_dtype(np->n_vattr.na_type);
3565 NFSCNHASH(cnp, HASHINIT);
3566 if (cnp->cn_namelen <= NCHNAMLEN &&
3567 (newvp->v_type != VDIR ||
3568 dctime.tv_sec != 0)) {
3569 cache_enter_time(ndp->ni_dvp,
3572 newvp->v_type != VDIR ? NULL :
3582 } else if (nfhp != NULL) {
3583 FREE((caddr_t)nfhp, M_NFSFH);
3585 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3586 more_dirs = fxdr_unsigned(int, *tl);
3589 * If at end of rpc data, get the eof boolean
3592 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3593 eof = fxdr_unsigned(int, *tl);
3596 if (nd->nd_flag & ND_NFSV4) {
3597 error = nfscl_postop_attr(nd, nap, attrflagp,
3603 mbuf_freem(nd->nd_mrep);
3607 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3608 * by increasing d_reclen for the last record.
3611 left = DIRBLKSIZ - blksiz;
3612 dp->d_reclen += left;
3613 uio_iov_base_add(uiop, left);
3614 uio_iov_len_add(uiop, -(left));
3615 uio_uio_resid_add(uiop, -(left));
3616 uiop->uio_offset += left;
3620 * If returning no data, assume end of file.
3621 * If not bigenough, return not end of file, since you aren't
3622 * returning all the data
3623 * Otherwise, return the eof flag from the server.
3626 if (tresid == uio_uio_resid(uiop))
3628 else if (!bigenough)
3635 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3637 while (uio_uio_resid(uiop) > 0 && uio_uio_resid(uiop) != tresid) {
3638 dp = (struct dirent *)uio_iov_base(uiop);
3639 dp->d_type = DT_UNKNOWN;
3642 dp->d_name[0] = '\0';
3643 tl = (u_int32_t *)&dp->d_name[4];
3644 *tl++ = cookie.lval[0];
3645 *tl = cookie.lval[1];
3646 dp->d_reclen = DIRBLKSIZ;
3647 uio_iov_base_add(uiop, DIRBLKSIZ);
3648 uio_iov_len_add(uiop, -(DIRBLKSIZ));
3649 uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3650 uiop->uio_offset += DIRBLKSIZ;
3654 if (nd->nd_mrep != NULL)
3655 mbuf_freem(nd->nd_mrep);
/*
 * nfsrpc_commit: issue a Commit RPC for cnt bytes starting at offset on vp.
 *
 * The request carries the 64-bit offset followed by the count. For NFSv4
 * a Getattr op asking for the NFSGETATTR_ATTRBIT attributes is appended.
 * The wcc data in the reply is parsed into nap/attrflagp and, for NFSv4,
 * the post-op attributes are loaded into the same arguments.
 *
 * When the reply is good, the write verifier it returns is compared with
 * nmp->nm_verf. If they differ, the mount copy is replaced and nd_repstat
 * is set to NFSERR_STALEWRITEVERF; a non-zero nd_repstat is then copied
 * into error when no other error was recorded.
 *
 * The reply mbuf chain is freed at the end.
 */
3664 nfsrpc_commit(vnode_t vp, u_quad_t offset, int cnt, struct ucred *cred,
3665 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
3668 struct nfsrv_descript nfsd, *nd = &nfsd;
3669 nfsattrbit_t attrbits;
3671 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3674 NFSCL_REQSTART(nd, NFSPROC_COMMIT, vp);
3675 NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3676 txdr_hyper(offset, tl);
3678 *tl = txdr_unsigned(cnt);
3679 if (nd->nd_flag & ND_NFSV4) {
3681 * And do a Getattr op.
3683 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3684 *tl = txdr_unsigned(NFSV4OP_GETATTR);
3685 NFSGETATTR_ATTRBIT(&attrbits);
3686 (void) nfsrv_putattrbit(nd, &attrbits);
3688 error = nfscl_request(nd, vp, p, cred, stuff);
3691 error = nfscl_wcc_data(nd, vp, nap, attrflagp, NULL, stuff);
3692 if (!error && !nd->nd_repstat) {
3693 NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
/* A verifier mismatch is recorded in the mount and reported as stale. */
3695 if (NFSBCMP(nmp->nm_verf, tl, NFSX_VERF)) {
3696 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
3697 nd->nd_repstat = NFSERR_STALEWRITEVERF;
3700 if (nd->nd_flag & ND_NFSV4)
3701 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3704 if (!error && nd->nd_repstat)
3705 error = nd->nd_repstat;
3706 mbuf_freem(nd->nd_mrep);
3711 * NFS byte range lock rpc.
3712 * (Mostly just calls one of the three lower level RPC routines.)
/*
 * nfsrpc_advlock: top level byte range lock handling for vp.
 *
 * The flock range is first converted into start/off values according to
 * fl->l_whence (for the case that uses size, size is added to l_start),
 * and, when l_len is non-zero, an end of start + l_len - 1.
 *
 * The work is then selected by op:
 *  - F_GETLK: get the client structure with nfscl_getcl(), test the range
 *    with nfscl_lockt() and ask the server with nfsrpc_lockt(); the client
 *    reference is dropped with nfscl_clientrelease().
 *  - F_UNLCK (with fl->l_type == F_UNLCK): loop over the lock owners
 *    returned by nfscl_relbytelock(). A nfsrpc_locku() is issued only when
 *    dorpc is set and either the open has nfso_posixlock or the range is
 *    the whole file (off == 0, len == NFS64BITSSET). The RPC is repeated,
 *    with a nfs_catnap() in between, while the server replies
 *    NFSERR_GRACE or NFSERR_DELAY. nfscl_releasealllocks() is called when
 *    the loop is done.
 *  - F_SETLK: record the lock with nfscl_getbytelock() and do the RPC with
 *    nfsrpc_lock(), followed by nfscl_lockrelease(). The same posixlock /
 *    whole-file test is applied before the RPC.
 *    NOTE(review): the statements taken when nfscl_getbytelock() fails or
 *    sets donelocally, and when the range test fails, should be confirmed.
 *
 * Retry policy for F_SETLK: NFSERR_GRACE, NFSERR_STALESTATEID,
 * NFSERR_STALEDONTRECOVER, NFSERR_STALECLIENTID, NFSERR_DELAY and
 * NFSERR_BADSESSION cause a nfs_catnap() and another pass. NFSERR_EXPIRED
 * and NFSERR_BADSTATEID consult nfscl_hasexpired() and are retried only
 * while expireret == 0, clidrev != 0 and retrycnt < 4.
 *
 * Arguments: size is the file size used for the range conversion, reclaim
 * is passed through to nfsrpc_lock(), id and flags identify the lock owner
 * for the nfscl_*() calls.
 */
3715 nfsrpc_advlock(vnode_t vp, off_t size, int op, struct flock *fl,
3716 int reclaim, struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3718 struct nfscllockowner *lp;
3719 struct nfsclclient *clp;
3721 struct nfsrv_descript nfsd, *nd = &nfsd;
3722 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3725 u_int32_t clidrev = 0;
3726 int error = 0, newone = 0, expireret = 0, retrycnt, donelocally;
3730 * Convert the flock structure into a start and end and do POSIX
3733 switch (fl->l_whence) {
3737 * Caller is responsible for adding any necessary offset
3738 * when SEEK_CUR is used.
3740 start = fl->l_start;
3744 start = size + fl->l_start;
3745 off = size + fl->l_start;
3752 if (fl->l_len != 0) {
3753 end = start + fl->l_len - 1;
3764 if (op == F_GETLK) {
3765 error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3768 error = nfscl_lockt(vp, clp, off, len, fl, p, id, flags);
3770 clidrev = clp->nfsc_clientidrev;
3771 error = nfsrpc_lockt(nd, vp, clp, off, len, fl, cred,
3773 } else if (error == -1) {
3776 nfscl_clientrelease(clp);
3777 } else if (op == F_UNLCK && fl->l_type == F_UNLCK) {
3779 * We must loop around for all lockowner cases.
3782 error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3786 error = nfscl_relbytelock(vp, off, len, cred, p, callcnt,
3787 clp, id, flags, &lp, &dorpc);
3789 * If it returns a NULL lp, we're done.
3793 nfscl_clientrelease(clp);
3795 nfscl_releasealllocks(clp, vp, p, id, flags);
3798 if (nmp->nm_clp != NULL)
3799 clidrev = nmp->nm_clp->nfsc_clientidrev;
3803 * If the server doesn't support Posix lock semantics,
3804 * only allow locks on the entire file, since it won't
3805 * handle overlapping byte ranges.
3806 * There might still be a problem when a lock
3807 * upgrade/downgrade (read<->write) occurs, since the
3808 * server "might" expect an unlock first?
3810 if (dorpc && (lp->nfsl_open->nfso_posixlock ||
3811 (off == 0 && len == NFS64BITSSET))) {
3813 * Since the lock records will go away, we must
3814 * wait for grace and delay here.
3817 error = nfsrpc_locku(nd, nmp, lp, off, len,
3818 NFSV4LOCKT_READ, cred, p, 0);
3819 if ((nd->nd_repstat == NFSERR_GRACE ||
3820 nd->nd_repstat == NFSERR_DELAY) &&
3822 (void) nfs_catnap(PZERO, (int)nd->nd_repstat,
3824 } while ((nd->nd_repstat == NFSERR_GRACE ||
3825 nd->nd_repstat == NFSERR_DELAY) && error == 0);
3828 } while (error == 0 && nd->nd_repstat == 0);
3829 nfscl_releasealllocks(clp, vp, p, id, flags);
3830 } else if (op == F_SETLK) {
3831 error = nfscl_getbytelock(vp, off, len, fl->l_type, cred, p,
3832 NULL, 0, id, flags, NULL, NULL, &lp, &newone, &donelocally);
3833 if (error || donelocally) {
3836 if (nmp->nm_clp != NULL)
3837 clidrev = nmp->nm_clp->nfsc_clientidrev;
3840 nfhp = VTONFS(vp)->n_fhp;
3841 if (!lp->nfsl_open->nfso_posixlock &&
3842 (off != 0 || len != NFS64BITSSET)) {
3845 error = nfsrpc_lock(nd, nmp, vp, nfhp->nfh_fh,
3846 nfhp->nfh_len, lp, newone, reclaim, off,
3847 len, fl->l_type, cred, p, 0);
3850 error = nd->nd_repstat;
3851 nfscl_lockrelease(lp, error, newone);
3856 error = nd->nd_repstat;
3857 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
3858 error == NFSERR_STALEDONTRECOVER ||
3859 error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3860 error == NFSERR_BADSESSION) {
3861 (void) nfs_catnap(PZERO, error, "nfs_advlock");
3862 } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
3864 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
3867 } while (error == NFSERR_GRACE ||
3868 error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3869 error == NFSERR_STALEDONTRECOVER || error == NFSERR_STALESTATEID ||
3870 error == NFSERR_BADSESSION ||
3871 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
3872 expireret == 0 && clidrev != 0 && retrycnt < 4));
3873 if (error && retrycnt >= 4)
3879 * The lower level routine for the LockT case.
/*
 * nfsrpc_lockt: perform the LockT (test for lock) RPC for vp.
 *
 * Request layout, as built below: the lock type (NFSV4LOCKT_READ when
 * fl->l_type is F_RDLCK, NFSV4LOCKT_WRITE being the other value written),
 * the 64-bit offset and length, the client id taken from the MDS session,
 * and a lock owner string made of the name filled in by
 * nfscl_filllockowner(id, own, flags) followed by the file handle bytes
 * of the node.
 *
 * Reply handling by nd_repstat:
 *  - 0: no conflicting lock, fl->l_type is set to F_UNLCK.
 *  - NFSERR_DENIED: fl is filled in from the conflicting lock in the
 *    reply (l_whence = SEEK_SET, l_start, a length with NFS64BITSSET
 *    treated specially, and F_WRLCK or F_RDLCK from the returned type).
 *    l_pid is set to 0 and the conflicting lock_owner opaque is skipped
 *    with nfsm_advance() after its size is checked against
 *    0..NFSV4_OPAQUELIMIT.
 *  - NFSERR_STALECLIENTID: recovery is started for clp.
 *
 * The reply mbuf chain is freed at the end.
 */
3882 nfsrpc_lockt(struct nfsrv_descript *nd, vnode_t vp,
3883 struct nfsclclient *clp, u_int64_t off, u_int64_t len, struct flock *fl,
3884 struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3887 int error, type, size;
3888 uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
3890 struct nfsmount *nmp;
3891 struct nfsclsession *tsep;
3893 nmp = VFSTONFS(vp->v_mount);
3894 NFSCL_REQSTART(nd, NFSPROC_LOCKT, vp);
3895 NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
3896 if (fl->l_type == F_RDLCK)
3897 *tl++ = txdr_unsigned(NFSV4LOCKT_READ);
3899 *tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
3900 txdr_hyper(off, tl);
3902 txdr_hyper(len, tl);
3904 tsep = nfsmnt_mdssession(nmp);
3905 *tl++ = tsep->nfsess_clientid.lval[0];
3906 *tl = tsep->nfsess_clientid.lval[1];
3907 nfscl_filllockowner(id, own, flags);
3909 NFSBCOPY(np->n_fhp->nfh_fh, &own[NFSV4CL_LOCKNAMELEN],
3910 np->n_fhp->nfh_len);
3911 (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + np->n_fhp->nfh_len);
3912 error = nfscl_request(nd, vp, p, cred, NULL);
3915 if (nd->nd_repstat == 0) {
3916 fl->l_type = F_UNLCK;
3917 } else if (nd->nd_repstat == NFSERR_DENIED) {
3919 fl->l_whence = SEEK_SET;
3920 NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
3921 fl->l_start = fxdr_hyper(tl);
3923 len = fxdr_hyper(tl);
3925 if (len == NFS64BITSSET)
3929 type = fxdr_unsigned(int, *tl++);
3930 if (type == NFSV4LOCKT_WRITE)
3931 fl->l_type = F_WRLCK;
3933 fl->l_type = F_RDLCK;
3935 * XXX For now, I have no idea what to do with the
3936 * conflicting lock_owner, so I'll just set the pid == 0
3937 * and skip over the lock_owner.
3939 fl->l_pid = (pid_t)0;
3941 size = fxdr_unsigned(int, *tl);
3942 if (size < 0 || size > NFSV4_OPAQUELIMIT)
3945 error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
3946 } else if (nd->nd_repstat == NFSERR_STALECLIENTID)
3947 nfscl_initiate_recovery(clp);
3949 mbuf_freem(nd->nd_mrep);
3954 * Lower level function that performs the LockU RPC.
/*
 * nfsrpc_locku: perform the LockU (unlock) RPC for lock owner lp.
 *
 * The request is started against the file handle stored in the open that
 * lp belongs to (nfso_fh/nfso_fhlen). It carries the lock type, the lock
 * owner seqid, the lock stateid and the 64-bit offset and length.
 *
 * Test hook: when nfstest_outofseq is non-zero, a random subset of the
 * requests is sent with seqid + 1 instead of the current seqid.
 *
 * After the request, the lock owner seqid is advanced with
 * NFSCL_INCRSEQID(). On nd_repstat == 0 the stateid in lp is replaced by
 * the one in the reply; on NFSERR_STALESTATEID recovery is started for
 * the client that owns the open. The reply mbuf chain is freed at the end.
 *
 * NOTE(review): the statement guarded by NFSHASNFSV4N(nmp) just before the
 * stateid words, and the use made of syscred, should be confirmed.
 */
3957 nfsrpc_locku(struct nfsrv_descript *nd, struct nfsmount *nmp,
3958 struct nfscllockowner *lp, u_int64_t off, u_int64_t len,
3959 u_int32_t type, struct ucred *cred, NFSPROC_T *p, int syscred)
3964 nfscl_reqstart(nd, NFSPROC_LOCKU, nmp, lp->nfsl_open->nfso_fh,
3965 lp->nfsl_open->nfso_fhlen, NULL, NULL);
3966 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 6 * NFSX_UNSIGNED);
3967 *tl++ = txdr_unsigned(type);
3968 *tl = txdr_unsigned(lp->nfsl_seqid);
/* Testing aid: occasionally send a seqid that is one too large. */
3969 if (nfstest_outofseq &&
3970 (arc4random() % nfstest_outofseq) == 0)
3971 *tl = txdr_unsigned(lp->nfsl_seqid + 1);
3973 if (NFSHASNFSV4N(nmp))
3976 *tl++ = lp->nfsl_stateid.seqid;
3977 *tl++ = lp->nfsl_stateid.other[0];
3978 *tl++ = lp->nfsl_stateid.other[1];
3979 *tl++ = lp->nfsl_stateid.other[2];
3980 txdr_hyper(off, tl);
3982 txdr_hyper(len, tl);
3984 nd->nd_flag |= ND_USEGSSNAME;
3985 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
3986 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
3987 NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
3990 if (nd->nd_repstat == 0) {
3991 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
3992 lp->nfsl_stateid.seqid = *tl++;
3993 lp->nfsl_stateid.other[0] = *tl++;
3994 lp->nfsl_stateid.other[1] = *tl++;
3995 lp->nfsl_stateid.other[2] = *tl;
3996 } else if (nd->nd_repstat == NFSERR_STALESTATEID)
3997 nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
3999 mbuf_freem(nd->nd_mrep);
4004 * The actual Lock RPC.
/*
 * nfsrpc_lock: perform the Lock RPC for lock owner lp on file handle
 * nfhp/fhlen.
 *
 * The fixed part of the request is the lock type (NFSV4LOCKT_READ for
 * F_RDLCK, NFSV4LOCKT_WRITE being the other value written), the reclaim
 * flag and the 64-bit offset and length. Two locker forms are built below:
 *  - open-to-lock form: open owner seqid, open stateid, lock owner seqid,
 *    client id from the MDS session, and an owner string made of
 *    lp->nfsl_owner followed by the file handle bytes;
 *  - existing lock owner form: lock stateid and lock owner seqid, with
 *    the nfstest_outofseq hook occasionally sending seqid + 1.
 * NOTE(review): the choice between the two forms presumably depends on
 * newone; confirm against the full function.
 *
 * After the request both the open owner seqid and the lock owner seqid are
 * passed to NFSCL_INCRSEQID(). Reply handling by nd_repstat:
 *  - 0: the lock stateid in lp is replaced by the one in the reply;
 *  - NFSERR_DENIED: the conflicting lock description is skipped; the
 *    owner opaque length is read from the eighth word and must lie in
 *    0..NFSV4_OPAQUELIMIT before nfsm_advance() is called;
 *  - NFSERR_STALESTATEID: recovery is started for the owning client.
 *
 * The reply mbuf chain is freed at the end.
 */
4007 nfsrpc_lock(struct nfsrv_descript *nd, struct nfsmount *nmp, vnode_t vp,
4008 u_int8_t *nfhp, int fhlen, struct nfscllockowner *lp, int newone,
4009 int reclaim, u_int64_t off, u_int64_t len, short type, struct ucred *cred,
4010 NFSPROC_T *p, int syscred)
4014 uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
4015 struct nfsclsession *tsep;
4017 nfscl_reqstart(nd, NFSPROC_LOCK, nmp, nfhp, fhlen, NULL, NULL);
4018 NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
4019 if (type == F_RDLCK)
4020 *tl++ = txdr_unsigned(NFSV4LOCKT_READ);
4022 *tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
4023 *tl++ = txdr_unsigned(reclaim);
4024 txdr_hyper(off, tl);
4026 txdr_hyper(len, tl);
4030 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
4031 2 * NFSX_UNSIGNED + NFSX_HYPER);
4032 *tl++ = txdr_unsigned(lp->nfsl_open->nfso_own->nfsow_seqid);
4033 if (NFSHASNFSV4N(nmp))
4036 *tl++ = lp->nfsl_open->nfso_stateid.seqid;
4037 *tl++ = lp->nfsl_open->nfso_stateid.other[0];
4038 *tl++ = lp->nfsl_open->nfso_stateid.other[1];
4039 *tl++ = lp->nfsl_open->nfso_stateid.other[2];
4040 *tl++ = txdr_unsigned(lp->nfsl_seqid);
4041 tsep = nfsmnt_mdssession(nmp);
4042 *tl++ = tsep->nfsess_clientid.lval[0];
4043 *tl = tsep->nfsess_clientid.lval[1];
/* Owner string on the wire: lock owner name followed by the file handle. */
4044 NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
4045 NFSBCOPY(nfhp, &own[NFSV4CL_LOCKNAMELEN], fhlen);
4046 (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
4049 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + NFSX_UNSIGNED);
4050 if (NFSHASNFSV4N(nmp))
4053 *tl++ = lp->nfsl_stateid.seqid;
4054 *tl++ = lp->nfsl_stateid.other[0];
4055 *tl++ = lp->nfsl_stateid.other[1];
4056 *tl++ = lp->nfsl_stateid.other[2];
4057 *tl = txdr_unsigned(lp->nfsl_seqid);
4058 if (nfstest_outofseq &&
4059 (arc4random() % nfstest_outofseq) == 0)
4060 *tl = txdr_unsigned(lp->nfsl_seqid + 1);
4063 nd->nd_flag |= ND_USEGSSNAME;
4064 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
4065 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4069 NFSCL_INCRSEQID(lp->nfsl_open->nfso_own->nfsow_seqid, nd);
4070 NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
4071 if (nd->nd_repstat == 0) {
4072 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
4073 lp->nfsl_stateid.seqid = *tl++;
4074 lp->nfsl_stateid.other[0] = *tl++;
4075 lp->nfsl_stateid.other[1] = *tl++;
4076 lp->nfsl_stateid.other[2] = *tl;
4077 } else if (nd->nd_repstat == NFSERR_DENIED) {
4078 NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
4079 size = fxdr_unsigned(int, *(tl + 7));
4080 if (size < 0 || size > NFSV4_OPAQUELIMIT)
4083 error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
4084 } else if (nd->nd_repstat == NFSERR_STALESTATEID)
4085 nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
4087 mbuf_freem(nd->nd_mrep);
4093 * (always called with the vp for the mount point)
/*
 * nfsrpc_statfs: fetch file system statistics for the mount of vp.
 *
 * NFSv4 mounts: a Getattr asking for the NFSSTATFS_GETATTRBIT attributes
 * is sent and the reply is decoded by nfsv4_loadattr() into nap, sbp and
 * fsp. The file system id from nap->na_filesid is copied into
 * nmp->nm_fsid and NFSSETHASSETFSID() is applied to the mount.
 *
 * Other mounts: an FSSTAT RPC is sent. For NFSv3 the post-op attributes
 * are loaded into nap/attrflagp first. A non-zero nd_repstat is copied
 * into error. Otherwise NFSX_STATFS() bytes are dissected and stored in
 * sbp:
 *  - NFSv3: six 64-bit values (sf_tbytes, sf_fbytes, sf_abytes,
 *    sf_tfiles, sf_ffiles, sf_afiles) followed by sf_invarsec;
 *  - not NFSv3 and not NFSv4: five 32-bit values (sf_tsize, sf_bsize,
 *    sf_blocks, sf_bfree, sf_bavail).
 *
 * The reply mbuf chain is freed at the end.
 */
4096 nfsrpc_statfs(vnode_t vp, struct nfsstatfs *sbp, struct nfsfsinfo *fsp,
4097 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
4100 u_int32_t *tl = NULL;
4101 struct nfsrv_descript nfsd, *nd = &nfsd;
4102 struct nfsmount *nmp;
4103 nfsattrbit_t attrbits;
4107 nmp = VFSTONFS(vnode_mount(vp));
4108 if (NFSHASNFSV4(nmp)) {
4110 * For V4, you actually do a getattr.
4112 NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4113 NFSSTATFS_GETATTRBIT(&attrbits);
4114 (void) nfsrv_putattrbit(nd, &attrbits);
4115 nd->nd_flag |= ND_USEGSSNAME;
4116 error = nfscl_request(nd, vp, p, cred, stuff);
4119 if (nd->nd_repstat == 0) {
4120 error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4121 NULL, NULL, sbp, fsp, NULL, 0, NULL, NULL, NULL, p,
4124 nmp->nm_fsid[0] = nap->na_filesid[0];
4125 nmp->nm_fsid[1] = nap->na_filesid[1];
4126 NFSSETHASSETFSID(nmp);
4130 error = nd->nd_repstat;
4135 NFSCL_REQSTART(nd, NFSPROC_FSSTAT, vp);
4136 error = nfscl_request(nd, vp, p, cred, stuff);
4139 if (nd->nd_flag & ND_NFSV3) {
4140 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4144 if (nd->nd_repstat) {
4145 error = nd->nd_repstat;
4148 NFSM_DISSECT(tl, u_int32_t *,
4149 NFSX_STATFS(nd->nd_flag & ND_NFSV3));
4151 if (NFSHASNFSV3(nmp)) {
4152 sbp->sf_tbytes = fxdr_hyper(tl); tl += 2;
4153 sbp->sf_fbytes = fxdr_hyper(tl); tl += 2;
4154 sbp->sf_abytes = fxdr_hyper(tl); tl += 2;
4155 sbp->sf_tfiles = fxdr_hyper(tl); tl += 2;
4156 sbp->sf_ffiles = fxdr_hyper(tl); tl += 2;
4157 sbp->sf_afiles = fxdr_hyper(tl); tl += 2;
4158 sbp->sf_invarsec = fxdr_unsigned(u_int32_t, *tl);
4159 } else if (NFSHASNFSV4(nmp) == 0) {
4160 sbp->sf_tsize = fxdr_unsigned(u_int32_t, *tl++);
4161 sbp->sf_bsize = fxdr_unsigned(u_int32_t, *tl++);
4162 sbp->sf_blocks = fxdr_unsigned(u_int32_t, *tl++);
4163 sbp->sf_bfree = fxdr_unsigned(u_int32_t, *tl++);
4164 sbp->sf_bavail = fxdr_unsigned(u_int32_t, *tl);
4167 mbuf_freem(nd->nd_mrep);
/*
 * nfsrpc_pathconf: fetch the pathconf values for vp into pc.
 *
 * NFSv4 mounts: a Getattr asking for the NFSPATHCONF_GETATTRBIT
 * attributes is sent and nfsv4_loadattr() decodes the reply into nap and
 * pc. A failed reply status is copied into error.
 *
 * Other mounts: a PATHCONF RPC is sent, the post-op attributes are loaded
 * into nap/attrflagp, and a non-zero nd_repstat becomes the error when no
 * other error was recorded. On success NFSX_V3PATHCONF bytes are
 * dissected into pc_linkmax, pc_namemax, pc_notrunc, pc_chownrestricted,
 * pc_caseinsensitive and pc_casepreserving, in that order.
 *
 * The reply mbuf chain is freed at the end.
 */
4175 nfsrpc_pathconf(vnode_t vp, struct nfsv3_pathconf *pc,
4176 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
4179 struct nfsrv_descript nfsd, *nd = &nfsd;
4180 struct nfsmount *nmp;
4182 nfsattrbit_t attrbits;
4186 nmp = VFSTONFS(vnode_mount(vp));
4187 if (NFSHASNFSV4(nmp)) {
4189 * For V4, you actually do a getattr.
4191 NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4192 NFSPATHCONF_GETATTRBIT(&attrbits);
4193 (void) nfsrv_putattrbit(nd, &attrbits);
4194 nd->nd_flag |= ND_USEGSSNAME;
4195 error = nfscl_request(nd, vp, p, cred, stuff);
4198 if (nd->nd_repstat == 0) {
4199 error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4200 pc, NULL, NULL, NULL, NULL, 0, NULL, NULL, NULL, p,
4205 error = nd->nd_repstat;
4208 NFSCL_REQSTART(nd, NFSPROC_PATHCONF, vp);
4209 error = nfscl_request(nd, vp, p, cred, stuff);
4212 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4213 if (nd->nd_repstat && !error)
4214 error = nd->nd_repstat;
4216 NFSM_DISSECT(tl, u_int32_t *, NFSX_V3PATHCONF);
4217 pc->pc_linkmax = fxdr_unsigned(u_int32_t, *tl++);
4218 pc->pc_namemax = fxdr_unsigned(u_int32_t, *tl++);
4219 pc->pc_notrunc = fxdr_unsigned(u_int32_t, *tl++);
4220 pc->pc_chownrestricted =
4221 fxdr_unsigned(u_int32_t, *tl++);
4222 pc->pc_caseinsensitive =
4223 fxdr_unsigned(u_int32_t, *tl++);
4224 pc->pc_casepreserving = fxdr_unsigned(u_int32_t, *tl);
4228 mbuf_freem(nd->nd_mrep);
4233 * nfs version 3 fsinfo rpc call
/*
 * nfsrpc_fsinfo: perform the FSINFO RPC for vp and store the result in
 * fsp.
 *
 * The post-op attributes in the reply are loaded into nap/attrflagp, and
 * a non-zero nd_repstat becomes the error when no other error was
 * recorded. On success NFSX_V3FSINFO bytes are dissected, in order, into
 * fs_rtmax, fs_rtpref, fs_rtmult, fs_wtmax, fs_wtpref, fs_wtmult,
 * fs_dtpref (all 32-bit), fs_maxfilesize (64-bit), fs_timedelta (decoded
 * with fxdr_nfsv3time()) and fs_properties.
 *
 * The reply mbuf chain is freed at the end.
 */
4236 nfsrpc_fsinfo(vnode_t vp, struct nfsfsinfo *fsp, struct ucred *cred,
4237 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
4240 struct nfsrv_descript nfsd, *nd = &nfsd;
4244 NFSCL_REQSTART(nd, NFSPROC_FSINFO, vp);
4245 error = nfscl_request(nd, vp, p, cred, stuff);
4248 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4249 if (nd->nd_repstat && !error)
4250 error = nd->nd_repstat;
4252 NFSM_DISSECT(tl, u_int32_t *, NFSX_V3FSINFO);
4253 fsp->fs_rtmax = fxdr_unsigned(u_int32_t, *tl++);
4254 fsp->fs_rtpref = fxdr_unsigned(u_int32_t, *tl++);
4255 fsp->fs_rtmult = fxdr_unsigned(u_int32_t, *tl++);
4256 fsp->fs_wtmax = fxdr_unsigned(u_int32_t, *tl++);
4257 fsp->fs_wtpref = fxdr_unsigned(u_int32_t, *tl++);
4258 fsp->fs_wtmult = fxdr_unsigned(u_int32_t, *tl++);
4259 fsp->fs_dtpref = fxdr_unsigned(u_int32_t, *tl++);
4260 fsp->fs_maxfilesize = fxdr_hyper(tl);
4262 fxdr_nfsv3time(tl, &fsp->fs_timedelta);
4264 fsp->fs_properties = fxdr_unsigned(u_int32_t, *tl);
4267 mbuf_freem(nd->nd_mrep);
4272 * This function performs the Renew RPC.
/*
 * nfsrpc_renew: perform the Renew RPC for client clp.
 *
 * The request is started either without a session argument or with
 * &dsp->nfsclds_sess, and the same two forms exist for newnfs_request().
 * NOTE(review): the selection presumably depends on whether dsp is NULL;
 * confirm against the full function.
 *
 * When the mount is not NFSv4.1 (NFSHASNFSV4N() false) the client id from
 * the MDS session is added as the Renew argument; for NFSv4.1 only the
 * Sequence op is used. The socket comes from dsp->nfsclds_sockp, with the
 * MDS socket (&nmp->nm_sockreq) as the fallback noted below.
 *
 * The reply status nd_repstat is copied into error and the reply mbuf
 * chain is freed.
 */
4275 nfsrpc_renew(struct nfsclclient *clp, struct nfsclds *dsp, struct ucred *cred,
4279 struct nfsrv_descript nfsd;
4280 struct nfsrv_descript *nd = &nfsd;
4281 struct nfsmount *nmp;
4283 struct nfssockreq *nrp;
4284 struct nfsclsession *tsep;
4286 nmp = clp->nfsc_nmp;
4290 nfscl_reqstart(nd, NFSPROC_RENEW, nmp, NULL, 0, NULL, NULL);
4292 nfscl_reqstart(nd, NFSPROC_RENEW, nmp, NULL, 0, NULL,
4293 &dsp->nfsclds_sess);
4294 if (!NFSHASNFSV4N(nmp)) {
4295 /* NFSv4.1 just uses a Sequence Op and not a Renew. */
4296 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4297 tsep = nfsmnt_mdssession(nmp);
4298 *tl++ = tsep->nfsess_clientid.lval[0];
4299 *tl = tsep->nfsess_clientid.lval[1];
4303 nrp = dsp->nfsclds_sockp;
4305 /* If NULL, use the MDS socket. */
4306 nrp = &nmp->nm_sockreq;
4307 nd->nd_flag |= ND_USEGSSNAME;
4309 error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4310 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4312 error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4313 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
4316 error = nd->nd_repstat;
4317 mbuf_freem(nd->nd_mrep);
4322 * This function performs the Releaselockowner RPC.
/*
 * nfsrpc_rellockown: release lock owner lp on the server.
 *
 * NFSv4.1 mounts (NFSHASNFSV4N() true): a FreeStateID request is built
 * with the lock stateid from lp.
 *
 * Other mounts: a ReleaseLockOwner request is built with the client id
 * from the MDS session and an owner string made of lp->nfsl_owner
 * followed by the fhlen bytes of file handle fh.
 *
 * The reply status nd_repstat is copied into error and the reply mbuf
 * chain is freed.
 */
4325 nfsrpc_rellockown(struct nfsmount *nmp, struct nfscllockowner *lp,
4326 uint8_t *fh, int fhlen, struct ucred *cred, NFSPROC_T *p)
4328 struct nfsrv_descript nfsd, *nd = &nfsd;
4331 uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
4332 struct nfsclsession *tsep;
4334 if (NFSHASNFSV4N(nmp)) {
4335 /* For NFSv4.1, do a FreeStateID. */
4336 nfscl_reqstart(nd, NFSPROC_FREESTATEID, nmp, NULL, 0, NULL,
4338 nfsm_stateidtom(nd, &lp->nfsl_stateid, NFSSTATEID_PUTSTATEID);
4340 nfscl_reqstart(nd, NFSPROC_RELEASELCKOWN, nmp, NULL, 0, NULL,
4342 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4343 tsep = nfsmnt_mdssession(nmp);
4344 *tl++ = tsep->nfsess_clientid.lval[0];
4345 *tl = tsep->nfsess_clientid.lval[1];
4346 NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
4347 NFSBCOPY(fh, &own[NFSV4CL_LOCKNAMELEN], fhlen);
4348 (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
4350 nd->nd_flag |= ND_USEGSSNAME;
4351 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4352 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4355 error = nd->nd_repstat;
4356 mbuf_freem(nd->nd_mrep);
4361 * This function performs the Compound to get the mount pt FH.
/*
 * nfsrpc_getdirpath: get the file handle of the mount point named by
 * dirpath and store it in the mount structure.
 *
 * The compound starts with PutRootFH, adds one Lookup op per component
 * of dirpath (components are delimited by '/'), and ends with GetFH. The
 * op count saved in opcntp is patched afterwards: 2 + cnt ops, or 3 + cnt
 * for NFSv4.1 where nfscl_reqstart() has already added a Sequence op.
 *
 * On a good reply, 2 + 2 * cnt words are skipped to reach the file handle
 * length. A length that fails the range check sets nd_repstat to
 * NFSERR_BADXDR; otherwise the handle is copied into nmp->nm_fh with
 * nfsrv_mtostr() and nmp->nm_fhsize is set once that copy succeeds.
 *
 * nd_repstat is copied into error and the reply mbuf chain is freed.
 */
4364 nfsrpc_getdirpath(struct nfsmount *nmp, u_char *dirpath, struct ucred *cred,
4368 struct nfsrv_descript nfsd;
4369 struct nfsrv_descript *nd = &nfsd;
4371 int error, cnt, len, setnil;
4374 nfscl_reqstart(nd, NFSPROC_PUTROOTFH, nmp, NULL, 0, &opcntp, NULL);
4382 while (*cp2 != '\0' && *cp2 != '/')
4389 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4390 *tl = txdr_unsigned(NFSV4OP_LOOKUP);
4391 nfsm_strtom(nd, cp, strlen(cp));
4397 } while (*cp != '\0');
4398 if (NFSHASNFSV4N(nmp))
4399 /* Has a Sequence Op done by nfscl_reqstart(). */
4400 *opcntp = txdr_unsigned(3 + cnt);
4402 *opcntp = txdr_unsigned(2 + cnt);
4403 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4404 *tl = txdr_unsigned(NFSV4OP_GETFH);
4405 nd->nd_flag |= ND_USEGSSNAME;
4406 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4407 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4410 if (nd->nd_repstat == 0) {
4411 NFSM_DISSECT(tl, u_int32_t *, (3 + 2 * cnt) * NFSX_UNSIGNED);
/* Step over the per-op reply words that precede the file handle length. */
4412 tl += (2 + 2 * cnt);
4413 if ((len = fxdr_unsigned(int, *tl)) <= 0 ||
4415 nd->nd_repstat = NFSERR_BADXDR;
4417 nd->nd_repstat = nfsrv_mtostr(nd, nmp->nm_fh, len);
4418 if (nd->nd_repstat == 0)
4419 nmp->nm_fhsize = len;
4422 error = nd->nd_repstat;
4424 mbuf_freem(nd->nd_mrep);
4429 * This function performs the Delegreturn RPC.
/*
 * nfsrpc_delegreturn: perform the DelegReturn RPC for delegation dp.
 *
 * The request is started against the file handle stored in dp
 * (nfsdl_fh/nfsdl_fhlen) and carries the delegation stateid. The reply
 * status nd_repstat is copied into error and the reply mbuf chain is
 * freed.
 *
 * NOTE(review): the statement guarded by NFSHASNFSV4N(nmp) ahead of the
 * stateid seqid word, and the use made of syscred, should be confirmed.
 */
4432 nfsrpc_delegreturn(struct nfscldeleg *dp, struct ucred *cred,
4433 struct nfsmount *nmp, NFSPROC_T *p, int syscred)
4436 struct nfsrv_descript nfsd;
4437 struct nfsrv_descript *nd = &nfsd;
4440 nfscl_reqstart(nd, NFSPROC_DELEGRETURN, nmp, dp->nfsdl_fh,
4441 dp->nfsdl_fhlen, NULL, NULL);
4442 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
4443 if (NFSHASNFSV4N(nmp))
4446 *tl++ = dp->nfsdl_stateid.seqid;
4447 *tl++ = dp->nfsdl_stateid.other[0];
4448 *tl++ = dp->nfsdl_stateid.other[1];
4449 *tl = dp->nfsdl_stateid.other[2];
4451 nd->nd_flag |= ND_USEGSSNAME;
4452 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4453 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4456 error = nd->nd_repstat;
4457 mbuf_freem(nd->nd_mrep);
/*
 * nfsrpc_getacl: fetch the ACL of vp into aclp.
 *
 * Returns EOPNOTSUPP when ACL use is disabled (nfsrv_useacl == 0) or the
 * mount is not NFSv4. Otherwise a GetACL request asking only for the
 * NFSATTRBIT_ACL attribute is sent and, when the reply status is zero,
 * nfsv4_loadattr() decodes the ACL into aclp. A non-zero nd_repstat is
 * copied into error. The reply mbuf chain is freed at the end.
 */
4465 nfsrpc_getacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4466 struct acl *aclp, void *stuff)
4468 struct nfsrv_descript nfsd, *nd = &nfsd;
4470 nfsattrbit_t attrbits;
4471 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4473 if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4474 return (EOPNOTSUPP);
4475 NFSCL_REQSTART(nd, NFSPROC_GETACL, vp);
4476 NFSZERO_ATTRBIT(&attrbits);
4477 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4478 (void) nfsrv_putattrbit(nd, &attrbits);
4479 error = nfscl_request(nd, vp, p, cred, stuff);
4482 if (!nd->nd_repstat)
4483 error = nfsv4_loadattr(nd, vp, NULL, NULL, NULL, 0, NULL,
4484 NULL, NULL, NULL, aclp, 0, NULL, NULL, NULL, p, cred);
4486 error = nd->nd_repstat;
4487 mbuf_freem(nd->nd_mrep);
/*
 * nfsrpc_setacl: set the ACL of vp from aclp.
 *
 * Returns EOPNOTSUPP when ACL use is disabled (nfsrv_useacl == 0) or the
 * mount is not NFSv4. Otherwise the work is handed to nfsrpc_setattr()
 * with a NULL attribute argument and aclp, and its result is stored in
 * error.
 */
4495 nfsrpc_setacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4496 struct acl *aclp, void *stuff)
4499 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4501 if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4502 return (EOPNOTSUPP);
4503 error = nfsrpc_setattr(vp, NULL, aclp, cred, p, NULL, NULL, stuff);
/*
 * nfsrpc_setaclrpc: the RPC that sets the ACL of vp, using stateidp.
 *
 * Returns EOPNOTSUPP when the mount is not NFSv4. Otherwise a SetACL
 * request is built from the stateid and an attribute set holding only
 * NFSATTRBIT_ACL, filled in from aclp by nfsv4_fillattr(). The pre/post-op
 * attributes in the reply are ignored: the reply mbuf chain is freed and
 * nd_repstat is returned.
 */
4511 nfsrpc_setaclrpc(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4512 struct acl *aclp, nfsv4stateid_t *stateidp, void *stuff)
4514 struct nfsrv_descript nfsd, *nd = &nfsd;
4516 nfsattrbit_t attrbits;
4517 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4519 if (!NFSHASNFSV4(nmp))
4520 return (EOPNOTSUPP);
4521 NFSCL_REQSTART(nd, NFSPROC_SETACL, vp);
4522 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
4523 NFSZERO_ATTRBIT(&attrbits);
4524 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4525 (void) nfsv4_fillattr(nd, vnode_mount(vp), vp, aclp, NULL, NULL, 0,
4526 &attrbits, NULL, NULL, 0, 0, 0, 0, (uint64_t)0);
4527 error = nfscl_request(nd, vp, p, cred, stuff);
4530 /* Don't care about the pre/postop attributes */
4531 mbuf_freem(nd->nd_mrep);
4532 return (nd->nd_repstat);
4536 * Do the NFSv4.1 Exchange ID.
/*
 * nfsrpc_exchangeid: perform the NFSv4.1 ExchangeID op over socket nrp.
 *
 * Request: the client owner is two words (nfsboottime.tv_sec and
 * clp->nfsc_rev) followed by the client id string clp->nfsc_id. Then come
 * exchflags, NFSV4EXCH_SP4NONE for state protection, and one
 * implementation id made of the domain "freebsd.org", the kernel version
 * string and a fixed date.
 *
 * Reply (nd_repstat == 0): the server owner length is read from the
 * eighth dissected word and rejected with NFSERR_BADXDR unless it lies in
 * 0..NFSV4_OPAQUELIMIT. A struct nfsclds with len + 1 extra bytes is then
 * allocated and filled in with the expiry time, the server owner length,
 * the client id and the sequence id from the reply. The returned flags
 * select the roles:
 *  - NFSV4EXCH_USEPNFSMDS together with the pNFS mount option sets
 *    NFSSTA_PNFS in nmp->nm_state; NFSCLDS_MDS is set in nfsclds_flags;
 *  - NFSV4EXCH_USEPNFSDS sets NFSCLDS_DS.
 * The server owner is copied with nfsrv_mtostr(); when that succeeds the
 * two mutexes and the session slots are initialized.
 * NOTE(review): dsp is presumably handed back through dspp on success and
 * freed otherwise; confirm against the full function.
 *
 * nd_repstat is copied into error and the reply mbuf chain is freed.
 */
4539 nfsrpc_exchangeid(struct nfsmount *nmp, struct nfsclclient *clp,
4540 struct nfssockreq *nrp, uint32_t exchflags, struct nfsclds **dspp,
4541 struct ucred *cred, NFSPROC_T *p)
4543 uint32_t *tl, v41flags;
4544 struct nfsrv_descript nfsd;
4545 struct nfsrv_descript *nd = &nfsd;
4546 struct nfsclds *dsp;
4547 struct timespec verstime;
4551 nfscl_reqstart(nd, NFSPROC_EXCHANGEID, nmp, NULL, 0, NULL, NULL);
4552 NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4553 *tl++ = txdr_unsigned(nfsboottime.tv_sec); /* Client owner */
4554 *tl = txdr_unsigned(clp->nfsc_rev);
4555 (void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
4557 NFSM_BUILD(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4558 *tl++ = txdr_unsigned(exchflags);
4559 *tl++ = txdr_unsigned(NFSV4EXCH_SP4NONE);
4561 /* Set the implementation id4 */
4562 *tl = txdr_unsigned(1);
4563 (void) nfsm_strtom(nd, "freebsd.org", strlen("freebsd.org"));
4564 (void) nfsm_strtom(nd, version, strlen(version));
4565 NFSM_BUILD(tl, uint32_t *, NFSX_V4TIME);
4566 verstime.tv_sec = 1293840000; /* Jan 1, 2011 */
4567 verstime.tv_nsec = 0;
4568 txdr_nfsv4time(&verstime, tl);
4569 nd->nd_flag |= ND_USEGSSNAME;
4570 error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4571 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4572 NFSCL_DEBUG(1, "exchangeid err=%d reps=%d\n", error,
4573 (int)nd->nd_repstat);
4576 if (nd->nd_repstat == 0) {
4577 NFSM_DISSECT(tl, uint32_t *, 6 * NFSX_UNSIGNED + NFSX_HYPER);
/* The server owner length is the last of the eight words dissected. */
4578 len = fxdr_unsigned(int, *(tl + 7));
4579 if (len < 0 || len > NFSV4_OPAQUELIMIT) {
4580 error = NFSERR_BADXDR;
4583 dsp = malloc(sizeof(struct nfsclds) + len + 1, M_NFSCLDS,
4585 dsp->nfsclds_expire = NFSD_MONOSEC + clp->nfsc_renew;
4586 dsp->nfsclds_servownlen = len;
4587 dsp->nfsclds_sess.nfsess_clientid.lval[0] = *tl++;
4588 dsp->nfsclds_sess.nfsess_clientid.lval[1] = *tl++;
4589 dsp->nfsclds_sess.nfsess_sequenceid =
4590 fxdr_unsigned(uint32_t, *tl++);
4591 v41flags = fxdr_unsigned(uint32_t, *tl);
4592 if ((v41flags & NFSV4EXCH_USEPNFSMDS) != 0 &&
4593 NFSHASPNFSOPT(nmp)) {
4594 NFSCL_DEBUG(1, "set PNFS\n");
4596 nmp->nm_state |= NFSSTA_PNFS;
4598 dsp->nfsclds_flags |= NFSCLDS_MDS;
4600 if ((v41flags & NFSV4EXCH_USEPNFSDS) != 0)
4601 dsp->nfsclds_flags |= NFSCLDS_DS;
4603 nd->nd_repstat = nfsrv_mtostr(nd,
4604 dsp->nfsclds_serverown, len);
4605 if (nd->nd_repstat == 0) {
4606 mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
4607 mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession",
4609 nfscl_initsessionslots(&dsp->nfsclds_sess);
4612 free(dsp, M_NFSCLDS);
4614 error = nd->nd_repstat;
4616 mbuf_freem(nd->nd_mrep);
4621 * Do the NFSv4.1 Create Session.
/*
 * nfsrpc_createsession: perform the NFSv4.1 CreateSession op over socket
 * nrp and record the result in session sep.
 *
 * Request: the client id from sep, sequenceid, and the create flags.
 * NFSV4CRSESS_PERSIST is requested unless the mount is read-only, and
 * NFSV4CRSESS_CONNBACKCHAN is added when callbacks are enabled
 * (nfscl_enablecallb != 0), at least one callback daemon is running
 * (nfs_numnfscbd > 0) and mds is non-zero. The fore and back channel
 * attributes use the fixed limits listed beside each word below, followed
 * by the callback program number and a single AUTH_SYS credential with
 * uid and gid 0.
 *
 * Reply (nd_repstat == 0): the session id and sequence id are stored in
 * sep. When the server granted NFSV4CRSESS_PERSIST and mds is non-zero,
 * NFSSTA_SESSPERSIST is set in nmp->nm_state. From the fore channel
 * attributes nfsess_maxcache and nfsess_foreslots are kept, the rdma ird
 * words are stepped over, and nfsess_backslots is taken from the back
 * channel attributes.
 *
 * nd_repstat is copied into error and the reply mbuf chain is freed.
 */
4624 nfsrpc_createsession(struct nfsmount *nmp, struct nfsclsession *sep,
4625 struct nfssockreq *nrp, uint32_t sequenceid, int mds, struct ucred *cred,
4628 uint32_t crflags, *tl;
4629 struct nfsrv_descript nfsd;
4630 struct nfsrv_descript *nd = &nfsd;
4633 nfscl_reqstart(nd, NFSPROC_CREATESESSION, nmp, NULL, 0, NULL, NULL);
4634 NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
4635 *tl++ = sep->nfsess_clientid.lval[0];
4636 *tl++ = sep->nfsess_clientid.lval[1];
4637 *tl++ = txdr_unsigned(sequenceid);
4638 crflags = (NFSMNT_RDONLY(nmp->nm_mountp) ? 0 : NFSV4CRSESS_PERSIST);
4639 if (nfscl_enablecallb != 0 && nfs_numnfscbd > 0 && mds != 0)
4640 crflags |= NFSV4CRSESS_CONNBACKCHAN;
4641 *tl = txdr_unsigned(crflags);
4643 /* Fill in fore channel attributes. */
4644 NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4645 *tl++ = 0; /* Header pad size */
4646 *tl++ = txdr_unsigned(100000); /* Max request size */
4647 *tl++ = txdr_unsigned(100000); /* Max response size */
4648 *tl++ = txdr_unsigned(4096); /* Max response size cached */
4649 *tl++ = txdr_unsigned(20); /* Max operations */
4650 *tl++ = txdr_unsigned(64); /* Max slots */
4651 *tl = 0; /* No rdma ird */
4653 /* Fill in back channel attributes. */
4654 NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4655 *tl++ = 0; /* Header pad size */
4656 *tl++ = txdr_unsigned(10000); /* Max request size */
4657 *tl++ = txdr_unsigned(10000); /* Max response size */
4658 *tl++ = txdr_unsigned(4096); /* Max response size cached */
4659 *tl++ = txdr_unsigned(4); /* Max operations */
4660 *tl++ = txdr_unsigned(NFSV4_CBSLOTS); /* Max slots */
4661 *tl = 0; /* No rdma ird */
4663 NFSM_BUILD(tl, uint32_t *, 8 * NFSX_UNSIGNED);
4664 *tl++ = txdr_unsigned(NFS_CALLBCKPROG); /* Call back prog # */
4666 /* Allow AUTH_SYS callbacks as uid, gid == 0. */
4667 *tl++ = txdr_unsigned(1); /* Auth_sys only */
4668 *tl++ = txdr_unsigned(AUTH_SYS); /* AUTH_SYS type */
4669 *tl++ = txdr_unsigned(nfsboottime.tv_sec); /* time stamp */
4670 *tl++ = 0; /* Null machine name */
4671 *tl++ = 0; /* Uid == 0 */
4672 *tl++ = 0; /* Gid == 0 */
4673 *tl = 0; /* No additional gids */
4674 nd->nd_flag |= ND_USEGSSNAME;
4675 error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred, NFS_PROG,
4676 NFS_VER4, NULL, 1, NULL, NULL);
4679 if (nd->nd_repstat == 0) {
4680 NFSM_DISSECT(tl, uint32_t *, NFSX_V4SESSIONID +
4682 bcopy(tl, sep->nfsess_sessionid, NFSX_V4SESSIONID);
4683 tl += NFSX_V4SESSIONID / NFSX_UNSIGNED;
4684 sep->nfsess_sequenceid = fxdr_unsigned(uint32_t, *tl++);
4685 crflags = fxdr_unsigned(uint32_t, *tl);
4686 if ((crflags & NFSV4CRSESS_PERSIST) != 0 && mds != 0) {
4688 nmp->nm_state |= NFSSTA_SESSPERSIST;
4692 /* Get the fore channel slot count. */
4693 NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4694 tl += 3; /* Skip the other counts. */
4695 sep->nfsess_maxcache = fxdr_unsigned(int, *tl++);
4697 sep->nfsess_foreslots = fxdr_unsigned(uint16_t, *tl++);
4698 NFSCL_DEBUG(4, "fore slots=%d\n", (int)sep->nfsess_foreslots);
/*
 * NOTE(review): irdcnt is taken from the reply and sizes the dissect
 * below; confirm that it is range checked before that use.
 */
4699 irdcnt = fxdr_unsigned(int, *tl);
4701 NFSM_DISSECT(tl, uint32_t *, irdcnt * NFSX_UNSIGNED);
4703 /* and the back channel slot count. */
4704 NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4706 sep->nfsess_backslots = fxdr_unsigned(uint16_t, *tl);
4707 NFSCL_DEBUG(4, "back slots=%d\n", (int)sep->nfsess_backslots);
4709 error = nd->nd_repstat;
4711 mbuf_freem(nd->nd_mrep);
4716 * Do the NFSv4.1 Destroy Session.
/*
 * nfsrpc_destroysession: perform the NFSv4.1 DestroySession op.
 *
 * The only argument sent is the session id of the MDS session of nmp.
 * The reply status nd_repstat is copied into error and the reply mbuf
 * chain is freed.
 */
4719 nfsrpc_destroysession(struct nfsmount *nmp, struct nfsclclient *clp,
4720 struct ucred *cred, NFSPROC_T *p)
4723 struct nfsrv_descript nfsd;
4724 struct nfsrv_descript *nd = &nfsd;
4726 struct nfsclsession *tsep;
4728 nfscl_reqstart(nd, NFSPROC_DESTROYSESSION, nmp, NULL, 0, NULL, NULL);
4729 NFSM_BUILD(tl, uint32_t *, NFSX_V4SESSIONID);
4730 tsep = nfsmnt_mdssession(nmp);
4731 bcopy(tsep->nfsess_sessionid, tl, NFSX_V4SESSIONID);
4732 nd->nd_flag |= ND_USEGSSNAME;
4733 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4734 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4737 error = nd->nd_repstat;
4738 mbuf_freem(nd->nd_mrep);
4743 * Do the NFSv4.1 Destroy Client.
/*
 * nfsrpc_destroyclient: perform the NFSv4.1 DestroyClient op.
 *
 * The only argument sent is the two word client id of the MDS session of
 * nmp. The reply status nd_repstat is copied into error and the reply
 * mbuf chain is freed.
 */
4746 nfsrpc_destroyclient(struct nfsmount *nmp, struct nfsclclient *clp,
4747 struct ucred *cred, NFSPROC_T *p)
4750 struct nfsrv_descript nfsd;
4751 struct nfsrv_descript *nd = &nfsd;
4753 struct nfsclsession *tsep;
4755 nfscl_reqstart(nd, NFSPROC_DESTROYCLIENT, nmp, NULL, 0, NULL, NULL);
4756 NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4757 tsep = nfsmnt_mdssession(nmp);
4758 *tl++ = tsep->nfsess_clientid.lval[0];
4759 *tl = tsep->nfsess_clientid.lval[1];
4760 nd->nd_flag |= ND_USEGSSNAME;
4761 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4762 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4765 error = nd->nd_repstat;
4766 mbuf_freem(nd->nd_mrep);
4771 * Do the NFSv4.1 LayoutGet.
/*
 * nfsrpc_layoutget: issue an NFSPROC_LAYOUTGET request for the file handle
 * fhp/fhlen and decode the file layouts in the reply.
 *
 * Request: the layout type is always NFSLAYOUT_NFSV4_1_FILES; iomode,
 * offset, len, minlen, the stateid in *stateidp and layoutlen are
 * XDR-encoded in that order.
 *
 * Reply (when nd_repstat == 0): *stateidp is overwritten with the stateid
 * returned by the server and each layout segment is decoded into a
 * struct nfsclflayout.  A segment whose iomode equals gotiomode is linked
 * onto flhp so that the list stays in increasing nfsfl_off order; any
 * other segment is reported with printf() and freed.
 *
 * Limits enforced on the reply: 1..10000 layout segments, 0..100 file
 * handles per segment and file handle lengths of 1..NFSX_V4FHMAX bytes.
 * A violation, a non-files layout type or an inconsistent file handle
 * count sets error to NFSERR_BADXDR.
 *
 * NOTE(review): gotiomode is assumed to start at -1 so that it latches the
 * iomode of the first decoded segment; the initialisation is not among the
 * statements shown - confirm.
 * NOTE(review): *retonclosep is printed by a debug statement below, so it
 * is presumably filled in from the reply - confirm.
 */
4774 nfsrpc_layoutget(struct nfsmount *nmp, uint8_t *fhp, int fhlen, int iomode,
4775 uint64_t offset, uint64_t len, uint64_t minlen, int layoutlen,
4776 nfsv4stateid_t *stateidp, int *retonclosep, struct nfsclflayouthead *flhp,
4777 struct ucred *cred, NFSPROC_T *p, void *stuff)
4780 struct nfsrv_descript nfsd, *nd = &nfsd;
4782 struct nfsclflayout *flp, *prevflp, *tflp;
4783 int cnt, error, gotiomode, fhcnt, nfhlen, i, j;
4789 nfscl_reqstart(nd, NFSPROC_LAYOUTGET, nmp, fhp, fhlen, NULL, NULL);
4790 NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
4792 *tl++ = newnfs_false; /* Don't signal availability. */
4793 *tl++ = txdr_unsigned(NFSLAYOUT_NFSV4_1_FILES);
4794 *tl++ = txdr_unsigned(iomode);
4795 txdr_hyper(offset, tl);
4797 txdr_hyper(len, tl);
4799 txdr_hyper(minlen, tl);
4801 *tl++ = txdr_unsigned(stateidp->seqid);
4802 NFSCL_DEBUG(4, "layget seq=%d\n", (int)stateidp->seqid);
4803 *tl++ = stateidp->other[0];
4804 *tl++ = stateidp->other[1];
4805 *tl++ = stateidp->other[2];
4806 *tl = txdr_unsigned(layoutlen);
4807 nd->nd_flag |= ND_USEGSSNAME;
4808 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4809 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4812 if (nd->nd_repstat == 0) {
/* Reply header: two words plus a stateid; the last word is the count. */
4813 NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_STATEID);
4818 stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
4819 NFSCL_DEBUG(4, "retoncls=%d stseq=%d\n", *retonclosep,
4820 (int)stateidp->seqid);
4821 stateidp->other[0] = *tl++;
4822 stateidp->other[1] = *tl++;
4823 stateidp->other[2] = *tl++;
4824 cnt = fxdr_unsigned(int, *tl);
4825 NFSCL_DEBUG(4, "layg cnt=%d\n", cnt);
4826 if (cnt <= 0 || cnt > 10000) {
4827 /* Don't accept more than 10000 layouts in reply. */
4828 error = NFSERR_BADXDR;
4831 for (i = 0; i < cnt; i++) {
4832 /* Dissect all the way to the file handle cnt. */
4833 NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_HYPER +
4834 6 * NFSX_UNSIGNED + NFSX_V4DEVICEID);
/* Peek ahead at the file handle count so flp can be sized below. */
4835 fhcnt = fxdr_unsigned(int, *(tl + 11 +
4836 NFSX_V4DEVICEID / NFSX_UNSIGNED));
4837 NFSCL_DEBUG(4, "fhcnt=%d\n", fhcnt);
4838 if (fhcnt < 0 || fhcnt > 100) {
4839 /* Don't accept more than 100 file handles. */
4840 error = NFSERR_BADXDR;
4844 flp = malloc(sizeof(*flp) + (fhcnt - 1) *
4845 sizeof(struct nfsfh *),
4846 M_NFSFLAYOUT, M_WAITOK);
4848 flp = malloc(sizeof(*flp),
4849 M_NFSFLAYOUT, M_WAITOK);
4850 flp->nfsfl_flags = 0;
4851 flp->nfsfl_fhcnt = 0;
4852 flp->nfsfl_devp = NULL;
4853 flp->nfsfl_off = fxdr_hyper(tl); tl += 2;
4854 retlen = fxdr_hyper(tl); tl += 2;
/* True when nfsfl_off + retlen wrapped around 64 bits. */
4855 if (flp->nfsfl_off + retlen < flp->nfsfl_off)
4856 flp->nfsfl_end = UINT64_MAX - flp->nfsfl_off;
4858 flp->nfsfl_end = flp->nfsfl_off + retlen;
4859 flp->nfsfl_iomode = fxdr_unsigned(int, *tl++);
4860 if (gotiomode == -1)
4861 gotiomode = flp->nfsfl_iomode;
4862 NFSCL_DEBUG(4, "layg reqiom=%d retiom=%d\n", iomode,
4863 (int)flp->nfsfl_iomode);
4864 if (fxdr_unsigned(int, *tl++) !=
4865 NFSLAYOUT_NFSV4_1_FILES) {
4866 printf("NFSv4.1: got non-files layout\n");
4867 error = NFSERR_BADXDR;
4870 NFSBCOPY(++tl, flp->nfsfl_dev, NFSX_V4DEVICEID);
4871 tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4872 flp->nfsfl_util = fxdr_unsigned(uint32_t, *tl++);
4873 NFSCL_DEBUG(4, "flutil=0x%x\n", flp->nfsfl_util);
4874 flp->nfsfl_stripe1 = fxdr_unsigned(uint32_t, *tl++);
4875 flp->nfsfl_patoff = fxdr_hyper(tl); tl += 2;
/* Cross-check against the count that was peeked at above. */
4876 if (fxdr_unsigned(int, *tl) != fhcnt) {
4877 printf("EEK! bad fhcnt\n");
4878 error = NFSERR_BADXDR;
4881 for (j = 0; j < fhcnt; j++) {
4882 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4883 nfhlen = fxdr_unsigned(int, *tl);
4884 if (nfhlen <= 0 || nfhlen > NFSX_V4FHMAX) {
4885 error = NFSERR_BADXDR;
4888 nfhp = malloc(sizeof(*nfhp) + nfhlen - 1,
4890 flp->nfsfl_fh[j] = nfhp;
4892 nfhp->nfh_len = nfhlen;
4893 NFSM_DISSECT(cp, uint8_t *, NFSM_RNDUP(nfhlen));
4894 NFSBCOPY(cp, nfhp->nfh_fh, nfhlen);
4896 if (flp->nfsfl_iomode == gotiomode) {
4897 /* Keep the list in increasing offset order. */
4898 tflp = LIST_FIRST(flhp);
4900 while (tflp != NULL &&
4901 tflp->nfsfl_off < flp->nfsfl_off) {
4903 tflp = LIST_NEXT(tflp, nfsfl_list);
4905 if (prevflp == NULL)
4906 LIST_INSERT_HEAD(flhp, flp, nfsfl_list);
4908 LIST_INSERT_AFTER(prevflp, flp,
4911 printf("nfscl_layoutget(): got wrong iomode\n");
4912 nfscl_freeflayout(flp);
4917 if (nd->nd_repstat != 0 && error == 0)
4918 error = nd->nd_repstat;
/* A segment still held in flp when an error occurred is released here. */
4920 if (error != 0 && flp != NULL)
4921 nfscl_freeflayout(flp);
4922 mbuf_freem(nd->nd_mrep);
4927 * Do the NFSv4.1 Get Device Info.
/*
 * nfsrpc_getdeviceinfo: issue an NFSPROC_GETDEVICEINFO request for deviceid
 * and build a struct nfscldevinfo from the reply.
 *
 * Request: the device ID, layouttype, the fixed value 100000
 * (NOTE(review): presumably the maximum reply size - confirm against the
 * protocol definition) and a notification bitmap.  The bitmap holds one
 * word containing *notifybitsp when notifybitsp is non-NULL and the value
 * is non-zero; otherwise its length is encoded as 0.
 *
 * Reply: the stripe count (accepted range 1..4096) and the address count
 * (accepted range 1..128) are read first so that the nfscldevinfo can be
 * allocated with room for the stripe indices and one struct nfsclds
 * pointer per address.  Every stripe index must be less than addrcnt.
 * For each address list a position is picked with arc4random(), the
 * entries are decoded with nfsv4_getipaddr() and nfsrpc_fillsa() is called
 * for a selected non-UDP address, taking the address family of
 * nmp->nm_nam into account.  Out-of-range values set error to
 * NFSERR_BADXDR.
 *
 * If error is non-zero at the end and ndi is non-NULL, the structure is
 * released with nfscl_freedevinfo().
 * NOTE(review): no assignment through ndip appears in the statements
 * shown; presumably *ndip receives ndi on success - confirm.
 */
4930 nfsrpc_getdeviceinfo(struct nfsmount *nmp, uint8_t *deviceid, int layouttype,
4931 uint32_t *notifybitsp, struct nfscldevinfo **ndip, struct ucred *cred,
4935 struct nfsrv_descript nfsd;
4936 struct nfsrv_descript *nd = &nfsd;
4937 struct sockaddr_storage ss;
4938 struct nfsclds *dsp = NULL, **dspp;
4939 struct nfscldevinfo *ndi;
4940 int addrcnt, bitcnt, error, i, isudp, j, pos, safilled, stripecnt;
4941 uint8_t stripeindex;
4945 nfscl_reqstart(nd, NFSPROC_GETDEVICEINFO, nmp, NULL, 0, NULL, NULL);
4946 NFSM_BUILD(tl, uint32_t *, NFSX_V4DEVICEID + 3 * NFSX_UNSIGNED);
4947 NFSBCOPY(deviceid, tl, NFSX_V4DEVICEID);
4948 tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4949 *tl++ = txdr_unsigned(layouttype);
4950 *tl++ = txdr_unsigned(100000);
4951 if (notifybitsp != NULL && *notifybitsp != 0) {
4952 *tl = txdr_unsigned(1); /* One word of bits. */
4953 NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
4954 *tl = txdr_unsigned(*notifybitsp);
4956 *tl = txdr_unsigned(0);
4957 nd->nd_flag |= ND_USEGSSNAME;
4958 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4959 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4962 if (nd->nd_repstat == 0) {
4963 NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4964 if (layouttype != fxdr_unsigned(int, *tl++))
4965 printf("EEK! devinfo layout type not same!\n");
/* The pre-increment skips one reply word before the stripe count. */
4966 stripecnt = fxdr_unsigned(int, *++tl);
4967 NFSCL_DEBUG(4, "stripecnt=%d\n", stripecnt);
4968 if (stripecnt < 1 || stripecnt > 4096) {
4969 printf("NFS devinfo stripecnt %d: out of range\n",
4971 error = NFSERR_BADXDR;
/* Fetch all stripe indices plus the address count that follows them. */
4974 NFSM_DISSECT(tl, uint32_t *, (stripecnt + 1) * NFSX_UNSIGNED);
4975 addrcnt = fxdr_unsigned(int, *(tl + stripecnt));
4976 NFSCL_DEBUG(4, "addrcnt=%d\n", addrcnt);
4977 if (addrcnt < 1 || addrcnt > 128) {
4978 printf("NFS devinfo addrcnt %d: out of range\n",
4980 error = NFSERR_BADXDR;
4985 * Now we know how many stripe indices and addresses, so
4986 * we can allocate the structure the correct size.
4988 i = (stripecnt * sizeof(uint8_t)) / sizeof(struct nfsclds *)
4990 NFSCL_DEBUG(4, "stripeindices=%d\n", i);
4991 ndi = malloc(sizeof(*ndi) + (addrcnt + i) *
4992 sizeof(struct nfsclds *), M_NFSDEVINFO, M_WAITOK | M_ZERO);
4993 NFSBCOPY(deviceid, ndi->nfsdi_deviceid, NFSX_V4DEVICEID);
4994 ndi->nfsdi_refcnt = 0;
4995 ndi->nfsdi_stripecnt = stripecnt;
4996 ndi->nfsdi_addrcnt = addrcnt;
4997 /* Fill in the stripe indices. */
4998 for (i = 0; i < stripecnt; i++) {
/* NOTE(review): each 32-bit reply word is narrowed to uint8_t here. */
4999 stripeindex = fxdr_unsigned(uint8_t, *tl++);
5000 NFSCL_DEBUG(4, "stripeind=%d\n", stripeindex);
5001 if (stripeindex >= addrcnt) {
5002 printf("NFS devinfo stripeindex %d: too big\n",
5004 error = NFSERR_BADXDR;
5007 nfsfldi_setstripeindex(ndi, i, stripeindex);
5010 /* Now, dissect the server address(es). */
5012 for (i = 0; i < addrcnt; i++) {
5013 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5014 cnt = fxdr_unsigned(uint32_t, *tl);
5016 printf("NFS devinfo 0 len addrlist\n");
5017 error = NFSERR_BADXDR;
5020 dspp = nfsfldi_addr(ndi, i);
5021 pos = arc4random() % cnt; /* Choose one. */
5023 for (j = 0; j < cnt; j++) {
5024 error = nfsv4_getipaddr(nd, &ss, &isudp);
/* EPERM from nfsv4_getipaddr() is tolerated; other errors end parsing. */
5025 if (error != 0 && error != EPERM) {
5026 error = NFSERR_BADXDR;
5029 if (error == 0 && isudp == 0) {
5032 * - use "pos" entry if it is of the
5033 * same af_family or none of them
5034 * is of the same af_family
5036 * - use the first one of the same
5039 if ((safilled == 0 && ss.ss_family ==
5040 nmp->nm_nam->sa_family) ||
5042 (safilled == 0 || ss.ss_family ==
5043 nmp->nm_nam->sa_family)) ||
5044 (safilled == 1 && ss.ss_family ==
5045 nmp->nm_nam->sa_family)) {
5046 error = nfsrpc_fillsa(nmp, &ss,
5051 nmp->nm_nam->sa_family)
5063 /* And the notify bits. */
5064 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5065 if (safilled != 0) {
5066 bitcnt = fxdr_unsigned(int, *tl);
5068 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5069 if (notifybitsp != NULL)
5071 fxdr_unsigned(uint32_t, *tl);
5077 if (nd->nd_repstat != 0)
5078 error = nd->nd_repstat;
5080 if (error != 0 && ndi != NULL)
5081 nfscl_freedevinfo(ndi);
5082 mbuf_freem(nd->nd_mrep);
5087 * Do the NFSv4.1 LayoutCommit.
/*
 * nfsrpc_layoutcommit: issue an NFSPROC_LAYOUTCOMMIT request for the file
 * handle fh/fhlen.
 *
 * Encoded in order: off, len, a boolean word, the stateid in *stateidp,
 * newnfs_true followed by lastbyte, newnfs_false, layouttype and
 * layoutupdatecnt.  lastbyte is clamped to off + len - 1 when it is
 * >= off + len.  When layoutupdatecnt > 0, that many bytes from layp are
 * appended in a buffer rounded up with NFSM_RNDUP(); a KASSERT requires
 * that layouttype is not NFSLAYOUT_NFSV4_1_FILES in that case.
 *
 * The statements shown set error from nd->nd_repstat and free the reply
 * mbuf chain.
 * NOTE(review): the boolean word after len presumably reflects the reclaim
 * argument; the test that selects true or false is not among the
 * statements shown - confirm.
 */
5090 nfsrpc_layoutcommit(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
5091 uint64_t off, uint64_t len, uint64_t lastbyte, nfsv4stateid_t *stateidp,
5092 int layouttype, int layoutupdatecnt, uint8_t *layp, struct ucred *cred,
5093 NFSPROC_T *p, void *stuff)
5096 struct nfsrv_descript nfsd, *nd = &nfsd;
5097 int error, outcnt, i;
5100 nfscl_reqstart(nd, NFSPROC_LAYOUTCOMMIT, nmp, fh, fhlen, NULL, NULL);
5101 NFSM_BUILD(tl, uint32_t *, 5 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
5103 txdr_hyper(off, tl);
5105 txdr_hyper(len, tl);
5108 *tl++ = newnfs_true;
5110 *tl++ = newnfs_false;
5111 *tl++ = txdr_unsigned(stateidp->seqid);
5112 *tl++ = stateidp->other[0];
5113 *tl++ = stateidp->other[1];
5114 *tl++ = stateidp->other[2];
5115 *tl++ = newnfs_true;
/* Keep the reported last byte inside the committed range. */
5118 else if (lastbyte >= (off + len))
5119 lastbyte = off + len - 1;
5120 txdr_hyper(lastbyte, tl);
5122 *tl++ = newnfs_false;
5123 *tl++ = txdr_unsigned(layouttype);
5124 *tl = txdr_unsigned(layoutupdatecnt);
5125 if (layoutupdatecnt > 0) {
5126 KASSERT(layouttype != NFSLAYOUT_NFSV4_1_FILES,
5127 ("Must be nil for Files Layout"));
/* outcnt is layoutupdatecnt rounded up by NFSM_RNDUP(). */
5128 outcnt = NFSM_RNDUP(layoutupdatecnt);
5129 NFSM_BUILD(cp, uint8_t *, outcnt);
5130 NFSBCOPY(layp, cp, layoutupdatecnt);
5131 cp += layoutupdatecnt;
5132 for (i = 0; i < (outcnt - layoutupdatecnt); i++)
5135 nd->nd_flag |= ND_USEGSSNAME;
5136 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5137 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5140 error = nd->nd_repstat;
5141 mbuf_freem(nd->nd_mrep);
5146 * Do the NFSv4.1 LayoutReturn.
/*
 * nfsrpc_layoutreturn: issue an NFSPROC_LAYOUTRETURN request for the file
 * handle fh/fhlen.
 *
 * Encoded in order: a boolean word, layouttype, iomode and layoutreturn.
 * When layoutreturn == NFSLAYOUTRETURN_FILE the request also carries
 * offset, len, the stateid in *stateidp and layoutcnt, followed by
 * layoutcnt bytes from layp in a buffer rounded up with NFSM_RNDUP() when
 * layoutcnt > 0.
 *
 * When nd_repstat == 0 one word is dissected from the reply and a stateid
 * is read into *stateidp.
 * NOTE(review): the boolean word presumably reflects the reclaim argument,
 * and the stateid is presumably read only when the dissected word is
 * non-zero; neither test is among the statements shown - confirm.
 */
5149 nfsrpc_layoutreturn(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
5150 int layouttype, uint32_t iomode, int layoutreturn, uint64_t offset,
5151 uint64_t len, nfsv4stateid_t *stateidp, int layoutcnt, uint32_t *layp,
5152 struct ucred *cred, NFSPROC_T *p, void *stuff)
5155 struct nfsrv_descript nfsd, *nd = &nfsd;
5156 int error, outcnt, i;
5159 nfscl_reqstart(nd, NFSPROC_LAYOUTRETURN, nmp, fh, fhlen, NULL, NULL);
5160 NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
5162 *tl++ = newnfs_true;
5164 *tl++ = newnfs_false;
5165 *tl++ = txdr_unsigned(layouttype);
5166 *tl++ = txdr_unsigned(iomode);
5167 *tl = txdr_unsigned(layoutreturn);
/* Only a per-file return carries a byte range, stateid and body. */
5168 if (layoutreturn == NFSLAYOUTRETURN_FILE) {
5169 NFSM_BUILD(tl, uint32_t *, 2 * NFSX_HYPER + NFSX_STATEID +
5171 txdr_hyper(offset, tl);
5173 txdr_hyper(len, tl);
5175 NFSCL_DEBUG(4, "layoutret stseq=%d\n", (int)stateidp->seqid);
5176 *tl++ = txdr_unsigned(stateidp->seqid);
5177 *tl++ = stateidp->other[0];
5178 *tl++ = stateidp->other[1];
5179 *tl++ = stateidp->other[2];
5180 *tl = txdr_unsigned(layoutcnt);
5181 if (layoutcnt > 0) {
5182 outcnt = NFSM_RNDUP(layoutcnt);
5183 NFSM_BUILD(cp, uint8_t *, outcnt);
5184 NFSBCOPY(layp, cp, layoutcnt);
5186 for (i = 0; i < (outcnt - layoutcnt); i++)
5190 nd->nd_flag |= ND_USEGSSNAME;
5191 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5192 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5195 if (nd->nd_repstat == 0) {
5196 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5198 NFSM_DISSECT(tl, uint32_t *, NFSX_STATEID);
5199 stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
5200 stateidp->other[0] = *tl++;
5201 stateidp->other[1] = *tl++;
5202 stateidp->other[2] = *tl;
5205 error = nd->nd_repstat;
5207 mbuf_freem(nd->nd_mrep);
5212 * Acquire a layout and devinfo, if possible. The caller must have acquired
5213 * a reference count on the nfsclclient structure before calling this.
5214 * Return the layout in lypp with a reference count on it, if successful.
/*
 * nfsrpc_getlayout: find or acquire a layout (and its device info) for the
 * file identified by nfhp, covering offset off.
 *
 * nfscl_getlayout() is consulted first.  When it yields no layout or no
 * matching file layout (lyp == NULL || flp == NULL), nfsrpc_layoutget() is
 * called with a maximum layout size derived from the MDS session value
 * nfsess_maxcache.  Two call forms are visible: one uses the caller
 * supplied stateid from *stateidp with offset 0, the other uses the
 * stateid stored in the existing layout (lyp->nfsly_stateid) with offset
 * off; both request a length of UINT64_MAX and a minimum length of 0.
 *
 * For every file layout returned in flh, nfscl_adddevinfo() is tried with
 * a NULL device info first; nfsrpc_getdeviceinfo() followed by a second
 * nfscl_adddevinfo() is the visible fallback.  The layouts are then handed
 * to nfscl_layout(), which stores the result through &lyp.
 *
 * NOTE(review): the conditions selecting between the two layoutget calls
 * and the assignment through lypp are not among the statements shown -
 * confirm against the complete function.
 */
5217 nfsrpc_getlayout(struct nfsmount *nmp, vnode_t vp, struct nfsfh *nfhp,
5218 int iomode, uint32_t *notifybitsp, nfsv4stateid_t *stateidp, uint64_t off,
5219 struct nfscllayout **lypp, struct ucred *cred, NFSPROC_T *p)
5221 struct nfscllayout *lyp;
5222 struct nfsclflayout *flp, *tflp;
5223 struct nfscldevinfo *dip;
5224 struct nfsclflayouthead flh;
5225 int error = 0, islocked, layoutlen, recalled, retonclose;
5226 nfsv4stateid_t stateid;
5227 struct nfsclsession *tsep;
5231 * If lyp is returned non-NULL, there will be a refcnt (shared lock)
5232 * on it, iff flp != NULL or a lock (exclusive lock) on it iff
5235 lyp = nfscl_getlayout(nmp->nm_clp, nfhp->nfh_fh, nfhp->nfh_len,
5236 off, &flp, &recalled);
5238 if (lyp == NULL || flp == NULL) {
5242 tsep = nfsmnt_mdssession(nmp);
/* The stateid and three words are subtracted from nfsess_maxcache. */
5243 layoutlen = tsep->nfsess_maxcache -
5244 (NFSX_STATEID + 3 * NFSX_UNSIGNED);
5247 stateid.other[0] = stateidp->other[0];
5248 stateid.other[1] = stateidp->other[1];
5249 stateid.other[2] = stateidp->other[2];
5250 error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5251 nfhp->nfh_len, iomode, (uint64_t)0, UINT64_MAX,
5252 (uint64_t)0, layoutlen, &stateid, &retonclose,
5253 &flh, cred, p, NULL);
5256 stateid.seqid = lyp->nfsly_stateid.seqid;
5257 stateid.other[0] = lyp->nfsly_stateid.other[0];
5258 stateid.other[1] = lyp->nfsly_stateid.other[1];
5259 stateid.other[2] = lyp->nfsly_stateid.other[2];
5260 error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5261 nfhp->nfh_len, iomode, off, UINT64_MAX,
5262 (uint64_t)0, layoutlen, &stateid, &retonclose,
5263 &flh, cred, p, NULL);
5266 LIST_FOREACH(tflp, &flh, nfsfl_list) {
5267 error = nfscl_adddevinfo(nmp, NULL, tflp);
5269 error = nfsrpc_getdeviceinfo(nmp,
5271 NFSLAYOUT_NFSV4_1_FILES,
5272 notifybitsp, &dip, cred, p);
5275 error = nfscl_adddevinfo(nmp, dip,
5279 "getlayout: cannot add\n");
5284 * nfscl_layout() always returns with the nfsly_lock
5285 * set to a refcnt (shared lock).
5287 error = nfscl_layout(nmp, vp, nfhp->nfh_fh,
5288 nfhp->nfh_len, &stateid, retonclose, &flh, &lyp,
5292 } else if (islocked != 0)
5293 nfsv4_unlock(&lyp->nfsly_lock, 0);
5300 * Do a TCP connection plus exchange id and create session.
5301 * If successful, a "struct nfsclds" is linked into the list for the
5302 * mount point and a pointer to it is returned.
/*
 * nfsrpc_fillsa: obtain a data server (DS) session for the address in ssp.
 *
 * For AF_INET and AF_INET6 the list nmp->nm_sess is scanned first.  The
 * address and port in ssp are compared with the address of the mount
 * (nmp->nm_sockreq.nr_nam) for the first list entry and with
 * nfsclds_sockp->nr_nam for the following entries; a match also requires
 * the entry to have NFSCLDS_DS set and nfsess_defunct == 0.
 *
 * When no entry matches, a copy of the address and a zeroed
 * struct nfssockreq are allocated, the socket request is set up for
 * SOCK_STREAM with NFS_PROG/NFS_VER4 and a held reference on the mount
 * credentials, and newnfs_connect() is called.  nfsrpc_exchangeid() is then
 * done with NFSV4EXCH_USEPNFSDS and nfscl_getsameserver() decides what to
 * do with the new nfsclds:
 *   NFSDSP_USETHISSESSION - the new connection is disconnected and the new
 *                           nfsclds freed;
 *   NFSDSP_SEQTHISSESSION - nfsrpc_createsession() uses the sequence id of
 *                           the matching entry tdsp;
 *   otherwise             - nfsrpc_createsession() uses the sequence id of
 *                           the new nfsclds.
 * A successfully created session is appended to the tail of nmp->nm_sess.
 * The visible cleanup code releases the credential, mutex, address and
 * socket request, or disconnects and frees dsp.
 *
 * NOTE(review): the statements that store the result through dspp and the
 * exact conditions guarding each cleanup path are not shown - confirm.
 */
5305 nfsrpc_fillsa(struct nfsmount *nmp, struct sockaddr_storage *ssp,
5306 struct nfsclds **dspp, NFSPROC_T *p)
5308 struct sockaddr_in *msad, *sad, *ssd;
5309 struct sockaddr_in6 *msad6, *sad6, *ssd6;
5310 struct nfsclclient *clp;
5311 struct nfssockreq *nrp;
5312 struct nfsclds *dsp, *tdsp;
5314 enum nfsclds_state retv;
5315 uint32_t sequenceid;
5317 KASSERT(nmp->nm_sockreq.nr_cred != NULL,
5318 ("nfsrpc_fillsa: NULL nr_cred"));
5324 if (ssp->ss_family == AF_INET) {
5325 ssd = (struct sockaddr_in *)ssp;
5329 * Check to see if we already have a session for this
5330 * address that is usable for a DS.
5331 * Note that the MDS's address is in a different place
5332 * than the sessions already acquired for DS's.
5334 msad = (struct sockaddr_in *)nmp->nm_sockreq.nr_nam;
5335 tdsp = TAILQ_FIRST(&nmp->nm_sess);
5336 while (tdsp != NULL) {
5337 if (msad != NULL && msad->sin_family == AF_INET &&
5338 ssd->sin_addr.s_addr == msad->sin_addr.s_addr &&
5339 ssd->sin_port == msad->sin_port &&
5340 (tdsp->nfsclds_flags & NFSCLDS_DS) != 0 &&
5341 tdsp->nfsclds_sess.nfsess_defunct == 0) {
5344 NFSCL_DEBUG(4, "fnd same addr\n");
5347 tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5348 if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5349 msad = (struct sockaddr_in *)
5350 tdsp->nfsclds_sockp->nr_nam;
5356 /* No IP address match, so look for new/trunked one. */
5357 sad = malloc(sizeof(*sad), M_SONAME, M_WAITOK | M_ZERO);
5358 sad->sin_len = sizeof(*sad);
5359 sad->sin_family = AF_INET;
5360 sad->sin_port = ssd->sin_port;
5361 sad->sin_addr.s_addr = ssd->sin_addr.s_addr;
5362 nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5363 nrp->nr_nam = (struct sockaddr *)sad;
5364 } else if (ssp->ss_family == AF_INET6) {
5365 ssd6 = (struct sockaddr_in6 *)ssp;
5369 * Check to see if we already have a session for this
5370 * address that is usable for a DS.
5371 * Note that the MDS's address is in a different place
5372 * than the sessions already acquired for DS's.
5374 msad6 = (struct sockaddr_in6 *)nmp->nm_sockreq.nr_nam;
5375 tdsp = TAILQ_FIRST(&nmp->nm_sess);
5376 while (tdsp != NULL) {
5377 if (msad6 != NULL && msad6->sin6_family == AF_INET6 &&
5378 IN6_ARE_ADDR_EQUAL(&ssd6->sin6_addr,
5379 &msad6->sin6_addr) &&
5380 ssd6->sin6_port == msad6->sin6_port &&
5381 (tdsp->nfsclds_flags & NFSCLDS_DS) != 0 &&
5382 tdsp->nfsclds_sess.nfsess_defunct == 0) {
5387 tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5388 if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5389 msad6 = (struct sockaddr_in6 *)
5390 tdsp->nfsclds_sockp->nr_nam;
5396 /* No IP address match, so look for new/trunked one. */
5397 sad6 = malloc(sizeof(*sad6), M_SONAME, M_WAITOK | M_ZERO);
5398 sad6->sin6_len = sizeof(*sad6);
5399 sad6->sin6_family = AF_INET6;
5400 sad6->sin6_port = ssd6->sin6_port;
5401 NFSBCOPY(&ssd6->sin6_addr, &sad6->sin6_addr,
5402 sizeof(struct in6_addr));
5403 nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5404 nrp->nr_nam = (struct sockaddr *)sad6;
5408 nrp->nr_sotype = SOCK_STREAM;
5409 mtx_init(&nrp->nr_mtx, "nfssock", NULL, MTX_DEF);
5410 nrp->nr_prog = NFS_PROG;
5411 nrp->nr_vers = NFS_VER4;
5414 * Use the credentials that were used for the mount, which are
5415 * in nmp->nm_sockreq.nr_cred for newnfs_connect() etc.
5416 * Ref. counting the credentials with crhold() is probably not
5417 * necessary, since nm_sockreq.nr_cred won't be crfree()'d until
5418 * unmount, but I did it anyhow.
5420 nrp->nr_cred = crhold(nmp->nm_sockreq.nr_cred);
5421 error = newnfs_connect(nmp, nrp, NULL, p, 0);
5422 NFSCL_DEBUG(3, "DS connect=%d\n", error);
5424 /* Now, do the exchangeid and create session. */
5426 error = nfsrpc_exchangeid(nmp, clp, nrp, NFSV4EXCH_USEPNFSDS,
5427 &dsp, nrp->nr_cred, p);
5428 NFSCL_DEBUG(3, "DS exchangeid=%d\n", error);
5430 newnfs_disconnect(nrp);
5433 dsp->nfsclds_sockp = nrp;
5435 retv = nfscl_getsameserver(nmp, dsp, &tdsp);
5436 NFSCL_DEBUG(3, "getsame ret=%d\n", retv);
5437 if (retv == NFSDSP_USETHISSESSION) {
5440 * If there is already a session for this server,
5443 (void)newnfs_disconnect(nrp);
5444 nfscl_freenfsclds(dsp);
5448 if (retv == NFSDSP_SEQTHISSESSION)
5449 sequenceid = tdsp->nfsclds_sess.nfsess_sequenceid;
5451 sequenceid = dsp->nfsclds_sess.nfsess_sequenceid;
5453 error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
5454 nrp, sequenceid, 0, nrp->nr_cred, p);
5455 NFSCL_DEBUG(3, "DS createsess=%d\n", error);
5457 NFSFREECRED(nrp->nr_cred);
5458 NFSFREEMUTEX(&nrp->nr_mtx);
5459 free(nrp->nr_nam, M_SONAME);
5460 free(nrp, M_NFSSOCKREQ);
5463 NFSCL_DEBUG(3, "add DS session\n");
5465 * Put it at the end of the list. That way the list
5466 * is ordered by when the entry was added. This matters
5467 * since the one done first is the one that should be
5468 * used for sequencid'ing any subsequent create sessions.
5471 TAILQ_INSERT_TAIL(&nmp->nm_sess, dsp, nfsclds_list);
5474 } else if (dsp != NULL) {
5475 newnfs_disconnect(nrp);
5476 nfscl_freenfsclds(dsp);
5482 * Do the NFSv4.1 Reclaim Complete.
/*
 * nfsrpc_reclaimcomplete: send an NFSPROC_RECLAIMCOMPL request for mount
 * nmp on the socket of the mount (nm_sockreq), using cred and p.
 *
 * One 32-bit argument word is reserved in the request; the statement that
 * fills it in is not shown.  The statements shown set error from
 * nd->nd_repstat and free the reply mbuf chain.
 */
5485 nfsrpc_reclaimcomplete(struct nfsmount *nmp, struct ucred *cred, NFSPROC_T *p)
5488 struct nfsrv_descript nfsd;
5489 struct nfsrv_descript *nd = &nfsd;
5492 nfscl_reqstart(nd, NFSPROC_RECLAIMCOMPL, nmp, NULL, 0, NULL, NULL);
5493 NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
5495 nd->nd_flag |= ND_USEGSSNAME;
5496 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5497 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5500 error = nd->nd_repstat;
5501 mbuf_freem(nd->nd_mrep);
5506 * Initialize the slot tables for a session.
/*
 * nfscl_initsessionslots: reset the slot state of session sep.
 *
 * Each of the NFSV4_CBSLOTS callback slots has its cached reply mbuf chain
 * freed (when one is present) and is then zeroed.  The first 64 entries of
 * nfsess_slotseq are set to 0 and nfsess_slots is cleared.
 */
5509 nfscl_initsessionslots(struct nfsclsession *sep)
5513 for (i = 0; i < NFSV4_CBSLOTS; i++) {
/* Release any cached reply before the slot is wiped. */
5514 if (sep->nfsess_cbslots[i].nfssl_reply != NULL)
5515 m_freem(sep->nfsess_cbslots[i].nfssl_reply);
5516 NFSBZERO(&sep->nfsess_cbslots[i], sizeof(struct nfsslot));
5518 for (i = 0; i < 64; i++)
5519 sep->nfsess_slotseq[i] = 0;
5520 sep->nfsess_slots = 0;
5524 * Called to try and do an I/O operation via an NFSv4.1 Data Server (DS).
/*
 * nfscl_doiods: try to perform the I/O described by uiop on vnode vp
 * through a data server (DS) using a file layout.
 *
 * Preconditions tested first: the mount has pNFS enabled (NFSHASPNFS),
 * nfscl_enablecallb and nfs_numnfscbd are non-zero and the node does not
 * have NNOLAYOUT set; a reference on the client ID is then taken with
 * nfscl_getref().
 *
 * A stateid is looked up with nfscl_getstateid() using a new credential
 * from NFSNEWCRED(cred).  nfscl_getlayout() is consulted for an existing
 * layout covering uiop->uio_offset; when there is none, nfsrpc_getlayout()
 * is called with NFSLAYOUTIOMODE_RW if rwaccess is NFSV4OPEN_ACCESSWRITE or
 * the node has NWRITEOPENED set, and NFSLAYOUTIOMODE_READ otherwise.  A
 * visible error path sets NNOLAYOUT on the node.
 *
 * The main loop runs while bytes remain, error == 0 and eof == 0: it picks
 * a file layout with nfscl_findlayoutforio(), looks up its device info,
 * calls nfscl_doflayoutio() and advances len by the amount uio_resid
 * dropped.  layp->nfsly_lastbyte is raised when the transfer extends past
 * it.  For NFSERR_OPENMODE on a read, NFSSTA_OPENMODE is set in
 * nmp->nm_state.
 *
 * On the way out the lock reference, the credential and the layout
 * reference are released.
 *
 * NOTE(review): xfer is clamped to nfsfl_end - nfsfl_off (the whole
 * segment length) rather than nfsfl_end - off; confirm this is intended
 * when off lies inside the segment.
 */
5527 nfscl_doiods(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5528 uint32_t rwaccess, struct ucred *cred, NFSPROC_T *p)
5530 struct nfsnode *np = VTONFS(vp);
5531 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5532 struct nfscllayout *layp;
5533 struct nfscldevinfo *dip;
5534 struct nfsclflayout *rflp;
5535 nfsv4stateid_t stateid;
5536 struct ucred *newcred;
5537 uint64_t lastbyte, len, off, oresid, xfer;
5538 int eof, error, iolaymode, recalled;
5541 if (!NFSHASPNFS(nmp) || nfscl_enablecallb == 0 || nfs_numnfscbd == 0 ||
5542 (np->n_flag & NNOLAYOUT) != 0)
5544 /* Now, get a reference cnt on the clientid for this mount. */
5545 if (nfscl_getref(nmp) == 0)
5548 /* Find an appropriate stateid. */
5549 newcred = NFSNEWCRED(cred);
5550 error = nfscl_getstateid(vp, np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
5551 rwaccess, 1, newcred, p, &stateid, &lckp);
5553 NFSFREECRED(newcred);
5557 /* Search for a layout for this file. */
5558 off = uiop->uio_offset;
5559 layp = nfscl_getlayout(nmp->nm_clp, np->n_fhp->nfh_fh,
5560 np->n_fhp->nfh_len, off, &rflp, &recalled);
5561 if (layp == NULL || rflp == NULL) {
5562 if (recalled != 0) {
5563 NFSFREECRED(newcred);
5568 nfscl_rellayout(layp, (rflp == NULL) ? 1 : 0);
5571 /* Try and get a Layout, if it is supported. */
5572 if (rwaccess == NFSV4OPEN_ACCESSWRITE ||
5573 (np->n_flag & NWRITEOPENED) != 0)
5574 iolaymode = NFSLAYOUTIOMODE_RW;
5576 iolaymode = NFSLAYOUTIOMODE_READ;
5577 error = nfsrpc_getlayout(nmp, vp, np->n_fhp, iolaymode,
5578 NULL, &stateid, off, &layp, newcred, p);
5581 np->n_flag |= NNOLAYOUT;
5584 nfscl_lockderef(lckp);
5585 NFSFREECRED(newcred);
5587 nfscl_rellayout(layp, 0);
5594 * Loop around finding a layout that works for the first part of
5595 * this I/O operation, and then call the function that actually
5599 len = (uint64_t)uiop->uio_resid;
5600 while (len > 0 && error == 0 && eof == 0) {
5601 off = uiop->uio_offset;
5602 error = nfscl_findlayoutforio(layp, off, rwaccess, &rflp);
/* oresid records uio_resid before the transfer so progress can be measured. */
5604 oresid = xfer = (uint64_t)uiop->uio_resid;
5605 if (xfer > (rflp->nfsfl_end - rflp->nfsfl_off))
5606 xfer = rflp->nfsfl_end - rflp->nfsfl_off;
5607 dip = nfscl_getdevinfo(nmp->nm_clp, rflp->nfsfl_dev,
5610 error = nfscl_doflayoutio(vp, uiop, iomode,
5611 must_commit, &eof, &stateid, rwaccess, dip,
5612 layp, rflp, off, xfer, newcred, p);
5613 nfscl_reldevinfo(dip);
5614 lastbyte = off + xfer - 1;
5617 if (lastbyte > layp->nfsly_lastbyte)
5618 layp->nfsly_lastbyte = lastbyte;
5620 } else if (error == NFSERR_OPENMODE &&
5621 rwaccess == NFSV4OPEN_ACCESSREAD) {
5623 nmp->nm_state |= NFSSTA_OPENMODE;
/* Subtract the number of bytes that this pass actually consumed. */
5629 len -= (oresid - (uint64_t)uiop->uio_resid);
5633 nfscl_lockderef(lckp);
5634 NFSFREECRED(newcred);
5635 nfscl_rellayout(layp, 0);
5641 * Find a file layout that will handle the first bytes of the requested
5642 * range and return the information from it needed to do the I/O operation.
/*
 * nfscl_findlayoutforio: choose the file layout in lyp to use for I/O that
 * starts at byte offset off.
 *
 * The lists lyp->nfsly_flayread and lyp->nfsly_flayrw are walked; for read
 * access the read list is examined first and the search then switches to
 * the read/write list.  An entry is a candidate when its nfsfl_end is
 * greater than off, and a candidate replaces the current choice when no
 * choice exists yet or its nfsfl_end is larger.  Entries whose nfsfl_off
 * is greater than off are tested separately.
 *
 * NOTE(review): the local rw is presumably initialised from rwaccess, the
 * nfsfl_off > off test presumably ends the scan of a list, and the choice
 * is presumably returned through retflpp; none of these statements are
 * shown - confirm.
 */
5645 nfscl_findlayoutforio(struct nfscllayout *lyp, uint64_t off, uint32_t rwaccess,
5646 struct nfsclflayout **retflpp)
5648 struct nfsclflayout *flp, *nflp, *rflp;
5653 /* For reading, do the Read list first and then the Write list. */
5655 if (rw == NFSV4OPEN_ACCESSREAD)
5656 flp = LIST_FIRST(&lyp->nfsly_flayread);
5658 flp = LIST_FIRST(&lyp->nfsly_flayrw);
5659 while (flp != NULL) {
/* The successor is fetched before flp is examined. */
5660 nflp = LIST_NEXT(flp, nfsfl_list);
5661 if (flp->nfsfl_off > off)
5663 if (flp->nfsfl_end > off &&
5664 (rflp == NULL || rflp->nfsfl_end < flp->nfsfl_end))
5668 if (rw == NFSV4OPEN_ACCESSREAD)
5669 rw = NFSV4OPEN_ACCESSWRITE;
5674 /* This one covers the most bytes starting at off. */
5682 * Do I/O using an NFSv4.1 file layout.
/*
 * nfscl_doflayoutio: perform len bytes of I/O starting at off on vnode vp
 * using file layout flp and device info dp, one stripe unit at a time.
 *
 * rel_off is off relative to flp->nfsfl_patoff.  The stripe unit size is
 * derived from flp->nfsfl_util and the starting stripe position is
 * (rel_off / stripe_unit_size + nfsfl_stripe1) modulo dp->nfsdi_stripecnt.
 * The first pass is limited to the remainder of the current stripe unit;
 * later passes use a full stripe unit and advance stripe_pos by one,
 * wrapping at nfsdi_stripecnt.
 *
 * For every pass the DS is found through nfsfldi_stripeindex() and
 * nfsfldi_addr().  With NFSFLAYUTIL_DENSE set, the file handle is
 * nfsfl_fh[stripe_pos] and io_off is the offset compacted per stripe;
 * otherwise (sparse) the file handle is nfsfl_fh[stripe_index] when there
 * is more than one handle, or nfsfl_fh[0] when there is exactly one.
 * rwflag == FREAD selects nfsrpc_readds(); the other visible call is
 * nfsrpc_writeds(), which is told whether NFSFLAYUTIL_COMMIT_THRU_MDS is
 * set.  NFSLY_WRITTEN is set in lyp->nfsly_flags on a visible path after
 * the I/O call.
 *
 * NOTE(review): stripe_unit_size is computed as (nfsfl_util >> 6) &
 * 0x3ffffff, whereas RFC 5661 defines the stripe unit size as nfl_util
 * masked with 0xFFFFFFC0 without a shift - confirm which unit is intended.
 * NOTE(review): no check for stripe_unit_size == 0 is visible before it is
 * used as a divisor - confirm that a server supplied zero cannot reach
 * this point.
 */
5685 nfscl_doflayoutio(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5686 int *eofp, nfsv4stateid_t *stateidp, int rwflag, struct nfscldevinfo *dp,
5687 struct nfscllayout *lyp, struct nfsclflayout *flp, uint64_t off,
5688 uint64_t len, struct ucred *cred, NFSPROC_T *p)
5690 uint64_t io_off, rel_off, stripe_unit_size, transfer, xfer;
5691 int commit_thru_mds, error = 0, stripe_index, stripe_pos;
5694 struct nfsclds **dspp;
5697 rel_off = off - flp->nfsfl_patoff;
5698 stripe_unit_size = (flp->nfsfl_util >> 6) & 0x3ffffff;
5699 stripe_pos = (rel_off / stripe_unit_size + flp->nfsfl_stripe1) %
5700 dp->nfsdi_stripecnt;
/* Bytes left in the stripe unit that contains rel_off. */
5701 transfer = stripe_unit_size - (rel_off % stripe_unit_size);
5703 /* Loop around, doing I/O for each stripe unit. */
5704 while (len > 0 && error == 0) {
5705 stripe_index = nfsfldi_stripeindex(dp, stripe_pos);
5706 dspp = nfsfldi_addr(dp, stripe_index);
5711 if ((flp->nfsfl_util & NFSFLAYUTIL_DENSE) != 0) {
5713 if (stripe_pos >= flp->nfsfl_fhcnt)
5715 fhp = flp->nfsfl_fh[stripe_pos];
5716 io_off = (rel_off / (stripe_unit_size *
5717 dp->nfsdi_stripecnt)) * stripe_unit_size +
5718 rel_off % stripe_unit_size;
5720 /* Sparse layout. */
5721 if (flp->nfsfl_fhcnt > 1) {
5722 if (stripe_index >= flp->nfsfl_fhcnt)
5724 fhp = flp->nfsfl_fh[stripe_index];
5725 } else if (flp->nfsfl_fhcnt == 1)
5726 fhp = flp->nfsfl_fh[0];
5731 if ((flp->nfsfl_util & NFSFLAYUTIL_COMMIT_THRU_MDS) != 0)
5732 commit_thru_mds = 1;
5734 commit_thru_mds = 0;
5735 if (rwflag == FREAD)
5736 error = nfsrpc_readds(vp, uiop, stateidp, eofp, *dspp,
5737 io_off, xfer, fhp, cred, p);
5739 error = nfsrpc_writeds(vp, uiop, iomode, must_commit,
5740 stateidp, *dspp, io_off, xfer, fhp, commit_thru_mds,
5744 lyp->nfsly_flags |= NFSLY_WRITTEN;
/* Passes after the first one cover a whole stripe unit. */
5749 transfer = stripe_unit_size;
5750 stripe_pos = (stripe_pos + 1) % dp->nfsdi_stripecnt;
5759 * The actual read RPC done to a DS.
/*
 * nfsrpc_readds: read len bytes at offset io_off from data server dsp,
 * using file handle fhp, into uiop.
 *
 * The NFSPROC_READDS request is built against the DS session
 * (dsp->nfsclds_sess) and carries the stateid (encoded with
 * NFSSTATEID_PUTSEQIDZERO), the 64-bit offset and the length.  The RPC is
 * sent on dsp->nfsclds_sockp; the socket of the mount is the visible
 * fallback (see the comment below about NULL).
 *
 * A non-zero nd_repstat becomes the error.  Otherwise *eofp is set from
 * the reply, the returned data length is obtained with NFSM_STRSIZ()
 * (bounded by len) and the data is copied into uiop by nfsm_mbufuio().
 * The reply mbuf chain is freed when it is non-NULL.
 */
5762 nfsrpc_readds(vnode_t vp, struct uio *uiop, nfsv4stateid_t *stateidp, int *eofp,
5763 struct nfsclds *dsp, uint64_t io_off, int len, struct nfsfh *fhp,
5764 struct ucred *cred, NFSPROC_T *p)
5768 struct nfsrv_descript nfsd;
5769 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5770 struct nfsrv_descript *nd = &nfsd;
5771 struct nfssockreq *nrp;
5774 nfscl_reqstart(nd, NFSPROC_READDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5775 NULL, &dsp->nfsclds_sess);
5776 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
/* Three words: the 64-bit offset followed by the 32-bit length. */
5777 NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED * 3);
5778 txdr_hyper(io_off, tl);
5779 *(tl + 2) = txdr_unsigned(len);
5780 nrp = dsp->nfsclds_sockp;
5782 /* If NULL, use the MDS socket. */
5783 nrp = &nmp->nm_sockreq;
5784 error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5785 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5788 if (nd->nd_repstat != 0) {
5789 error = nd->nd_repstat;
5792 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5793 *eofp = fxdr_unsigned(int, *tl);
5794 NFSM_STRSIZ(retlen, len);
5795 error = nfsm_mbufuio(nd, uiop, retlen);
5797 if (nd->nd_mrep != NULL)
5798 mbuf_freem(nd->nd_mrep);
5803 * The actual write RPC done to a DS.
/*
 * nfsrpc_writeds: write len bytes from uiop at offset io_off to data
 * server dsp, using file handle fhp.
 *
 * uiop must describe exactly one iovec (KASSERT).  The NFSPROC_WRITEDS
 * request is built against the DS session and carries the stateid
 * (encoded with NFSSTATEID_PUTSEQIDZERO), the offset, the stability level
 * in *iomode and the length, followed by the data copied from uiop by
 * nfsm_uiombuf().  The RPC is sent on dsp->nfsclds_sockp; the socket of
 * the mount is the visible fallback.
 *
 * Reply handling:
 *  - nd_repstat != 0: the uio fields advanced by nfsm_uiombuf() are rolled
 *    back by len so the write can be retried, and nd_repstat becomes the
 *    error;
 *  - otherwise the count written (rlen) is read; when rlen < len the uio
 *    is backed up by len - rlen;
 *  - the commitment level returned by the server is folded into committed,
 *    which starts at NFSWRITE_FILESYNC, and is stored in *iomode at the
 *    end;
 *  - the write verifier is recorded in, or compared with, nmp->nm_verf
 *    when commit_thru_mds is non-zero and dsp->nfsclds_verf otherwise; on
 *    a mismatch the stored verifier is replaced.
 *
 * NOTE(review): must_commit is presumably set when a verifier changes; the
 * assignment is not among the statements shown - confirm.
 */
5806 nfsrpc_writeds(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5807 nfsv4stateid_t *stateidp, struct nfsclds *dsp, uint64_t io_off, int len,
5808 struct nfsfh *fhp, int commit_thru_mds, struct ucred *cred, NFSPROC_T *p)
5811 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5812 int error, rlen, commit, committed = NFSWRITE_FILESYNC;
5814 struct nfsrv_descript nfsd;
5815 struct nfsrv_descript *nd = &nfsd;
5816 struct nfssockreq *nrp;
5818 KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
5820 nfscl_reqstart(nd, NFSPROC_WRITEDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5821 NULL, &dsp->nfsclds_sess);
5822 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
5823 NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + 2 * NFSX_UNSIGNED);
5824 txdr_hyper(io_off, tl);
5826 *tl++ = txdr_unsigned(*iomode);
5827 *tl = txdr_unsigned(len);
5828 nfsm_uiombuf(nd, uiop, len);
5829 nrp = dsp->nfsclds_sockp;
5831 /* If NULL, use the MDS socket. */
5832 nrp = &nmp->nm_sockreq;
5833 error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5834 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5837 if (nd->nd_repstat != 0) {
5839 * In case the rpc gets retried, roll
5840 * the uio fileds changed by nfsm_uiombuf()
5843 uiop->uio_offset -= len;
5844 uio_uio_resid_add(uiop, len);
5845 uio_iov_base_add(uiop, -len);
5846 uio_iov_len_add(uiop, len);
5847 error = nd->nd_repstat;
5849 NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_VERF);
5850 rlen = fxdr_unsigned(int, *tl++);
/* Short write: give the unwritten tail back to the uio. */
5854 } else if (rlen < len) {
5855 backup = len - rlen;
5856 uio_iov_base_add(uiop, -(backup));
5857 uio_iov_len_add(uiop, backup);
5858 uiop->uio_offset -= backup;
5859 uio_uio_resid_add(uiop, backup);
5862 commit = fxdr_unsigned(int, *tl++);
5865 * Return the lowest commitment level
5866 * obtained by any of the RPCs.
5868 if (committed == NFSWRITE_FILESYNC)
5870 else if (committed == NFSWRITE_DATASYNC &&
5871 commit == NFSWRITE_UNSTABLE)
5873 if (commit_thru_mds != 0) {
5875 if (!NFSHASWRITEVERF(nmp)) {
5876 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5877 NFSSETWRITEVERF(nmp);
5878 } else if (NFSBCMP(tl, nmp->nm_verf, NFSX_VERF)) {
5880 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5885 if ((dsp->nfsclds_flags & NFSCLDS_HASWRITEVERF) == 0) {
5886 NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5887 dsp->nfsclds_flags |= NFSCLDS_HASWRITEVERF;
5888 } else if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
5890 NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5896 if (nd->nd_mrep != NULL)
5897 mbuf_freem(nd->nd_mrep);
5898 *iomode = committed;
5899 if (nd->nd_repstat != 0 && error == 0)
5900 error = nd->nd_repstat;
5905 * Free up the nfsclds structure.
/*
 * nfscl_freenfsclds: release the nfsclds structure dsp and what it owns.
 *
 * When dsp->nfsclds_sockp is non-NULL, its credential, mutex and address
 * are released and the socket request itself is freed (M_NFSSOCKREQ).  The
 * nfsclds mutex and the session mutex are then destroyed, the callback
 * slots holding a cached reply are visited, and dsp is freed (M_NFSCLDS).
 *
 * NOTE(review): the call applied to each cached slot reply is not shown;
 * presumably it frees the mbuf chain - confirm.
 */
5908 nfscl_freenfsclds(struct nfsclds *dsp)
5914 if (dsp->nfsclds_sockp != NULL) {
5915 NFSFREECRED(dsp->nfsclds_sockp->nr_cred);
5916 NFSFREEMUTEX(&dsp->nfsclds_sockp->nr_mtx);
5917 free(dsp->nfsclds_sockp->nr_nam, M_SONAME);
5918 free(dsp->nfsclds_sockp, M_NFSSOCKREQ);
5920 NFSFREEMUTEX(&dsp->nfsclds_mtx);
5921 NFSFREEMUTEX(&dsp->nfsclds_sess.nfsess_mtx);
5922 for (i = 0; i < NFSV4_CBSLOTS; i++) {
5923 if (dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply != NULL)
5925 dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply);
5927 free(dsp, M_NFSCLDS);
/*
 * nfscl_getsameserver: look through nmp->nm_sess for an entry that belongs
 * to the same server as newdsp.
 *
 * Two entries match when their nfsclds_servownlen values are equal and
 * non-zero, the nfsclds_serverown bytes compare equal and the existing
 * session is not defunct (nfsess_defunct == 0).
 *
 * Returns:
 *   NFSDSP_USETHISSESSION - a matching entry has NFSCLDS_DS set;
 *   NFSDSP_SEQTHISSESSION - only matching entries without NFSCLDS_DS were
 *                           found; the first of them is remembered in
 *                           cur_dsp;
 *   NFSDSP_NOTFOUND       - no entry matched.
 *
 * NOTE(review): the assignments through retdspp are not among the
 * statements shown; presumably it receives the matching entry for the
 * first two return values - confirm.
 */
5930 static enum nfsclds_state
5931 nfscl_getsameserver(struct nfsmount *nmp, struct nfsclds *newdsp,
5932 struct nfsclds **retdspp)
5934 struct nfsclds *dsp, *cur_dsp;
5937 * Search the list of nfsclds structures for one with the same
5941 TAILQ_FOREACH(dsp, &nmp->nm_sess, nfsclds_list) {
5942 if (dsp->nfsclds_servownlen == newdsp->nfsclds_servownlen &&
5943 dsp->nfsclds_servownlen != 0 &&
5944 !NFSBCMP(dsp->nfsclds_serverown, newdsp->nfsclds_serverown,
5945 dsp->nfsclds_servownlen) &&
5946 dsp->nfsclds_sess.nfsess_defunct == 0) {
5947 NFSCL_DEBUG(4, "fnd same fdsp=%p dsp=%p flg=0x%x\n",
5948 TAILQ_FIRST(&nmp->nm_sess), dsp,
5949 dsp->nfsclds_flags);
5950 /* Server major id matches. */
5951 if ((dsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5953 return (NFSDSP_USETHISSESSION);
5957 * Note the first match, so it can be used for
5958 * sequence'ing new sessions.
5960 if (cur_dsp == NULL)
5964 if (cur_dsp != NULL) {
5966 return (NFSDSP_SEQTHISSESSION);
5968 return (NFSDSP_NOTFOUND);
5973 * NFS commit rpc to a DS.
5976 nfsrpc_commitds(vnode_t vp, uint64_t offset, int cnt, struct nfsclds *dsp,
5977 struct nfsfh *fhp, struct ucred *cred, NFSPROC_T *p, void *stuff)
5980 struct nfsrv_descript nfsd, *nd = &nfsd;
5981 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5982 struct nfssockreq *nrp;
5985 nfscl_reqstart(nd, NFSPROC_COMMITDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5986 NULL, &dsp->nfsclds_sess);
5987 NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + NFSX_UNSIGNED);
5988 txdr_hyper(offset, tl);
5990 *tl = txdr_unsigned(cnt);
5991 nrp = dsp->nfsclds_sockp;
5993 /* If NULL, use the MDS socket. */
5994 nrp = &nmp->nm_sockreq;
5995 error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5996 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5999 if (nd->nd_repstat == 0) {
6000 NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
6002 if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
6003 NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
6004 error = NFSERR_STALEWRITEVERF;
6009 if (error == 0 && nd->nd_repstat != 0)
6010 error = nd->nd_repstat;
6011 mbuf_freem(nd->nd_mrep);