2 * Copyright (c) 1989, 1993
3 * The Regents of the University of California. All rights reserved.
5 * This code is derived from software contributed to Berkeley by
6 * Rick Macklem at The University of Guelph.
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 4. Neither the name of the University nor the names of its contributors
17 * may be used to endorse or promote products derived from this software
18 * without specific prior written permission.
20 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 #include <sys/cdefs.h>
35 __FBSDID("$FreeBSD$");
38 * Rpc op calls, generally called from the vnode op calls or through the
39 * buffer cache, for NFS v2, 3 and 4.
40 * These do not normally make any changes to vnode arguments or use
41 * structures that might change between the VFS variants. The returned
42 * arguments are all at the end, after the NFSPROC_T *p one.
46 #include "opt_inet6.h"
48 #include <fs/nfs/nfsport.h>
53 extern int nfs_numnfscbd;
54 extern struct timeval nfsboottime;
55 extern u_int32_t newnfs_false, newnfs_true;
56 extern nfstype nfsv34_type[9];
57 extern int nfsrv_useacl;
58 extern char nfsv4_callbackaddr[INET6_ADDRSTRLEN];
59 extern int nfscl_debuglevel;
61 int nfstest_outofseq = 0;
62 int nfscl_assumeposixlocks = 1;
63 int nfscl_enablecallb = 0;
64 short nfsv4_cbport = NFSV4_CBPORT;
65 int nfstest_openallsetattr = 0;
66 #endif /* !APPLEKEXT */
68 #define DIRHDSIZ (sizeof (struct dirent) - (MAXNAMLEN + 1))
71 * nfscl_getsameserver() can return one of three values:
72 * NFSDSP_USETHISSESSION - Use this session for the DS.
73 * NFSDSP_SEQTHISSESSION - Use the nfsclds_sequence field of this dsp for new
75 * NFSDSP_NOTFOUND - No matching server was found.
78 NFSDSP_USETHISSESSION = 0,
79 NFSDSP_SEQTHISSESSION = 1,
83 static int nfsrpc_setattrrpc(vnode_t , struct vattr *, nfsv4stateid_t *,
84 struct ucred *, NFSPROC_T *, struct nfsvattr *, int *, void *);
85 static int nfsrpc_readrpc(vnode_t , struct uio *, struct ucred *,
86 nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *, void *);
87 static int nfsrpc_writerpc(vnode_t , struct uio *, int *, int *,
88 struct ucred *, nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *,
90 static int nfsrpc_createv23(vnode_t , char *, int, struct vattr *,
91 nfsquad_t, int, struct ucred *, NFSPROC_T *, struct nfsvattr *,
92 struct nfsvattr *, struct nfsfh **, int *, int *, void *);
93 static int nfsrpc_createv4(vnode_t , char *, int, struct vattr *,
94 nfsquad_t, int, struct nfsclowner *, struct nfscldeleg **, struct ucred *,
95 NFSPROC_T *, struct nfsvattr *, struct nfsvattr *, struct nfsfh **, int *,
96 int *, void *, int *);
97 static int nfsrpc_locku(struct nfsrv_descript *, struct nfsmount *,
98 struct nfscllockowner *, u_int64_t, u_int64_t,
99 u_int32_t, struct ucred *, NFSPROC_T *, int);
100 static int nfsrpc_setaclrpc(vnode_t, struct ucred *, NFSPROC_T *,
101 struct acl *, nfsv4stateid_t *, void *);
102 static int nfsrpc_getlayout(struct nfsmount *, vnode_t, struct nfsfh *, int,
103 uint32_t *, nfsv4stateid_t *, uint64_t, struct nfscllayout **,
104 struct ucred *, NFSPROC_T *);
105 static int nfsrpc_fillsa(struct nfsmount *, struct sockaddr_storage *,
106 struct nfsclds **, NFSPROC_T *);
107 static void nfscl_initsessionslots(struct nfsclsession *);
108 static int nfscl_doflayoutio(vnode_t, struct uio *, int *, int *, int *,
109 nfsv4stateid_t *, int, struct nfscldevinfo *, struct nfscllayout *,
110 struct nfsclflayout *, uint64_t, uint64_t, struct ucred *, NFSPROC_T *);
111 static int nfsrpc_readds(vnode_t, struct uio *, nfsv4stateid_t *, int *,
112 struct nfsclds *, uint64_t, int, struct nfsfh *, struct ucred *,
114 static int nfsrpc_writeds(vnode_t, struct uio *, int *, int *,
115 nfsv4stateid_t *, struct nfsclds *, uint64_t, int,
116 struct nfsfh *, int, struct ucred *, NFSPROC_T *);
117 static enum nfsclds_state nfscl_getsameserver(struct nfsmount *,
118 struct nfsclds *, struct nfsclds **);
120 static int nfsrpc_commitds(vnode_t, uint64_t, int, struct nfsclds *,
121 struct nfsfh *, struct ucred *, NFSPROC_T *, void *);
125 * nfs null call from vfs.
128 nfsrpc_null(vnode_t vp, struct ucred *cred, NFSPROC_T *p)
131 struct nfsrv_descript nfsd, *nd = &nfsd;
133 NFSCL_REQSTART(nd, NFSPROC_NULL, vp);
134 error = nfscl_request(nd, vp, p, cred, NULL);
135 if (nd->nd_repstat && !error)
136 error = nd->nd_repstat;
137 mbuf_freem(nd->nd_mrep);
143 * For nfs version 3 and 4, use the access rpc to check accessibility. If file
144 * modes are changed on the server, accesses might still fail later.
147 nfsrpc_access(vnode_t vp, int acmode, struct ucred *cred,
148 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp)
151 u_int32_t mode, rmode;
154 mode = NFSACCESS_READ;
157 if (vnode_vtype(vp) == VDIR) {
159 mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND |
162 mode |= NFSACCESS_LOOKUP;
165 mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND);
167 mode |= NFSACCESS_EXECUTE;
171 * Now, just call nfsrpc_accessrpc() to do the actual RPC.
173 error = nfsrpc_accessrpc(vp, mode, cred, p, nap, attrflagp, &rmode,
177 * The NFS V3 spec does not clarify whether or not
178 * the returned access bits can be a superset of
179 * the ones requested, so...
181 if (!error && (rmode & mode) != mode)
187 * The actual rpc, separated out for Darwin.
190 nfsrpc_accessrpc(vnode_t vp, u_int32_t mode, struct ucred *cred,
191 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, u_int32_t *rmodep,
195 u_int32_t supported, rmode;
197 struct nfsrv_descript nfsd, *nd = &nfsd;
198 nfsattrbit_t attrbits;
202 NFSCL_REQSTART(nd, NFSPROC_ACCESS, vp);
203 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
204 *tl = txdr_unsigned(mode);
205 if (nd->nd_flag & ND_NFSV4) {
207 * And do a Getattr op.
209 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
210 *tl = txdr_unsigned(NFSV4OP_GETATTR);
211 NFSGETATTR_ATTRBIT(&attrbits);
212 (void) nfsrv_putattrbit(nd, &attrbits);
214 error = nfscl_request(nd, vp, p, cred, stuff);
217 if (nd->nd_flag & ND_NFSV3) {
218 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
222 if (!nd->nd_repstat) {
223 if (nd->nd_flag & ND_NFSV4) {
224 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
225 supported = fxdr_unsigned(u_int32_t, *tl++);
227 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
229 rmode = fxdr_unsigned(u_int32_t, *tl);
230 if (nd->nd_flag & ND_NFSV4)
231 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
234 * It's not obvious what should be done about
235 * unsupported access modes. For now, be paranoid
236 * and clear the unsupported ones.
241 error = nd->nd_repstat;
243 mbuf_freem(nd->nd_mrep);
251 nfsrpc_open(vnode_t vp, int amode, struct ucred *cred, NFSPROC_T *p)
253 struct nfsclopen *op;
254 struct nfscldeleg *dp;
256 struct nfsnode *np = VTONFS(vp);
257 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
258 u_int32_t mode, clidrev;
259 int ret, newone, error, expireret = 0, retrycnt;
262 * For NFSv4, Open Ops are only done on Regular Files.
264 if (vnode_vtype(vp) != VREG)
268 mode |= NFSV4OPEN_ACCESSREAD;
270 mode |= NFSV4OPEN_ACCESSWRITE;
275 { char name[100]; int namel;
276 namel = (np->n_v4->n4_namelen < 100) ? np->n_v4->n4_namelen : 99;
277 bcopy(NFS4NODENAME(np->n_v4), name, namel);
279 printf("rpcopen p=0x%x name=%s",p->p_pid,name);
280 if (nfhp->nfh_len > 0) printf(" fh=0x%x\n",nfhp->nfh_fh[12]);
281 else printf(" fhl=0\n");
286 error = nfscl_open(vp, nfhp->nfh_fh, nfhp->nfh_len, mode, 1,
287 cred, p, NULL, &op, &newone, &ret, 1);
291 if (nmp->nm_clp != NULL)
292 clidrev = nmp->nm_clp->nfsc_clientidrev;
295 if (ret == NFSCLOPEN_DOOPEN) {
296 if (np->n_v4 != NULL) {
297 error = nfsrpc_openrpc(nmp, vp, np->n_v4->n4_data,
298 np->n_v4->n4_fhlen, np->n_fhp->nfh_fh,
299 np->n_fhp->nfh_len, mode, op,
300 NFS4NODENAME(np->n_v4), np->n_v4->n4_namelen, &dp,
301 0, 0x0, cred, p, 0, 0);
304 OSBitAndAtomic((int32_t)~NDELEGMOD, (UInt32 *)&np->n_flag);
307 np->n_flag &= ~NDELEGMOD;
309 * Invalidate the attribute cache, so that
310 * attributes that pre-date the issue of a
311 * delegation are not cached, since the
312 * cached attributes will remain valid while
313 * the delegation is held.
315 NFSINVALATTRCACHE(np);
318 (void) nfscl_deleg(nmp->nm_mountp,
319 op->nfso_own->nfsow_clp,
320 nfhp->nfh_fh, nfhp->nfh_len, cred, p, &dp);
325 newnfs_copyincred(cred, &op->nfso_cred);
326 } else if (ret == NFSCLOPEN_SETCRED)
328 * This is a new local open on a delegation. It needs
329 * to have credentials so that an open can be done
330 * against the server during recovery.
332 newnfs_copyincred(cred, &op->nfso_cred);
335 * nfso_opencnt is the count of how many VOP_OPEN()s have
336 * been done on this Open successfully and a VOP_CLOSE()
337 * is expected for each of these.
338 * If error is non-zero, don't increment it, since the Open
339 * hasn't succeeded yet.
343 nfscl_openrelease(op, error, newone);
344 if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
345 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
346 error == NFSERR_BADSESSION) {
347 (void) nfs_catnap(PZERO, error, "nfs_open");
348 } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
350 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
353 } while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
354 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
355 error == NFSERR_BADSESSION ||
356 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
357 expireret == 0 && clidrev != 0 && retrycnt < 4));
358 if (error && retrycnt >= 4)
364 * the actual open rpc
367 nfsrpc_openrpc(struct nfsmount *nmp, vnode_t vp, u_int8_t *nfhp, int fhlen,
368 u_int8_t *newfhp, int newfhlen, u_int32_t mode, struct nfsclopen *op,
369 u_int8_t *name, int namelen, struct nfscldeleg **dpp,
370 int reclaim, u_int32_t delegtype, struct ucred *cred, NFSPROC_T *p,
371 int syscred, int recursed)
374 struct nfsrv_descript nfsd, *nd = &nfsd;
375 struct nfscldeleg *dp, *ndp = NULL;
376 struct nfsvattr nfsva;
377 u_int32_t rflags, deleg;
378 nfsattrbit_t attrbits;
379 int error, ret, acesize, limitby;
383 nfscl_reqstart(nd, NFSPROC_OPEN, nmp, nfhp, fhlen, NULL, NULL);
384 NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
385 *tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
386 *tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
387 *tl++ = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
388 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
389 *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
390 (void) nfsm_strtom(nd, op->nfso_own->nfsow_owner, NFSV4CL_LOCKNAMELEN);
391 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
392 *tl++ = txdr_unsigned(NFSV4OPEN_NOCREATE);
394 *tl = txdr_unsigned(NFSV4OPEN_CLAIMPREVIOUS);
395 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
396 *tl = txdr_unsigned(delegtype);
399 *tl = txdr_unsigned(NFSV4OPEN_CLAIMDELEGATECUR);
400 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
401 if (NFSHASNFSV4N(nmp))
404 *tl++ = dp->nfsdl_stateid.seqid;
405 *tl++ = dp->nfsdl_stateid.other[0];
406 *tl++ = dp->nfsdl_stateid.other[1];
407 *tl = dp->nfsdl_stateid.other[2];
409 *tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
411 (void) nfsm_strtom(nd, name, namelen);
413 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
414 *tl = txdr_unsigned(NFSV4OP_GETATTR);
415 NFSZERO_ATTRBIT(&attrbits);
416 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_CHANGE);
417 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TIMEMODIFY);
418 (void) nfsrv_putattrbit(nd, &attrbits);
420 nd->nd_flag |= ND_USEGSSNAME;
421 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
422 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
425 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
426 if (!nd->nd_repstat) {
427 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
429 op->nfso_stateid.seqid = *tl++;
430 op->nfso_stateid.other[0] = *tl++;
431 op->nfso_stateid.other[1] = *tl++;
432 op->nfso_stateid.other[2] = *tl;
433 rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
434 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
437 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
438 deleg = fxdr_unsigned(u_int32_t, *tl);
439 if (deleg == NFSV4OPEN_DELEGATEREAD ||
440 deleg == NFSV4OPEN_DELEGATEWRITE) {
441 if (!(op->nfso_own->nfsow_clp->nfsc_flags &
442 NFSCLFLAGS_FIRSTDELEG))
443 op->nfso_own->nfsow_clp->nfsc_flags |=
444 (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
445 MALLOC(ndp, struct nfscldeleg *,
446 sizeof (struct nfscldeleg) + newfhlen,
447 M_NFSCLDELEG, M_WAITOK);
448 LIST_INIT(&ndp->nfsdl_owner);
449 LIST_INIT(&ndp->nfsdl_lock);
450 ndp->nfsdl_clp = op->nfso_own->nfsow_clp;
451 ndp->nfsdl_fhlen = newfhlen;
452 NFSBCOPY(newfhp, ndp->nfsdl_fh, newfhlen);
453 newnfs_copyincred(cred, &ndp->nfsdl_cred);
454 nfscl_lockinit(&ndp->nfsdl_rwlock);
455 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
457 ndp->nfsdl_stateid.seqid = *tl++;
458 ndp->nfsdl_stateid.other[0] = *tl++;
459 ndp->nfsdl_stateid.other[1] = *tl++;
460 ndp->nfsdl_stateid.other[2] = *tl++;
461 ret = fxdr_unsigned(int, *tl);
462 if (deleg == NFSV4OPEN_DELEGATEWRITE) {
463 ndp->nfsdl_flags = NFSCLDL_WRITE;
465 * Indicates how much the file can grow.
467 NFSM_DISSECT(tl, u_int32_t *,
469 limitby = fxdr_unsigned(int, *tl++);
471 case NFSV4OPEN_LIMITSIZE:
472 ndp->nfsdl_sizelimit = fxdr_hyper(tl);
474 case NFSV4OPEN_LIMITBLOCKS:
475 ndp->nfsdl_sizelimit =
476 fxdr_unsigned(u_int64_t, *tl++);
477 ndp->nfsdl_sizelimit *=
478 fxdr_unsigned(u_int64_t, *tl);
481 error = NFSERR_BADXDR;
485 ndp->nfsdl_flags = NFSCLDL_READ;
488 ndp->nfsdl_flags |= NFSCLDL_RECALL;
489 error = nfsrv_dissectace(nd, &ndp->nfsdl_ace, &ret,
493 } else if (deleg != NFSV4OPEN_DELEGATENONE) {
494 error = NFSERR_BADXDR;
497 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
498 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
499 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
500 NULL, NULL, NULL, p, cred);
504 ndp->nfsdl_change = nfsva.na_filerev;
505 ndp->nfsdl_modtime = nfsva.na_mtime;
506 ndp->nfsdl_flags |= NFSCLDL_MODTIMESET;
508 if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM)) {
510 ret = nfsrpc_openconfirm(vp, newfhp, newfhlen, op,
512 if (ret == NFSERR_DELAY)
513 (void) nfs_catnap(PZERO, ret, "nfs_open");
514 } while (ret == NFSERR_DELAY);
517 if ((rflags & NFSV4OPEN_LOCKTYPEPOSIX) ||
518 nfscl_assumeposixlocks)
519 op->nfso_posixlock = 1;
521 op->nfso_posixlock = 0;
524 * If the server is handing out delegations, but we didn't
525 * get one because an OpenConfirm was required, try the
526 * Open again, to get a delegation. This is a harmless no-op,
527 * from a server's point of view.
529 if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM) &&
530 (op->nfso_own->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG)
531 && !error && dp == NULL && ndp == NULL && !recursed) {
533 ret = nfsrpc_openrpc(nmp, vp, nfhp, fhlen, newfhp,
534 newfhlen, mode, op, name, namelen, &ndp, 0, 0x0,
535 cred, p, syscred, 1);
536 if (ret == NFSERR_DELAY)
537 (void) nfs_catnap(PZERO, ret, "nfs_open2");
538 } while (ret == NFSERR_DELAY);
541 FREE((caddr_t)ndp, M_NFSCLDELEG);
542 if (ret == NFSERR_STALECLIENTID ||
543 ret == NFSERR_STALEDONTRECOVER ||
544 ret == NFSERR_BADSESSION)
549 if (nd->nd_repstat != 0 && error == 0)
550 error = nd->nd_repstat;
551 if (error == NFSERR_STALECLIENTID || error == NFSERR_BADSESSION)
552 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
556 else if (ndp != NULL)
557 FREE((caddr_t)ndp, M_NFSCLDELEG);
558 mbuf_freem(nd->nd_mrep);
566 nfsrpc_opendowngrade(vnode_t vp, u_int32_t mode, struct nfsclopen *op,
567 struct ucred *cred, NFSPROC_T *p)
570 struct nfsrv_descript nfsd, *nd = &nfsd;
573 NFSCL_REQSTART(nd, NFSPROC_OPENDOWNGRADE, vp);
574 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 3 * NFSX_UNSIGNED);
575 if (NFSHASNFSV4N(VFSTONFS(vnode_mount(vp))))
578 *tl++ = op->nfso_stateid.seqid;
579 *tl++ = op->nfso_stateid.other[0];
580 *tl++ = op->nfso_stateid.other[1];
581 *tl++ = op->nfso_stateid.other[2];
582 *tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
583 *tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
584 *tl = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
585 error = nfscl_request(nd, vp, p, cred, NULL);
588 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
589 if (!nd->nd_repstat) {
590 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
591 op->nfso_stateid.seqid = *tl++;
592 op->nfso_stateid.other[0] = *tl++;
593 op->nfso_stateid.other[1] = *tl++;
594 op->nfso_stateid.other[2] = *tl;
596 if (nd->nd_repstat && error == 0)
597 error = nd->nd_repstat;
598 if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
599 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
601 mbuf_freem(nd->nd_mrep);
606 * V4 Close operation.
609 nfsrpc_close(vnode_t vp, int doclose, NFSPROC_T *p)
611 struct nfsclclient *clp;
614 if (vnode_vtype(vp) != VREG)
617 error = nfscl_doclose(vp, &clp, p);
619 error = nfscl_getclose(vp, &clp);
623 nfscl_clientrelease(clp);
631 nfsrpc_doclose(struct nfsmount *nmp, struct nfsclopen *op, NFSPROC_T *p)
633 struct nfsrv_descript nfsd, *nd = &nfsd;
634 struct nfscllockowner *lp, *nlp;
635 struct nfscllock *lop, *nlop;
637 u_int64_t off = 0, len = 0;
638 u_int32_t type = NFSV4LOCKT_READ;
639 int error, do_unlock, trycnt;
641 tcred = newnfs_getcred();
642 newnfs_copycred(&op->nfso_cred, tcred);
644 * (Theoretically this could be done in the same
645 * compound as the close, but having multiple
646 * sequenced Ops in the same compound might be
647 * too scary for some servers.)
649 if (op->nfso_posixlock) {
652 type = NFSV4LOCKT_READ;
656 * Since this function is only called from VOP_INACTIVE(), no
657 * other thread will be manipulating this Open. As such, the
658 * lock lists are not being changed by other threads, so it should
659 * be safe to do this without locking.
661 LIST_FOREACH(lp, &op->nfso_lock, nfsl_list) {
663 LIST_FOREACH_SAFE(lop, &lp->nfsl_lock, nfslo_list, nlop) {
664 if (op->nfso_posixlock == 0) {
665 off = lop->nfslo_first;
666 len = lop->nfslo_end - lop->nfslo_first;
667 if (lop->nfslo_type == F_WRLCK)
668 type = NFSV4LOCKT_WRITE;
670 type = NFSV4LOCKT_READ;
675 error = nfsrpc_locku(nd, nmp, lp, off,
676 len, type, tcred, p, 0);
677 if ((nd->nd_repstat == NFSERR_GRACE ||
678 nd->nd_repstat == NFSERR_DELAY) &&
680 (void) nfs_catnap(PZERO,
683 } while ((nd->nd_repstat == NFSERR_GRACE ||
684 nd->nd_repstat == NFSERR_DELAY) &&
685 error == 0 && trycnt++ < 5);
686 if (op->nfso_posixlock)
689 nfscl_freelock(lop, 0);
692 * Do a ReleaseLockOwner.
693 * The lock owner name nfsl_owner may be used by other opens for
694 * other files but the lock_owner4 name that nfsrpc_rellockown()
695 * puts on the wire has the file handle for this file appended
696 * to it, so it can be done now.
698 (void)nfsrpc_rellockown(nmp, lp, lp->nfsl_open->nfso_fh,
699 lp->nfsl_open->nfso_fhlen, tcred, p);
703 * There could be other Opens for different files on the same
704 * OpenOwner, so locking is required.
707 nfscl_lockexcl(&op->nfso_own->nfsow_rwlock, NFSCLSTATEMUTEXPTR);
710 error = nfscl_tryclose(op, tcred, nmp, p);
711 if (error == NFSERR_GRACE)
712 (void) nfs_catnap(PZERO, error, "nfs_close");
713 } while (error == NFSERR_GRACE);
715 nfscl_lockunlock(&op->nfso_own->nfsow_rwlock);
717 LIST_FOREACH_SAFE(lp, &op->nfso_lock, nfsl_list, nlp)
718 nfscl_freelockowner(lp, 0);
719 nfscl_freeopen(op, 0);
725 * The actual Close RPC.
728 nfsrpc_closerpc(struct nfsrv_descript *nd, struct nfsmount *nmp,
729 struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p,
735 nfscl_reqstart(nd, NFSPROC_CLOSE, nmp, op->nfso_fh,
736 op->nfso_fhlen, NULL, NULL);
737 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
738 *tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
739 if (NFSHASNFSV4N(nmp))
742 *tl++ = op->nfso_stateid.seqid;
743 *tl++ = op->nfso_stateid.other[0];
744 *tl++ = op->nfso_stateid.other[1];
745 *tl = op->nfso_stateid.other[2];
747 nd->nd_flag |= ND_USEGSSNAME;
748 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
749 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
752 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
753 if (nd->nd_repstat == 0)
754 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
755 error = nd->nd_repstat;
756 if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
757 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
759 mbuf_freem(nd->nd_mrep);
764 * V4 Open Confirm RPC.
767 nfsrpc_openconfirm(vnode_t vp, u_int8_t *nfhp, int fhlen,
768 struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p)
771 struct nfsrv_descript nfsd, *nd = &nfsd;
772 struct nfsmount *nmp;
775 nmp = VFSTONFS(vnode_mount(vp));
776 if (NFSHASNFSV4N(nmp))
777 return (0); /* No confirmation for NFSv4.1. */
778 nfscl_reqstart(nd, NFSPROC_OPENCONFIRM, nmp, nfhp, fhlen, NULL, NULL);
779 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
780 *tl++ = op->nfso_stateid.seqid;
781 *tl++ = op->nfso_stateid.other[0];
782 *tl++ = op->nfso_stateid.other[1];
783 *tl++ = op->nfso_stateid.other[2];
784 *tl = txdr_unsigned(op->nfso_own->nfsow_seqid);
785 error = nfscl_request(nd, vp, p, cred, NULL);
788 NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
789 if (!nd->nd_repstat) {
790 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
791 op->nfso_stateid.seqid = *tl++;
792 op->nfso_stateid.other[0] = *tl++;
793 op->nfso_stateid.other[1] = *tl++;
794 op->nfso_stateid.other[2] = *tl;
796 error = nd->nd_repstat;
797 if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
798 nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
800 mbuf_freem(nd->nd_mrep);
805 * Do the setclientid and setclientid confirm RPCs. Called from nfs_statfs()
806 * when a mount has just occurred and when the server replies NFSERR_EXPIRED.
809 nfsrpc_setclient(struct nfsmount *nmp, struct nfsclclient *clp, int reclaim,
810 struct ucred *cred, NFSPROC_T *p)
813 struct nfsrv_descript nfsd;
814 struct nfsrv_descript *nd = &nfsd;
815 nfsattrbit_t attrbits;
816 u_int8_t *cp = NULL, *cp2, addr[INET6_ADDRSTRLEN + 9];
818 int error, isinet6 = 0, callblen;
821 static u_int32_t rev = 0;
822 struct nfsclds *dsp, *ndsp, *tdsp;
824 if (nfsboottime.tv_sec == 0)
825 NFSSETBOOTTIME(nfsboottime);
826 clp->nfsc_rev = rev++;
827 if (NFSHASNFSV4N(nmp)) {
828 error = nfsrpc_exchangeid(nmp, clp, &nmp->nm_sockreq,
829 NFSV4EXCH_USEPNFSMDS | NFSV4EXCH_USENONPNFS, &dsp, cred, p);
830 NFSCL_DEBUG(1, "aft exch=%d\n", error);
832 error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
834 dsp->nfsclds_sess.nfsess_sequenceid, 1, cred, p);
837 TAILQ_FOREACH_SAFE(tdsp, &nmp->nm_sess,
839 nfscl_freenfsclds(tdsp);
840 TAILQ_INIT(&nmp->nm_sess);
841 TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp,
845 nfscl_freenfsclds(dsp);
846 NFSCL_DEBUG(1, "aft createsess=%d\n", error);
848 if (error == 0 && reclaim == 0) {
849 error = nfsrpc_reclaimcomplete(nmp, cred, p);
850 NFSCL_DEBUG(1, "aft reclaimcomp=%d\n", error);
851 if (error == NFSERR_COMPLETEALREADY ||
852 error == NFSERR_NOTSUPP)
853 /* Ignore this error. */
860 * Allocate a single session structure for NFSv4.0, because some of
861 * the fields are used by NFSv4.0 although it doesn't do a session.
863 dsp = malloc(sizeof(struct nfsclds), M_NFSCLDS, M_WAITOK | M_ZERO);
864 mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
865 mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession", NULL, MTX_DEF);
867 TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp, nfsclds_list);
870 nfscl_reqstart(nd, NFSPROC_SETCLIENTID, nmp, NULL, 0, NULL, NULL);
871 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
872 *tl++ = txdr_unsigned(nfsboottime.tv_sec);
873 *tl = txdr_unsigned(clp->nfsc_rev);
874 (void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
877 * set up the callback address
879 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
880 *tl = txdr_unsigned(NFS_CALLBCKPROG);
881 callblen = strlen(nfsv4_callbackaddr);
883 cp = nfscl_getmyip(nmp, &isinet6);
884 if (nfscl_enablecallb && nfs_numnfscbd > 0 &&
885 (callblen > 0 || cp != NULL)) {
886 port = htons(nfsv4_cbport);
887 cp2 = (u_int8_t *)&port;
890 strchr(nfsv4_callbackaddr, ':')) || isinet6) {
891 char ip6buf[INET6_ADDRSTRLEN], *ip6add;
893 (void) nfsm_strtom(nd, "tcp6", 4);
895 ip6_sprintf(ip6buf, (struct in6_addr *)cp);
898 ip6add = nfsv4_callbackaddr;
900 snprintf(addr, INET6_ADDRSTRLEN + 9, "%s.%d.%d",
901 ip6add, cp2[0], cp2[1]);
905 (void) nfsm_strtom(nd, "tcp", 3);
907 snprintf(addr, INET6_ADDRSTRLEN + 9,
908 "%d.%d.%d.%d.%d.%d", cp[0], cp[1],
909 cp[2], cp[3], cp2[0], cp2[1]);
911 snprintf(addr, INET6_ADDRSTRLEN + 9,
912 "%s.%d.%d", nfsv4_callbackaddr,
915 (void) nfsm_strtom(nd, addr, strlen(addr));
917 (void) nfsm_strtom(nd, "tcp", 3);
918 (void) nfsm_strtom(nd, "0.0.0.0.0.0", 11);
920 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
921 *tl = txdr_unsigned(clp->nfsc_cbident);
922 nd->nd_flag |= ND_USEGSSNAME;
923 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
924 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
927 if (nd->nd_repstat == 0) {
928 NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
929 NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0] = *tl++;
930 NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1] = *tl++;
931 confirm.lval[0] = *tl++;
932 confirm.lval[1] = *tl;
933 mbuf_freem(nd->nd_mrep);
939 nfscl_reqstart(nd, NFSPROC_SETCLIENTIDCFRM, nmp, NULL, 0, NULL,
941 NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
942 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
943 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
944 *tl++ = confirm.lval[0];
945 *tl = confirm.lval[1];
946 nd->nd_flag |= ND_USEGSSNAME;
947 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
948 cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
951 mbuf_freem(nd->nd_mrep);
953 if (nd->nd_repstat == 0) {
954 nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, nmp->nm_fh,
955 nmp->nm_fhsize, NULL, NULL);
956 NFSZERO_ATTRBIT(&attrbits);
957 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
958 (void) nfsrv_putattrbit(nd, &attrbits);
959 nd->nd_flag |= ND_USEGSSNAME;
960 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
961 cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
964 if (nd->nd_repstat == 0) {
965 error = nfsv4_loadattr(nd, NULL, NULL, NULL, NULL, 0, NULL,
966 NULL, NULL, NULL, NULL, 0, NULL, &lease, NULL, p, cred);
969 clp->nfsc_renew = NFSCL_RENEW(lease);
970 clp->nfsc_expire = NFSD_MONOSEC + clp->nfsc_renew;
971 clp->nfsc_clientidrev++;
972 if (clp->nfsc_clientidrev == 0)
973 clp->nfsc_clientidrev++;
977 error = nd->nd_repstat;
979 mbuf_freem(nd->nd_mrep);
987 nfsrpc_getattr(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
988 struct nfsvattr *nap, void *stuff)
990 struct nfsrv_descript nfsd, *nd = &nfsd;
992 nfsattrbit_t attrbits;
994 NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
995 if (nd->nd_flag & ND_NFSV4) {
996 NFSGETATTR_ATTRBIT(&attrbits);
997 (void) nfsrv_putattrbit(nd, &attrbits);
999 error = nfscl_request(nd, vp, p, cred, stuff);
1002 if (!nd->nd_repstat)
1003 error = nfsm_loadattr(nd, nap);
1005 error = nd->nd_repstat;
1006 mbuf_freem(nd->nd_mrep);
1011 * nfs getattr call with non-vnode arguemnts.
1014 nfsrpc_getattrnovp(struct nfsmount *nmp, u_int8_t *fhp, int fhlen, int syscred,
1015 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, u_int64_t *xidp,
1018 struct nfsrv_descript nfsd, *nd = &nfsd;
1019 int error, vers = NFS_VER2;
1020 nfsattrbit_t attrbits;
1022 nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, fhp, fhlen, NULL, NULL);
1023 if (nd->nd_flag & ND_NFSV4) {
1025 NFSGETATTR_ATTRBIT(&attrbits);
1026 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
1027 (void) nfsrv_putattrbit(nd, &attrbits);
1028 } else if (nd->nd_flag & ND_NFSV3) {
1032 nd->nd_flag |= ND_USEGSSNAME;
1033 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
1034 NFS_PROG, vers, NULL, 1, xidp, NULL);
1037 if (nd->nd_repstat == 0) {
1038 if ((nd->nd_flag & ND_NFSV4) != 0)
1039 error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
1040 NULL, NULL, NULL, NULL, NULL, 0, NULL, leasep, NULL,
1043 error = nfsm_loadattr(nd, nap);
1045 error = nd->nd_repstat;
1046 mbuf_freem(nd->nd_mrep);
1051 * Do an nfs setattr operation.
1054 nfsrpc_setattr(vnode_t vp, struct vattr *vap, NFSACL_T *aclp,
1055 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *rnap, int *attrflagp,
1058 int error, expireret = 0, openerr, retrycnt;
1059 u_int32_t clidrev = 0, mode;
1060 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1062 nfsv4stateid_t stateid;
1065 if (nmp->nm_clp != NULL)
1066 clidrev = nmp->nm_clp->nfsc_clientidrev;
1067 if (vap != NULL && NFSATTRISSET(u_quad_t, vap, va_size))
1068 mode = NFSV4OPEN_ACCESSWRITE;
1070 mode = NFSV4OPEN_ACCESSREAD;
1075 if (NFSHASNFSV4(nmp)) {
1076 nfhp = VTONFS(vp)->n_fhp;
1077 error = nfscl_getstateid(vp, nfhp->nfh_fh,
1078 nfhp->nfh_len, mode, 0, cred, p, &stateid, &lckp);
1079 if (error && vnode_vtype(vp) == VREG &&
1080 (mode == NFSV4OPEN_ACCESSWRITE ||
1081 nfstest_openallsetattr)) {
1083 * No Open stateid, so try and open the file
1086 if (mode == NFSV4OPEN_ACCESSWRITE)
1087 openerr = nfsrpc_open(vp, FWRITE, cred,
1090 openerr = nfsrpc_open(vp, FREAD, cred,
1093 (void) nfscl_getstateid(vp,
1094 nfhp->nfh_fh, nfhp->nfh_len,
1095 mode, 0, cred, p, &stateid, &lckp);
1099 error = nfsrpc_setattrrpc(vp, vap, &stateid, cred, p,
1100 rnap, attrflagp, stuff);
1102 error = nfsrpc_setaclrpc(vp, cred, p, aclp, &stateid,
1104 if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1105 nfscl_initiate_recovery(nmp->nm_clp);
1107 nfscl_lockderef(lckp);
1109 (void) nfsrpc_close(vp, 0, p);
1110 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1111 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1112 error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1113 (void) nfs_catnap(PZERO, error, "nfs_setattr");
1114 } else if ((error == NFSERR_EXPIRED ||
1115 error == NFSERR_BADSTATEID) && clidrev != 0) {
1116 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1119 } while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1120 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1121 error == NFSERR_BADSESSION ||
1122 (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1123 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1124 expireret == 0 && clidrev != 0 && retrycnt < 4));
1125 if (error && retrycnt >= 4)
1131 nfsrpc_setattrrpc(vnode_t vp, struct vattr *vap,
1132 nfsv4stateid_t *stateidp, struct ucred *cred, NFSPROC_T *p,
1133 struct nfsvattr *rnap, int *attrflagp, void *stuff)
1136 struct nfsrv_descript nfsd, *nd = &nfsd;
1138 nfsattrbit_t attrbits;
1141 NFSCL_REQSTART(nd, NFSPROC_SETATTR, vp);
1142 if (nd->nd_flag & ND_NFSV4)
1143 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1144 vap->va_type = vnode_vtype(vp);
1145 nfscl_fillsattr(nd, vap, vp, NFSSATTR_FULL, 0);
1146 if (nd->nd_flag & ND_NFSV3) {
1147 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1149 } else if (nd->nd_flag & ND_NFSV4) {
1150 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1151 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1152 NFSGETATTR_ATTRBIT(&attrbits);
1153 (void) nfsrv_putattrbit(nd, &attrbits);
1155 error = nfscl_request(nd, vp, p, cred, stuff);
1158 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1159 error = nfscl_wcc_data(nd, vp, rnap, attrflagp, NULL, stuff);
1160 if ((nd->nd_flag & ND_NFSV4) && !error)
1161 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
1162 if (!(nd->nd_flag & ND_NFSV3) && !nd->nd_repstat && !error)
1163 error = nfscl_postop_attr(nd, rnap, attrflagp, stuff);
1164 mbuf_freem(nd->nd_mrep);
1165 if (nd->nd_repstat && !error)
1166 error = nd->nd_repstat;
1174 nfsrpc_lookup(vnode_t dvp, char *name, int len, struct ucred *cred,
1175 NFSPROC_T *p, struct nfsvattr *dnap, struct nfsvattr *nap,
1176 struct nfsfh **nfhpp, int *attrflagp, int *dattrflagp, void *stuff)
1179 struct nfsrv_descript nfsd, *nd = &nfsd;
1180 struct nfsmount *nmp;
1183 nfsattrbit_t attrbits;
1184 int error = 0, lookupp = 0;
1188 if (vnode_vtype(dvp) != VDIR)
1190 nmp = VFSTONFS(vnode_mount(dvp));
1191 if (len > NFS_MAXNAMLEN)
1192 return (ENAMETOOLONG);
1193 if (NFSHASNFSV4(nmp) && len == 1 &&
1196 * Just return the current dir's fh.
1199 MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1200 np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1201 nfhp->nfh_len = np->n_fhp->nfh_len;
1202 NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1206 if (NFSHASNFSV4(nmp) && len == 2 &&
1207 name[0] == '.' && name[1] == '.') {
1209 NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, dvp);
1211 NFSCL_REQSTART(nd, NFSPROC_LOOKUP, dvp);
1212 (void) nfsm_strtom(nd, name, len);
1214 if (nd->nd_flag & ND_NFSV4) {
1215 NFSGETATTR_ATTRBIT(&attrbits);
1216 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1217 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
1218 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1219 (void) nfsrv_putattrbit(nd, &attrbits);
1221 error = nfscl_request(nd, dvp, p, cred, stuff);
1224 if (nd->nd_repstat) {
1226 * When an NFSv4 Lookupp returns ENOENT, it means that
1227 * the lookup is at the root of an fs, so return this dir.
1229 if (nd->nd_repstat == NFSERR_NOENT && lookupp) {
1231 MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1232 np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1233 nfhp->nfh_len = np->n_fhp->nfh_len;
1234 NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1236 mbuf_freem(nd->nd_mrep);
1239 if (nd->nd_flag & ND_NFSV3)
1240 error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1243 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
1244 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1246 nd->nd_flag |= ND_NOMOREDATA;
1250 error = nfsm_getfh(nd, nfhpp);
1254 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1255 if ((nd->nd_flag & ND_NFSV3) && !error)
1256 error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1258 mbuf_freem(nd->nd_mrep);
1259 if (!error && nd->nd_repstat)
1260 error = nd->nd_repstat;
1265 * Do a readlink rpc.
1268 nfsrpc_readlink(vnode_t vp, struct uio *uiop, struct ucred *cred,
1269 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1272 struct nfsrv_descript nfsd, *nd = &nfsd;
1273 struct nfsnode *np = VTONFS(vp);
1274 nfsattrbit_t attrbits;
1275 int error, len, cangetattr = 1;
1278 NFSCL_REQSTART(nd, NFSPROC_READLINK, vp);
1279 if (nd->nd_flag & ND_NFSV4) {
1281 * And do a Getattr op.
1283 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1284 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1285 NFSGETATTR_ATTRBIT(&attrbits);
1286 (void) nfsrv_putattrbit(nd, &attrbits);
1288 error = nfscl_request(nd, vp, p, cred, stuff);
1291 if (nd->nd_flag & ND_NFSV3)
1292 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1293 if (!nd->nd_repstat && !error) {
1294 NFSM_STRSIZ(len, NFS_MAXPATHLEN);
1296 * This seems weird to me, but must have been added to
1297 * FreeBSD for some reason. The only thing I can think of
1298 * is that there was/is some server that replies with
1299 * more link data than it should?
1301 if (len == NFS_MAXPATHLEN) {
1303 if (np->n_size > 0 && np->n_size < NFS_MAXPATHLEN) {
1309 error = nfsm_mbufuio(nd, uiop, len);
1310 if ((nd->nd_flag & ND_NFSV4) && !error && cangetattr)
1311 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1313 if (nd->nd_repstat && !error)
1314 error = nd->nd_repstat;
1316 mbuf_freem(nd->nd_mrep);
1324 nfsrpc_read(vnode_t vp, struct uio *uiop, struct ucred *cred,
1325 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1327 int error, expireret = 0, retrycnt;
1328 u_int32_t clidrev = 0;
1329 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1330 struct nfsnode *np = VTONFS(vp);
1331 struct ucred *newcred;
1332 struct nfsfh *nfhp = NULL;
1333 nfsv4stateid_t stateid;
1336 if (nmp->nm_clp != NULL)
1337 clidrev = nmp->nm_clp->nfsc_clientidrev;
1339 if (NFSHASNFSV4(nmp)) {
1341 newcred = NFSNEWCRED(cred);
1346 if (NFSHASNFSV4(nmp))
1347 (void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1348 NFSV4OPEN_ACCESSREAD, 0, newcred, p, &stateid,
1350 error = nfsrpc_readrpc(vp, uiop, newcred, &stateid, p, nap,
1352 if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1353 nfscl_initiate_recovery(nmp->nm_clp);
1355 nfscl_lockderef(lckp);
1356 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1357 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1358 error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1359 (void) nfs_catnap(PZERO, error, "nfs_read");
1360 } else if ((error == NFSERR_EXPIRED ||
1361 error == NFSERR_BADSTATEID) && clidrev != 0) {
1362 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1365 } while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1366 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1367 error == NFSERR_BADSESSION ||
1368 (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1369 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1370 expireret == 0 && clidrev != 0 && retrycnt < 4));
1371 if (error && retrycnt >= 4)
1373 if (NFSHASNFSV4(nmp))
1374 NFSFREECRED(newcred);
1379 * The actual read RPC.
1382 nfsrpc_readrpc(vnode_t vp, struct uio *uiop, struct ucred *cred,
1383 nfsv4stateid_t *stateidp, NFSPROC_T *p, struct nfsvattr *nap,
1384 int *attrflagp, void *stuff)
1387 int error = 0, len, retlen, tsiz, eof = 0;
1388 struct nfsrv_descript nfsd;
1389 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1390 struct nfsrv_descript *nd = &nfsd;
1395 tsiz = uio_uio_resid(uiop);
1396 tmp_off = uiop->uio_offset + tsiz;
1398 if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1402 rsize = nmp->nm_rsize;
1407 len = (tsiz > rsize) ? rsize : tsiz;
1408 NFSCL_REQSTART(nd, NFSPROC_READ, vp);
1409 if (nd->nd_flag & ND_NFSV4)
1410 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1411 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED * 3);
1412 if (nd->nd_flag & ND_NFSV2) {
1413 *tl++ = txdr_unsigned(uiop->uio_offset);
1414 *tl++ = txdr_unsigned(len);
1417 txdr_hyper(uiop->uio_offset, tl);
1418 *(tl + 2) = txdr_unsigned(len);
1421 * Since I can't do a Getattr for NFSv4 for Write, there
1422 * doesn't seem any point in doing one here, either.
1423 * (See the comment in nfsrpc_writerpc() for more info.)
1425 error = nfscl_request(nd, vp, p, cred, stuff);
1428 if (nd->nd_flag & ND_NFSV3) {
1429 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1430 } else if (!nd->nd_repstat && (nd->nd_flag & ND_NFSV2)) {
1431 error = nfsm_loadattr(nd, nap);
1435 if (nd->nd_repstat || error) {
1437 error = nd->nd_repstat;
1440 if (nd->nd_flag & ND_NFSV3) {
1441 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1442 eof = fxdr_unsigned(int, *(tl + 1));
1443 } else if (nd->nd_flag & ND_NFSV4) {
1444 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
1445 eof = fxdr_unsigned(int, *tl);
1447 NFSM_STRSIZ(retlen, len);
1448 error = nfsm_mbufuio(nd, uiop, retlen);
1451 mbuf_freem(nd->nd_mrep);
1454 if (!(nd->nd_flag & ND_NFSV2)) {
1455 if (eof || retlen == 0)
1457 } else if (retlen < len)
1462 if (nd->nd_mrep != NULL)
1463 mbuf_freem(nd->nd_mrep);
1468 * nfs write operation
1469 * When called_from_strategy != 0, it should return EIO for an error that
1470 * indicates recovery is in progress, so that the buffer will be left
1471 * dirty and be written back to the server later. If it loops around,
1472 * the recovery thread could get stuck waiting for the buffer and recovery
1473 * will then deadlock.
1476 nfsrpc_write(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
1477 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
1478 void *stuff, int called_from_strategy)
1480 int error, expireret = 0, retrycnt, nostateid;
1481 u_int32_t clidrev = 0;
1482 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1483 struct nfsnode *np = VTONFS(vp);
1484 struct ucred *newcred;
1485 struct nfsfh *nfhp = NULL;
1486 nfsv4stateid_t stateid;
1490 if (nmp->nm_clp != NULL)
1491 clidrev = nmp->nm_clp->nfsc_clientidrev;
1493 if (NFSHASNFSV4(nmp)) {
1494 newcred = NFSNEWCRED(cred);
1501 if (NFSHASNFSV4(nmp)) {
1502 (void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1503 NFSV4OPEN_ACCESSWRITE, 0, newcred, p, &stateid,
1505 if (stateid.other[0] == 0 && stateid.other[1] == 0 &&
1506 stateid.other[2] == 0) {
1508 NFSCL_DEBUG(1, "stateid0 in write\n");
1513 * If there is no stateid for NFSv4, it means this is an
1514 * extraneous write after close. Basically a poorly
1515 * implemented buffer cache. Just don't do the write.
1520 error = nfsrpc_writerpc(vp, uiop, iomode, must_commit,
1521 newcred, &stateid, p, nap, attrflagp, stuff);
1522 if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1523 nfscl_initiate_recovery(nmp->nm_clp);
1525 nfscl_lockderef(lckp);
1526 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1527 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1528 error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1529 (void) nfs_catnap(PZERO, error, "nfs_write");
1530 } else if ((error == NFSERR_EXPIRED ||
1531 error == NFSERR_BADSTATEID) && clidrev != 0) {
1532 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1535 } while (error == NFSERR_GRACE || error == NFSERR_DELAY ||
1536 ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1537 error == NFSERR_STALEDONTRECOVER) && called_from_strategy == 0) ||
1538 (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1539 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1540 expireret == 0 && clidrev != 0 && retrycnt < 4));
1541 if (error != 0 && (retrycnt >= 4 ||
1542 ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1543 error == NFSERR_STALEDONTRECOVER) && called_from_strategy != 0)))
1545 if (NFSHASNFSV4(nmp))
1546 NFSFREECRED(newcred);
1551 * The actual write RPC.
1554 nfsrpc_writerpc(vnode_t vp, struct uio *uiop, int *iomode,
1555 int *must_commit, struct ucred *cred, nfsv4stateid_t *stateidp,
1556 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1559 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1560 struct nfsnode *np = VTONFS(vp);
1561 int error = 0, len, tsiz, rlen, commit, committed = NFSWRITE_FILESYNC;
1562 int wccflag = 0, wsize;
1564 struct nfsrv_descript nfsd;
1565 struct nfsrv_descript *nd = &nfsd;
1566 nfsattrbit_t attrbits;
1569 KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
1571 tsiz = uio_uio_resid(uiop);
1572 tmp_off = uiop->uio_offset + tsiz;
1574 if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1578 wsize = nmp->nm_wsize;
1580 nd->nd_mrep = NULL; /* NFSv2 sometimes does a write with */
1581 nd->nd_repstat = 0; /* uio_resid == 0, so the while is not done */
1584 len = (tsiz > wsize) ? wsize : tsiz;
1585 NFSCL_REQSTART(nd, NFSPROC_WRITE, vp);
1586 if (nd->nd_flag & ND_NFSV4) {
1587 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1588 NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+2*NFSX_UNSIGNED);
1589 txdr_hyper(uiop->uio_offset, tl);
1591 *tl++ = txdr_unsigned(*iomode);
1592 *tl = txdr_unsigned(len);
1593 } else if (nd->nd_flag & ND_NFSV3) {
1594 NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+3*NFSX_UNSIGNED);
1595 txdr_hyper(uiop->uio_offset, tl);
1597 *tl++ = txdr_unsigned(len);
1598 *tl++ = txdr_unsigned(*iomode);
1599 *tl = txdr_unsigned(len);
1603 NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
1605 * Not sure why someone changed this, since the
1606 * RFC clearly states that "beginoffset" and
1607 * "totalcount" are ignored, but it wouldn't
1608 * surprise me if there's a busted server out there.
1610 /* Set both "begin" and "current" to non-garbage. */
1611 x = txdr_unsigned((u_int32_t)uiop->uio_offset);
1612 *tl++ = x; /* "begin offset" */
1613 *tl++ = x; /* "current offset" */
1614 x = txdr_unsigned(len);
1615 *tl++ = x; /* total to this offset */
1616 *tl = x; /* size of this write */
1619 nfsm_uiombuf(nd, uiop, len);
1621 * Although it is tempting to do a normal Getattr Op in the
1622 * NFSv4 compound, the result can be a nearly hung client
1623 * system if the Getattr asks for Owner and/or OwnerGroup.
1624 * It occurs when the client can't map either the Owner or
1625 * Owner_group name in the Getattr reply to a uid/gid. When
1626 * there is a cache miss, the kernel does an upcall to the
1627 * nfsuserd. Then, it can try and read the local /etc/passwd
1628 * or /etc/group file. It can then block in getnewbuf(),
1629 * waiting for dirty writes to be pushed to the NFS server.
1630 * The only reason this doesn't result in a complete
1631 * deadlock, is that the upcall times out and allows
1632 * the write to complete. However, progress is so slow
1633 * that it might just as well be deadlocked.
1634 * As such, we get the rest of the attributes, but not
1635 * Owner or Owner_group.
1636 * nb: nfscl_loadattrcache() needs to be told that these
1637 * partial attributes from a write rpc are being
1638 * passed in, via a argument flag.
1640 if (nd->nd_flag & ND_NFSV4) {
1641 NFSWRITEGETATTR_ATTRBIT(&attrbits);
1642 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1643 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1644 (void) nfsrv_putattrbit(nd, &attrbits);
1646 error = nfscl_request(nd, vp, p, cred, stuff);
1649 if (nd->nd_repstat) {
1651 * In case the rpc gets retried, roll
1652 * the uio fileds changed by nfsm_uiombuf()
1655 uiop->uio_offset -= len;
1656 uio_uio_resid_add(uiop, len);
1657 uio_iov_base_add(uiop, -len);
1658 uio_iov_len_add(uiop, len);
1660 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1661 error = nfscl_wcc_data(nd, vp, nap, attrflagp,
1666 if (!nd->nd_repstat) {
1667 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1668 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED
1670 rlen = fxdr_unsigned(int, *tl++);
1674 } else if (rlen < len) {
1675 backup = len - rlen;
1676 uio_iov_base_add(uiop, -(backup));
1677 uio_iov_len_add(uiop, backup);
1678 uiop->uio_offset -= backup;
1679 uio_uio_resid_add(uiop, backup);
1682 commit = fxdr_unsigned(int, *tl++);
1685 * Return the lowest committment level
1686 * obtained by any of the RPCs.
1688 if (committed == NFSWRITE_FILESYNC)
1690 else if (committed == NFSWRITE_DATASYNC &&
1691 commit == NFSWRITE_UNSTABLE)
1694 if (!NFSHASWRITEVERF(nmp)) {
1695 NFSBCOPY((caddr_t)tl,
1696 (caddr_t)&nmp->nm_verf[0],
1698 NFSSETWRITEVERF(nmp);
1699 } else if (NFSBCMP(tl, nmp->nm_verf,
1702 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
1706 if (nd->nd_flag & ND_NFSV4)
1707 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1708 if (nd->nd_flag & (ND_NFSV2 | ND_NFSV4)) {
1709 error = nfsm_loadattr(nd, nap);
1711 *attrflagp = NFS_LATTR_NOSHRINK;
1714 error = nd->nd_repstat;
1718 NFSWRITERPC_SETTIME(wccflag, np, (nd->nd_flag & ND_NFSV4));
1719 mbuf_freem(nd->nd_mrep);
1724 if (nd->nd_mrep != NULL)
1725 mbuf_freem(nd->nd_mrep);
1726 *iomode = committed;
1727 if (nd->nd_repstat && !error)
1728 error = nd->nd_repstat;
1734 * For NFS v2 this is a kludge. Use a create rpc but with the IFMT bits of the
1735 * mode set to specify the file type and the size field for rdev.
1738 nfsrpc_mknod(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1739 u_int32_t rdev, enum vtype vtyp, struct ucred *cred, NFSPROC_T *p,
1740 struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1741 int *attrflagp, int *dattrflagp, void *dstuff)
1745 struct nfsrv_descript nfsd, *nd = &nfsd;
1746 nfsattrbit_t attrbits;
1751 if (namelen > NFS_MAXNAMLEN)
1752 return (ENAMETOOLONG);
1753 NFSCL_REQSTART(nd, NFSPROC_MKNOD, dvp);
1754 if (nd->nd_flag & ND_NFSV4) {
1755 if (vtyp == VBLK || vtyp == VCHR) {
1756 NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
1757 *tl++ = vtonfsv34_type(vtyp);
1758 *tl++ = txdr_unsigned(NFSMAJOR(rdev));
1759 *tl = txdr_unsigned(NFSMINOR(rdev));
1761 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1762 *tl = vtonfsv34_type(vtyp);
1765 (void) nfsm_strtom(nd, name, namelen);
1766 if (nd->nd_flag & ND_NFSV3) {
1767 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1768 *tl = vtonfsv34_type(vtyp);
1770 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1771 nfscl_fillsattr(nd, vap, dvp, 0, 0);
1772 if ((nd->nd_flag & ND_NFSV3) &&
1773 (vtyp == VCHR || vtyp == VBLK)) {
1774 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1775 *tl++ = txdr_unsigned(NFSMAJOR(rdev));
1776 *tl = txdr_unsigned(NFSMINOR(rdev));
1778 if (nd->nd_flag & ND_NFSV4) {
1779 NFSGETATTR_ATTRBIT(&attrbits);
1780 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1781 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
1782 *tl = txdr_unsigned(NFSV4OP_GETATTR);
1783 (void) nfsrv_putattrbit(nd, &attrbits);
1785 if (nd->nd_flag & ND_NFSV2)
1786 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZERDEV, rdev);
1787 error = nfscl_request(nd, dvp, p, cred, dstuff);
1790 if (nd->nd_flag & ND_NFSV4)
1791 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1792 if (!nd->nd_repstat) {
1793 if (nd->nd_flag & ND_NFSV4) {
1794 NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
1795 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
1799 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1803 if (nd->nd_flag & ND_NFSV3)
1804 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1805 if (!error && nd->nd_repstat)
1806 error = nd->nd_repstat;
1808 mbuf_freem(nd->nd_mrep);
1813 * nfs file create call
1814 * Mostly just call the approriate routine. (I separated out v4, so that
1815 * error recovery wouldn't be as difficult.)
1818 nfsrpc_create(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1819 nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1820 struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1821 int *attrflagp, int *dattrflagp, void *dstuff)
1823 int error = 0, newone, expireret = 0, retrycnt, unlocked;
1824 struct nfsclowner *owp;
1825 struct nfscldeleg *dp;
1826 struct nfsmount *nmp = VFSTONFS(vnode_mount(dvp));
1829 if (NFSHASNFSV4(nmp)) {
1833 error = nfscl_open(dvp, NULL, 0, (NFSV4OPEN_ACCESSWRITE |
1834 NFSV4OPEN_ACCESSREAD), 0, cred, p, &owp, NULL, &newone,
1838 if (nmp->nm_clp != NULL)
1839 clidrev = nmp->nm_clp->nfsc_clientidrev;
1842 error = nfsrpc_createv4(dvp, name, namelen, vap, cverf, fmode,
1843 owp, &dp, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1846 * There is no need to invalidate cached attributes here,
1847 * since new post-delegation issue attributes are always
1848 * returned by nfsrpc_createv4() and these will update the
1852 (void) nfscl_deleg(nmp->nm_mountp, owp->nfsow_clp,
1853 (*nfhpp)->nfh_fh, (*nfhpp)->nfh_len, cred, p, &dp);
1854 nfscl_ownerrelease(owp, error, newone, unlocked);
1855 if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1856 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1857 error == NFSERR_BADSESSION) {
1858 (void) nfs_catnap(PZERO, error, "nfs_open");
1859 } else if ((error == NFSERR_EXPIRED ||
1860 error == NFSERR_BADSTATEID) && clidrev != 0) {
1861 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1864 } while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1865 error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1866 error == NFSERR_BADSESSION ||
1867 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1868 expireret == 0 && clidrev != 0 && retrycnt < 4));
1869 if (error && retrycnt >= 4)
1872 error = nfsrpc_createv23(dvp, name, namelen, vap, cverf,
1873 fmode, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1880 * The create rpc for v2 and 3.
1883 nfsrpc_createv23(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1884 nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1885 struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1886 int *attrflagp, int *dattrflagp, void *dstuff)
1890 struct nfsrv_descript nfsd, *nd = &nfsd;
1895 if (namelen > NFS_MAXNAMLEN)
1896 return (ENAMETOOLONG);
1897 NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
1898 (void) nfsm_strtom(nd, name, namelen);
1899 if (nd->nd_flag & ND_NFSV3) {
1900 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1901 if (fmode & O_EXCL) {
1902 *tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
1903 NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1904 *tl++ = cverf.lval[0];
1905 *tl = cverf.lval[1];
1907 *tl = txdr_unsigned(NFSCREATE_UNCHECKED);
1908 nfscl_fillsattr(nd, vap, dvp, 0, 0);
1911 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZE0, 0);
1913 error = nfscl_request(nd, dvp, p, cred, dstuff);
1916 if (nd->nd_repstat == 0) {
1917 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1921 if (nd->nd_flag & ND_NFSV3)
1922 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1923 if (nd->nd_repstat != 0 && error == 0)
1924 error = nd->nd_repstat;
1926 mbuf_freem(nd->nd_mrep);
1931 nfsrpc_createv4(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1932 nfsquad_t cverf, int fmode, struct nfsclowner *owp, struct nfscldeleg **dpp,
1933 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
1934 struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
1935 int *dattrflagp, void *dstuff, int *unlockedp)
1938 int error = 0, deleg, newone, ret, acesize, limitby;
1939 struct nfsrv_descript nfsd, *nd = &nfsd;
1940 struct nfsclopen *op;
1941 struct nfscldeleg *dp = NULL;
1944 nfsattrbit_t attrbits;
1945 nfsv4stateid_t stateid;
1947 struct nfsmount *nmp;
1949 nmp = VFSTONFS(dvp->v_mount);
1955 if (namelen > NFS_MAXNAMLEN)
1956 return (ENAMETOOLONG);
1957 NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
1959 * For V4, this is actually an Open op.
1961 NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
1962 *tl++ = txdr_unsigned(owp->nfsow_seqid);
1963 *tl++ = txdr_unsigned(NFSV4OPEN_ACCESSWRITE |
1964 NFSV4OPEN_ACCESSREAD);
1965 *tl++ = txdr_unsigned(NFSV4OPEN_DENYNONE);
1966 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
1967 *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
1968 (void) nfsm_strtom(nd, owp->nfsow_owner, NFSV4CL_LOCKNAMELEN);
1969 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1970 *tl++ = txdr_unsigned(NFSV4OPEN_CREATE);
1971 if (fmode & O_EXCL) {
1972 if (NFSHASNFSV4N(nmp)) {
1973 if (NFSHASSESSPERSIST(nmp)) {
1974 /* Use GUARDED for persistent sessions. */
1975 *tl = txdr_unsigned(NFSCREATE_GUARDED);
1976 nfscl_fillsattr(nd, vap, dvp, 0, 0);
1978 /* Otherwise, use EXCLUSIVE4_1. */
1979 *tl = txdr_unsigned(NFSCREATE_EXCLUSIVE41);
1980 NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1981 *tl++ = cverf.lval[0];
1982 *tl = cverf.lval[1];
1983 nfscl_fillsattr(nd, vap, dvp, 0, 0);
1987 *tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
1988 NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1989 *tl++ = cverf.lval[0];
1990 *tl = cverf.lval[1];
1993 *tl = txdr_unsigned(NFSCREATE_UNCHECKED);
1994 nfscl_fillsattr(nd, vap, dvp, 0, 0);
1996 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1997 *tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
1998 (void) nfsm_strtom(nd, name, namelen);
1999 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2000 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
2001 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2002 NFSGETATTR_ATTRBIT(&attrbits);
2003 (void) nfsrv_putattrbit(nd, &attrbits);
2004 error = nfscl_request(nd, dvp, p, cred, dstuff);
2007 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2010 NFSCL_INCRSEQID(owp->nfsow_seqid, nd);
2011 if (nd->nd_repstat == 0) {
2012 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
2014 stateid.seqid = *tl++;
2015 stateid.other[0] = *tl++;
2016 stateid.other[1] = *tl++;
2017 stateid.other[2] = *tl;
2018 rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
2019 (void) nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2020 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2021 deleg = fxdr_unsigned(int, *tl);
2022 if (deleg == NFSV4OPEN_DELEGATEREAD ||
2023 deleg == NFSV4OPEN_DELEGATEWRITE) {
2024 if (!(owp->nfsow_clp->nfsc_flags &
2025 NFSCLFLAGS_FIRSTDELEG))
2026 owp->nfsow_clp->nfsc_flags |=
2027 (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
2028 MALLOC(dp, struct nfscldeleg *,
2029 sizeof (struct nfscldeleg) + NFSX_V4FHMAX,
2030 M_NFSCLDELEG, M_WAITOK);
2031 LIST_INIT(&dp->nfsdl_owner);
2032 LIST_INIT(&dp->nfsdl_lock);
2033 dp->nfsdl_clp = owp->nfsow_clp;
2034 newnfs_copyincred(cred, &dp->nfsdl_cred);
2035 nfscl_lockinit(&dp->nfsdl_rwlock);
2036 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
2038 dp->nfsdl_stateid.seqid = *tl++;
2039 dp->nfsdl_stateid.other[0] = *tl++;
2040 dp->nfsdl_stateid.other[1] = *tl++;
2041 dp->nfsdl_stateid.other[2] = *tl++;
2042 ret = fxdr_unsigned(int, *tl);
2043 if (deleg == NFSV4OPEN_DELEGATEWRITE) {
2044 dp->nfsdl_flags = NFSCLDL_WRITE;
2046 * Indicates how much the file can grow.
2048 NFSM_DISSECT(tl, u_int32_t *,
2050 limitby = fxdr_unsigned(int, *tl++);
2052 case NFSV4OPEN_LIMITSIZE:
2053 dp->nfsdl_sizelimit = fxdr_hyper(tl);
2055 case NFSV4OPEN_LIMITBLOCKS:
2056 dp->nfsdl_sizelimit =
2057 fxdr_unsigned(u_int64_t, *tl++);
2058 dp->nfsdl_sizelimit *=
2059 fxdr_unsigned(u_int64_t, *tl);
2062 error = NFSERR_BADXDR;
2066 dp->nfsdl_flags = NFSCLDL_READ;
2069 dp->nfsdl_flags |= NFSCLDL_RECALL;
2070 error = nfsrv_dissectace(nd, &dp->nfsdl_ace, &ret,
2074 } else if (deleg != NFSV4OPEN_DELEGATENONE) {
2075 error = NFSERR_BADXDR;
2078 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2081 if (dp != NULL && *attrflagp) {
2082 dp->nfsdl_change = nnap->na_filerev;
2083 dp->nfsdl_modtime = nnap->na_mtime;
2084 dp->nfsdl_flags |= NFSCLDL_MODTIMESET;
2087 * We can now complete the Open state.
2091 dp->nfsdl_fhlen = nfhp->nfh_len;
2092 NFSBCOPY(nfhp->nfh_fh, dp->nfsdl_fh, nfhp->nfh_len);
2095 * Get an Open structure that will be
2096 * attached to the OpenOwner, acquired already.
2098 error = nfscl_open(dvp, nfhp->nfh_fh, nfhp->nfh_len,
2099 (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), 0,
2100 cred, p, NULL, &op, &newone, NULL, 0);
2103 op->nfso_stateid = stateid;
2104 newnfs_copyincred(cred, &op->nfso_cred);
2105 if ((rflags & NFSV4OPEN_RESULTCONFIRM)) {
2107 ret = nfsrpc_openconfirm(dvp, nfhp->nfh_fh,
2108 nfhp->nfh_len, op, cred, p);
2109 if (ret == NFSERR_DELAY)
2110 (void) nfs_catnap(PZERO, ret, "nfs_create");
2111 } while (ret == NFSERR_DELAY);
2116 * If the server is handing out delegations, but we didn't
2117 * get one because an OpenConfirm was required, try the
2118 * Open again, to get a delegation. This is a harmless no-op,
2119 * from a server's point of view.
2121 if ((rflags & NFSV4OPEN_RESULTCONFIRM) &&
2122 (owp->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG) &&
2123 !error && dp == NULL) {
2126 ret = nfsrpc_openrpc(VFSTONFS(vnode_mount(dvp)), dvp,
2127 np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
2128 nfhp->nfh_fh, nfhp->nfh_len,
2129 (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), op,
2130 name, namelen, &dp, 0, 0x0, cred, p, 0, 1);
2131 if (ret == NFSERR_DELAY)
2132 (void) nfs_catnap(PZERO, ret, "nfs_crt2");
2133 } while (ret == NFSERR_DELAY);
2136 FREE((caddr_t)dp, M_NFSCLDELEG);
2137 if (ret == NFSERR_STALECLIENTID ||
2138 ret == NFSERR_STALEDONTRECOVER ||
2139 ret == NFSERR_BADSESSION)
2143 nfscl_openrelease(op, error, newone);
2146 if (nd->nd_repstat != 0 && error == 0)
2147 error = nd->nd_repstat;
2148 if (error == NFSERR_STALECLIENTID || error == NFSERR_BADSESSION)
2149 nfscl_initiate_recovery(owp->nfsow_clp);
2153 else if (dp != NULL)
2154 FREE((caddr_t)dp, M_NFSCLDELEG);
2155 mbuf_freem(nd->nd_mrep);
2163 nfsrpc_remove(vnode_t dvp, char *name, int namelen, vnode_t vp,
2164 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp,
2168 struct nfsrv_descript nfsd, *nd = &nfsd;
2170 struct nfsmount *nmp;
2171 nfsv4stateid_t dstateid;
2172 int error, ret = 0, i;
2175 if (namelen > NFS_MAXNAMLEN)
2176 return (ENAMETOOLONG);
2177 nmp = VFSTONFS(vnode_mount(dvp));
2179 if (NFSHASNFSV4(nmp) && ret == 0) {
2180 ret = nfscl_removedeleg(vp, p, &dstateid);
2182 NFSCL_REQSTART(nd, NFSPROC_RETDELEGREMOVE, vp);
2183 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
2185 if (NFSHASNFSV4N(nmp))
2188 *tl++ = dstateid.seqid;
2189 *tl++ = dstateid.other[0];
2190 *tl++ = dstateid.other[1];
2191 *tl++ = dstateid.other[2];
2192 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2194 (void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2195 np->n_fhp->nfh_len, 0);
2196 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2197 *tl = txdr_unsigned(NFSV4OP_REMOVE);
2203 NFSCL_REQSTART(nd, NFSPROC_REMOVE, dvp);
2204 (void) nfsm_strtom(nd, name, namelen);
2205 error = nfscl_request(nd, dvp, p, cred, dstuff);
2208 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2209 /* For NFSv4, parse out any Delereturn replies. */
2210 if (ret > 0 && nd->nd_repstat != 0 &&
2211 (nd->nd_flag & ND_NOMOREDATA)) {
2213 * If the Delegreturn failed, try again without
2214 * it. The server will Recall, as required.
2216 mbuf_freem(nd->nd_mrep);
2219 for (i = 0; i < (ret * 2); i++) {
2220 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2222 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2224 nd->nd_flag |= ND_NOMOREDATA;
2227 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2229 if (nd->nd_repstat && !error)
2230 error = nd->nd_repstat;
2232 mbuf_freem(nd->nd_mrep);
2237 * Do an nfs rename rpc.
2240 nfsrpc_rename(vnode_t fdvp, vnode_t fvp, char *fnameptr, int fnamelen,
2241 vnode_t tdvp, vnode_t tvp, char *tnameptr, int tnamelen, struct ucred *cred,
2242 NFSPROC_T *p, struct nfsvattr *fnap, struct nfsvattr *tnap,
2243 int *fattrflagp, int *tattrflagp, void *fstuff, void *tstuff)
2246 struct nfsrv_descript nfsd, *nd = &nfsd;
2247 struct nfsmount *nmp;
2249 nfsattrbit_t attrbits;
2250 nfsv4stateid_t fdstateid, tdstateid;
2251 int error = 0, ret = 0, gottd = 0, gotfd = 0, i;
2255 nmp = VFSTONFS(vnode_mount(fdvp));
2256 if (fnamelen > NFS_MAXNAMLEN || tnamelen > NFS_MAXNAMLEN)
2257 return (ENAMETOOLONG);
2259 if (NFSHASNFSV4(nmp) && ret == 0) {
2260 ret = nfscl_renamedeleg(fvp, &fdstateid, &gotfd, tvp,
2261 &tdstateid, &gottd, p);
2262 if (gotfd && gottd) {
2263 NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME2, fvp);
2265 NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, fvp);
2267 NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, tvp);
2270 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2271 if (NFSHASNFSV4N(nmp))
2274 *tl++ = fdstateid.seqid;
2275 *tl++ = fdstateid.other[0];
2276 *tl++ = fdstateid.other[1];
2277 *tl = fdstateid.other[2];
2279 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2280 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2282 (void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2283 np->n_fhp->nfh_len, 0);
2284 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2285 *tl = txdr_unsigned(NFSV4OP_DELEGRETURN);
2289 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2290 if (NFSHASNFSV4N(nmp))
2293 *tl++ = tdstateid.seqid;
2294 *tl++ = tdstateid.other[0];
2295 *tl++ = tdstateid.other[1];
2296 *tl = tdstateid.other[2];
2299 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2300 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2302 (void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2303 np->n_fhp->nfh_len, 0);
2304 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2305 *tl = txdr_unsigned(NFSV4OP_SAVEFH);
2311 NFSCL_REQSTART(nd, NFSPROC_RENAME, fdvp);
2312 if (nd->nd_flag & ND_NFSV4) {
2313 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2314 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2315 NFSWCCATTR_ATTRBIT(&attrbits);
2316 (void) nfsrv_putattrbit(nd, &attrbits);
2317 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2318 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2319 (void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2320 VTONFS(tdvp)->n_fhp->nfh_len, 0);
2321 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2322 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2323 (void) nfsrv_putattrbit(nd, &attrbits);
2324 nd->nd_flag |= ND_V4WCCATTR;
2325 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2326 *tl = txdr_unsigned(NFSV4OP_RENAME);
2328 (void) nfsm_strtom(nd, fnameptr, fnamelen);
2329 if (!(nd->nd_flag & ND_NFSV4))
2330 (void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2331 VTONFS(tdvp)->n_fhp->nfh_len, 0);
2332 (void) nfsm_strtom(nd, tnameptr, tnamelen);
2333 error = nfscl_request(nd, fdvp, p, cred, fstuff);
2336 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2337 /* For NFSv4, parse out any Delereturn replies. */
2338 if (ret > 0 && nd->nd_repstat != 0 &&
2339 (nd->nd_flag & ND_NOMOREDATA)) {
2341 * If the Delegreturn failed, try again without
2342 * it. The server will Recall, as required.
2344 mbuf_freem(nd->nd_mrep);
2347 for (i = 0; i < (ret * 2); i++) {
2348 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2350 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2352 if (i == 0 && ret > 1) {
2354 * If the Delegreturn failed, try again
2355 * without it. The server will Recall, as
2357 * If ret > 1, the first iteration of this
2358 * loop is the second DelegReturn result.
2360 mbuf_freem(nd->nd_mrep);
2363 nd->nd_flag |= ND_NOMOREDATA;
2368 /* Now, the first wcc attribute reply. */
2369 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2370 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2372 nd->nd_flag |= ND_NOMOREDATA;
2374 error = nfscl_wcc_data(nd, fdvp, fnap, fattrflagp, NULL,
2376 /* and the second wcc attribute reply. */
2377 if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4 &&
2379 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2381 nd->nd_flag |= ND_NOMOREDATA;
2384 error = nfscl_wcc_data(nd, tdvp, tnap, tattrflagp,
2387 if (nd->nd_repstat && !error)
2388 error = nd->nd_repstat;
2390 mbuf_freem(nd->nd_mrep);
2395 * nfs hard link create rpc
2398 nfsrpc_link(vnode_t dvp, vnode_t vp, char *name, int namelen,
2399 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2400 struct nfsvattr *nap, int *attrflagp, int *dattrflagp, void *dstuff)
2403 struct nfsrv_descript nfsd, *nd = &nfsd;
2404 nfsattrbit_t attrbits;
2409 if (namelen > NFS_MAXNAMLEN)
2410 return (ENAMETOOLONG);
2411 NFSCL_REQSTART(nd, NFSPROC_LINK, vp);
2412 if (nd->nd_flag & ND_NFSV4) {
2413 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2414 *tl = txdr_unsigned(NFSV4OP_PUTFH);
2416 (void) nfsm_fhtom(nd, VTONFS(dvp)->n_fhp->nfh_fh,
2417 VTONFS(dvp)->n_fhp->nfh_len, 0);
2418 if (nd->nd_flag & ND_NFSV4) {
2419 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2420 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2421 NFSWCCATTR_ATTRBIT(&attrbits);
2422 (void) nfsrv_putattrbit(nd, &attrbits);
2423 nd->nd_flag |= ND_V4WCCATTR;
2424 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2425 *tl = txdr_unsigned(NFSV4OP_LINK);
2427 (void) nfsm_strtom(nd, name, namelen);
2428 error = nfscl_request(nd, vp, p, cred, dstuff);
2431 if (nd->nd_flag & ND_NFSV3) {
2432 error = nfscl_postop_attr(nd, nap, attrflagp, dstuff);
2434 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
2436 } else if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2438 * First, parse out the PutFH and Getattr result.
2440 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2442 NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2444 nd->nd_flag |= ND_NOMOREDATA;
2446 * Get the pre-op attributes.
2448 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2450 if (nd->nd_repstat && !error)
2451 error = nd->nd_repstat;
2453 mbuf_freem(nd->nd_mrep);
2458 * nfs symbolic link create rpc
2461 nfsrpc_symlink(vnode_t dvp, char *name, int namelen, char *target,
2462 struct vattr *vap, struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2463 struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2464 int *dattrflagp, void *dstuff)
2467 struct nfsrv_descript nfsd, *nd = &nfsd;
2468 struct nfsmount *nmp;
2469 int slen, error = 0;
2474 nmp = VFSTONFS(vnode_mount(dvp));
2475 slen = strlen(target);
2476 if (slen > NFS_MAXPATHLEN || namelen > NFS_MAXNAMLEN)
2477 return (ENAMETOOLONG);
2478 NFSCL_REQSTART(nd, NFSPROC_SYMLINK, dvp);
2479 if (nd->nd_flag & ND_NFSV4) {
2480 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2481 *tl = txdr_unsigned(NFLNK);
2482 (void) nfsm_strtom(nd, target, slen);
2484 (void) nfsm_strtom(nd, name, namelen);
2485 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2486 nfscl_fillsattr(nd, vap, dvp, 0, 0);
2487 if (!(nd->nd_flag & ND_NFSV4))
2488 (void) nfsm_strtom(nd, target, slen);
2489 if (nd->nd_flag & ND_NFSV2)
2490 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
2491 error = nfscl_request(nd, dvp, p, cred, dstuff);
2494 if (nd->nd_flag & ND_NFSV4)
2495 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2496 if ((nd->nd_flag & ND_NFSV3) && !error) {
2497 if (!nd->nd_repstat)
2498 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2500 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
2503 if (nd->nd_repstat && !error)
2504 error = nd->nd_repstat;
2505 mbuf_freem(nd->nd_mrep);
2507 * Kludge: Map EEXIST => 0 assuming that it is a reply to a retry.
2509 if (error == EEXIST)
2518 nfsrpc_mkdir(vnode_t dvp, char *name, int namelen, struct vattr *vap,
2519 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2520 struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2521 int *dattrflagp, void *dstuff)
2524 struct nfsrv_descript nfsd, *nd = &nfsd;
2525 nfsattrbit_t attrbits;
2531 if (namelen > NFS_MAXNAMLEN)
2532 return (ENAMETOOLONG);
2533 NFSCL_REQSTART(nd, NFSPROC_MKDIR, dvp);
2534 if (nd->nd_flag & ND_NFSV4) {
2535 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2536 *tl = txdr_unsigned(NFDIR);
2538 (void) nfsm_strtom(nd, name, namelen);
2539 nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
2540 if (nd->nd_flag & ND_NFSV4) {
2541 NFSGETATTR_ATTRBIT(&attrbits);
2542 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2543 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
2544 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2545 (void) nfsrv_putattrbit(nd, &attrbits);
2547 error = nfscl_request(nd, dvp, p, cred, dstuff);
2550 if (nd->nd_flag & ND_NFSV4)
2551 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2552 if (!nd->nd_repstat && !error) {
2553 if (nd->nd_flag & ND_NFSV4) {
2554 NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
2555 error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2558 error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2560 if ((nd->nd_flag & ND_NFSV3) && !error)
2561 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2562 if (nd->nd_repstat && !error)
2563 error = nd->nd_repstat;
2565 mbuf_freem(nd->nd_mrep);
2567 * Kludge: Map EEXIST => 0 assuming that you have a reply to a retry.
2569 if (error == EEXIST)
2575 * nfs remove directory call
2578 nfsrpc_rmdir(vnode_t dvp, char *name, int namelen, struct ucred *cred,
2579 NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp, void *dstuff)
2581 struct nfsrv_descript nfsd, *nd = &nfsd;
2585 if (namelen > NFS_MAXNAMLEN)
2586 return (ENAMETOOLONG);
2587 NFSCL_REQSTART(nd, NFSPROC_RMDIR, dvp);
2588 (void) nfsm_strtom(nd, name, namelen);
2589 error = nfscl_request(nd, dvp, p, cred, dstuff);
2592 if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2593 error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2594 if (nd->nd_repstat && !error)
2595 error = nd->nd_repstat;
2596 mbuf_freem(nd->nd_mrep);
2598 * Kludge: Map ENOENT => 0 assuming that you have a reply to a retry.
2600 if (error == ENOENT)
2607 * Always returns with either uio_resid unchanged, if you are at the
2608 * end of the directory, or uio_resid == 0, with all DIRBLKSIZ chunks
2610 * I felt this would allow caching of directory blocks more easily
2611 * than returning a pertially filled block.
2612 * Directory offset cookies:
2613 * Oh my, what to do with them...
2614 * I can think of three ways to deal with them:
2615 * 1 - have the layer above these RPCs maintain a map between logical
2616 * directory byte offsets and the NFS directory offset cookies
2617 * 2 - pass the opaque directory offset cookies up into userland
2618 * and let the libc functions deal with them, via the system call
2619 * 3 - return them to userland in the "struct dirent", so future versions
2620 * of libc can use them and do whatever is necessary to amke things work
2621 * above these rpc calls, in the meantime
2622 * For now, I do #3 by "hiding" the directory offset cookies after the
2623 * d_name field in struct dirent. This is space inside d_reclen that
2624 * will be ignored by anything that doesn't know about them.
2625 * The directory offset cookies are filled in as the last 8 bytes of
2626 * each directory entry, after d_name. Someday, the userland libc
2627 * functions may be able to use these. In the meantime, it satisfies
2628 * OpenBSD's requirements for cookies being returned.
2629 * If expects the directory offset cookie for the read to be in uio_offset
2630 * and returns the one for the next entry after this directory block in
2634 nfsrpc_readdir(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
2635 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
2636 int *eofp, void *stuff)
2639 struct dirent *dp = NULL;
2641 nfsquad_t cookie, ncookie;
2642 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
2643 struct nfsnode *dnp = VTONFS(vp);
2644 struct nfsvattr nfsva;
2645 struct nfsrv_descript nfsd, *nd = &nfsd;
2646 int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
2647 int reqsize, tryformoredirs = 1, readsize, eof = 0, gotmnton = 0;
2648 long dotfileid, dotdotfileid = 0;
2649 u_int32_t fakefileno = 0xffffffff, rderr;
2651 nfsattrbit_t attrbits, dattrbits;
2652 u_int32_t *tl2 = NULL;
2655 KASSERT(uiop->uio_iovcnt == 1 &&
2656 (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
2657 ("nfs readdirrpc bad uio"));
2660 * There is no point in reading a lot more than uio_resid, however
2661 * adding one additional DIRBLKSIZ makes sense. Since uio_resid
2662 * and nm_readdirsize are both exact multiples of DIRBLKSIZ, this
2663 * will never make readsize > nm_readdirsize.
2665 readsize = nmp->nm_readdirsize;
2666 if (readsize > uio_uio_resid(uiop))
2667 readsize = uio_uio_resid(uiop) + DIRBLKSIZ;
2672 tresid = uio_uio_resid(uiop);
2673 cookie.lval[0] = cookiep->nfsuquad[0];
2674 cookie.lval[1] = cookiep->nfsuquad[1];
2678 * For NFSv4, first create the "." and ".." entries.
2680 if (NFSHASNFSV4(nmp)) {
2681 reqsize = 6 * NFSX_UNSIGNED;
2682 NFSGETATTR_ATTRBIT(&dattrbits);
2683 NFSZERO_ATTRBIT(&attrbits);
2684 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
2685 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TYPE);
2686 if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
2687 NFSATTRBIT_MOUNTEDONFILEID)) {
2688 NFSSETBIT_ATTRBIT(&attrbits,
2689 NFSATTRBIT_MOUNTEDONFILEID);
2693 * Must fake it. Use the fileno, except when the
2694 * fsid is != to that of the directory. For that
2695 * case, generate a fake fileno that is not the same.
2697 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
2702 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
2704 if (uiop->uio_offset == 0) {
2705 #if defined(__FreeBSD_version) && __FreeBSD_version >= 800000
2706 error = VOP_GETATTR(vp, &nfsva.na_vattr, cred);
2708 error = VOP_GETATTR(vp, &nfsva.na_vattr, cred, p);
2712 dotfileid = nfsva.na_fileid;
2713 NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
2714 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2715 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
2716 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2717 (void) nfsrv_putattrbit(nd, &attrbits);
2718 error = nfscl_request(nd, vp, p, cred, stuff);
2721 if (nd->nd_repstat == 0) {
2722 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2723 len = fxdr_unsigned(int, *(tl + 2));
2724 if (len > 0 && len <= NFSX_V4FHMAX)
2725 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
2729 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2730 nfsva.na_mntonfileno = 0xffffffff;
2731 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
2732 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
2733 NULL, NULL, NULL, p, cred);
2735 dotdotfileid = dotfileid;
2736 } else if (gotmnton) {
2737 if (nfsva.na_mntonfileno != 0xffffffff)
2738 dotdotfileid = nfsva.na_mntonfileno;
2740 dotdotfileid = nfsva.na_fileid;
2741 } else if (nfsva.na_filesid[0] ==
2742 dnp->n_vattr.na_filesid[0] &&
2743 nfsva.na_filesid[1] ==
2744 dnp->n_vattr.na_filesid[1]) {
2745 dotdotfileid = nfsva.na_fileid;
2749 } while (fakefileno ==
2751 dotdotfileid = fakefileno;
2754 } else if (nd->nd_repstat == NFSERR_NOENT) {
2756 * Lookupp returns NFSERR_NOENT when we are
2757 * at the root, so just use the current dir.
2760 dotdotfileid = dotfileid;
2762 error = nd->nd_repstat;
2764 mbuf_freem(nd->nd_mrep);
2768 dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2769 dp->d_type = DT_DIR;
2770 dp->d_fileno = dotfileid;
2772 dp->d_name[0] = '.';
2773 dp->d_name[1] = '\0';
2774 dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
2776 * Just make these offset cookie 0.
2778 tl = (u_int32_t *)&dp->d_name[4];
2781 blksiz += dp->d_reclen;
2782 uio_uio_resid_add(uiop, -(dp->d_reclen));
2783 uiop->uio_offset += dp->d_reclen;
2784 uio_iov_base_add(uiop, dp->d_reclen);
2785 uio_iov_len_add(uiop, -(dp->d_reclen));
2786 dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2787 dp->d_type = DT_DIR;
2788 dp->d_fileno = dotdotfileid;
2790 dp->d_name[0] = '.';
2791 dp->d_name[1] = '.';
2792 dp->d_name[2] = '\0';
2793 dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
2795 * Just make these offset cookie 0.
2797 tl = (u_int32_t *)&dp->d_name[4];
2800 blksiz += dp->d_reclen;
2801 uio_uio_resid_add(uiop, -(dp->d_reclen));
2802 uiop->uio_offset += dp->d_reclen;
2803 uio_iov_base_add(uiop, dp->d_reclen);
2804 uio_iov_len_add(uiop, -(dp->d_reclen));
2806 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_RDATTRERROR);
2808 reqsize = 5 * NFSX_UNSIGNED;
2813 * Loop around doing readdir rpc's of size readsize.
2814 * The stopping criteria is EOF or buffer full.
2816 while (more_dirs && bigenough) {
2818 NFSCL_REQSTART(nd, NFSPROC_READDIR, vp);
2819 if (nd->nd_flag & ND_NFSV2) {
2820 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2821 *tl++ = cookie.lval[1];
2822 *tl = txdr_unsigned(readsize);
2824 NFSM_BUILD(tl, u_int32_t *, reqsize);
2825 *tl++ = cookie.lval[0];
2826 *tl++ = cookie.lval[1];
2827 if (cookie.qval == 0) {
2832 *tl++ = dnp->n_cookieverf.nfsuquad[0];
2833 *tl++ = dnp->n_cookieverf.nfsuquad[1];
2836 if (nd->nd_flag & ND_NFSV4) {
2837 *tl++ = txdr_unsigned(readsize);
2838 *tl = txdr_unsigned(readsize);
2839 (void) nfsrv_putattrbit(nd, &attrbits);
2840 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2841 *tl = txdr_unsigned(NFSV4OP_GETATTR);
2842 (void) nfsrv_putattrbit(nd, &dattrbits);
2844 *tl = txdr_unsigned(readsize);
2847 error = nfscl_request(nd, vp, p, cred, stuff);
2850 if (!(nd->nd_flag & ND_NFSV2)) {
2851 if (nd->nd_flag & ND_NFSV3)
2852 error = nfscl_postop_attr(nd, nap, attrflagp,
2854 if (!nd->nd_repstat && !error) {
2855 NFSM_DISSECT(tl, u_int32_t *, NFSX_HYPER);
2857 dnp->n_cookieverf.nfsuquad[0] = *tl++;
2858 dnp->n_cookieverf.nfsuquad[1] = *tl;
2862 if (nd->nd_repstat || error) {
2864 error = nd->nd_repstat;
2867 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2868 more_dirs = fxdr_unsigned(int, *tl);
2872 /* loop thru the dir entries, doctoring them to 4bsd form */
2873 while (more_dirs && bigenough) {
2874 if (nd->nd_flag & ND_NFSV4) {
2875 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2876 ncookie.lval[0] = *tl++;
2877 ncookie.lval[1] = *tl++;
2878 len = fxdr_unsigned(int, *tl);
2879 } else if (nd->nd_flag & ND_NFSV3) {
2880 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2881 nfsva.na_fileid = fxdr_hyper(tl);
2883 len = fxdr_unsigned(int, *tl);
2885 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2887 fxdr_unsigned(long, *tl++);
2888 len = fxdr_unsigned(int, *tl);
2890 if (len <= 0 || len > NFS_MAXNAMLEN) {
2894 tlen = NFSM_RNDUP(len);
2896 tlen += 4; /* To ensure null termination */
2897 left = DIRBLKSIZ - blksiz;
2898 if ((int)(tlen + DIRHDSIZ + NFSX_HYPER) > left) {
2899 dp->d_reclen += left;
2900 uio_iov_base_add(uiop, left);
2901 uio_iov_len_add(uiop, -(left));
2902 uio_uio_resid_add(uiop, -(left));
2903 uiop->uio_offset += left;
2906 if ((int)(tlen + DIRHDSIZ + NFSX_HYPER) > uio_uio_resid(uiop))
2909 dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2911 dp->d_reclen = tlen + DIRHDSIZ + NFSX_HYPER;
2912 dp->d_type = DT_UNKNOWN;
2913 blksiz += dp->d_reclen;
2914 if (blksiz == DIRBLKSIZ)
2916 uio_uio_resid_add(uiop, -(DIRHDSIZ));
2917 uiop->uio_offset += DIRHDSIZ;
2918 uio_iov_base_add(uiop, DIRHDSIZ);
2919 uio_iov_len_add(uiop, -(DIRHDSIZ));
2920 error = nfsm_mbufuio(nd, uiop, len);
2923 cp = CAST_DOWN(caddr_t, uio_iov_base(uiop));
2925 *cp = '\0'; /* null terminate */
2926 cp += tlen; /* points to cookie storage */
2927 tl2 = (u_int32_t *)cp;
2928 uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
2929 uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
2930 uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
2931 uiop->uio_offset += (tlen + NFSX_HYPER);
2933 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
2937 if (nd->nd_flag & ND_NFSV4) {
2939 nfsva.na_mntonfileno = 0xffffffff;
2940 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
2941 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
2942 NULL, NULL, &rderr, p, cred);
2945 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2946 } else if (nd->nd_flag & ND_NFSV3) {
2947 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2948 ncookie.lval[0] = *tl++;
2949 ncookie.lval[1] = *tl++;
2951 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2952 ncookie.lval[0] = 0;
2953 ncookie.lval[1] = *tl++;
2956 if (nd->nd_flag & ND_NFSV4) {
2961 if (nfsva.na_mntonfileno != 0xffffffff)
2962 dp->d_fileno = nfsva.na_mntonfileno;
2964 dp->d_fileno = nfsva.na_fileid;
2965 } else if (nfsva.na_filesid[0] ==
2966 dnp->n_vattr.na_filesid[0] &&
2967 nfsva.na_filesid[1] ==
2968 dnp->n_vattr.na_filesid[1]) {
2969 dp->d_fileno = nfsva.na_fileid;
2973 } while (fakefileno ==
2975 dp->d_fileno = fakefileno;
2977 dp->d_type = vtonfs_dtype(nfsva.na_type);
2980 dp->d_fileno = nfsva.na_fileid;
2982 *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
2984 *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
2987 more_dirs = fxdr_unsigned(int, *tl);
2990 * If at end of rpc data, get the eof boolean
2993 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2994 eof = fxdr_unsigned(int, *tl);
2997 if (nd->nd_flag & ND_NFSV4) {
2998 error = nfscl_postop_attr(nd, nap, attrflagp,
3004 mbuf_freem(nd->nd_mrep);
3008 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3009 * by increasing d_reclen for the last record.
3012 left = DIRBLKSIZ - blksiz;
3013 dp->d_reclen += left;
3014 uio_iov_base_add(uiop, left);
3015 uio_iov_len_add(uiop, -(left));
3016 uio_uio_resid_add(uiop, -(left));
3017 uiop->uio_offset += left;
3021 * If returning no data, assume end of file.
3022 * If not bigenough, return not end of file, since you aren't
3023 * returning all the data
3024 * Otherwise, return the eof flag from the server.
3027 if (tresid == ((size_t)(uio_uio_resid(uiop))))
3029 else if (!bigenough)
3036 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3038 while (uio_uio_resid(uiop) > 0 && ((size_t)(uio_uio_resid(uiop))) != tresid) {
3039 dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
3040 dp->d_type = DT_UNKNOWN;
3043 dp->d_name[0] = '\0';
3044 tl = (u_int32_t *)&dp->d_name[4];
3045 *tl++ = cookie.lval[0];
3046 *tl = cookie.lval[1];
3047 dp->d_reclen = DIRBLKSIZ;
3048 uio_iov_base_add(uiop, DIRBLKSIZ);
3049 uio_iov_len_add(uiop, -(DIRBLKSIZ));
3050 uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3051 uiop->uio_offset += DIRBLKSIZ;
3055 if (nd->nd_mrep != NULL)
3056 mbuf_freem(nd->nd_mrep);
3062 * NFS V3 readdir plus RPC. Used in place of nfsrpc_readdir().
3063 * (Also used for NFS V4 when mount flag set.)
3064 * (ditto above w.r.t. multiple of DIRBLKSIZ, etc.)
3067 nfsrpc_readdirplus(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
3068 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
3069 int *eofp, void *stuff)
3072 struct dirent *dp = NULL;
3074 vnode_t newvp = NULLVP;
3075 struct nfsrv_descript nfsd, *nd = &nfsd;
3076 struct nameidata nami, *ndp = &nami;
3077 struct componentname *cnp = &ndp->ni_cnd;
3078 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3079 struct nfsnode *dnp = VTONFS(vp), *np;
3080 struct nfsvattr nfsva;
3082 nfsquad_t cookie, ncookie;
3083 int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
3084 int attrflag, tryformoredirs = 1, eof = 0, gotmnton = 0;
3085 int isdotdot = 0, unlocknewvp = 0;
3086 long dotfileid, dotdotfileid = 0, fileno = 0;
3088 nfsattrbit_t attrbits, dattrbits;
3090 u_int32_t *tl2 = NULL, fakefileno = 0xffffffff, rderr;
3091 struct timespec dctime;
3093 KASSERT(uiop->uio_iovcnt == 1 &&
3094 (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
3095 ("nfs readdirplusrpc bad uio"));
3096 timespecclear(&dctime);
3102 cookie.lval[0] = cookiep->nfsuquad[0];
3103 cookie.lval[1] = cookiep->nfsuquad[1];
3104 tresid = uio_uio_resid(uiop);
3107 * For NFSv4, first create the "." and ".." entries.
3109 if (NFSHASNFSV4(nmp)) {
3110 NFSGETATTR_ATTRBIT(&dattrbits);
3111 NFSZERO_ATTRBIT(&attrbits);
3112 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
3113 if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
3114 NFSATTRBIT_MOUNTEDONFILEID)) {
3115 NFSSETBIT_ATTRBIT(&attrbits,
3116 NFSATTRBIT_MOUNTEDONFILEID);
3120 * Must fake it. Use the fileno, except when the
3121 * fsid is != to that of the directory. For that
3122 * case, generate a fake fileno that is not the same.
3124 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
3129 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
3131 if (uiop->uio_offset == 0) {
3132 #if defined(__FreeBSD_version) && __FreeBSD_version >= 800000
3133 error = VOP_GETATTR(vp, &nfsva.na_vattr, cred);
3135 error = VOP_GETATTR(vp, &nfsva.na_vattr, cred, p);
3139 dctime = nfsva.na_ctime;
3140 dotfileid = nfsva.na_fileid;
3141 NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
3142 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
3143 *tl++ = txdr_unsigned(NFSV4OP_GETFH);
3144 *tl = txdr_unsigned(NFSV4OP_GETATTR);
3145 (void) nfsrv_putattrbit(nd, &attrbits);
3146 error = nfscl_request(nd, vp, p, cred, stuff);
3149 if (nd->nd_repstat == 0) {
3150 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
3151 len = fxdr_unsigned(int, *(tl + 2));
3152 if (len > 0 && len <= NFSX_V4FHMAX)
3153 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3157 NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
3158 nfsva.na_mntonfileno = 0xffffffff;
3159 error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
3160 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3161 NULL, NULL, NULL, p, cred);
3163 dotdotfileid = dotfileid;
3164 } else if (gotmnton) {
3165 if (nfsva.na_mntonfileno != 0xffffffff)
3166 dotdotfileid = nfsva.na_mntonfileno;
3168 dotdotfileid = nfsva.na_fileid;
3169 } else if (nfsva.na_filesid[0] ==
3170 dnp->n_vattr.na_filesid[0] &&
3171 nfsva.na_filesid[1] ==
3172 dnp->n_vattr.na_filesid[1]) {
3173 dotdotfileid = nfsva.na_fileid;
3177 } while (fakefileno ==
3179 dotdotfileid = fakefileno;
3182 } else if (nd->nd_repstat == NFSERR_NOENT) {
3184 * Lookupp returns NFSERR_NOENT when we are
3185 * at the root, so just use the current dir.
3188 dotdotfileid = dotfileid;
3190 error = nd->nd_repstat;
3192 mbuf_freem(nd->nd_mrep);
3196 dp = (struct dirent *)uio_iov_base(uiop);
3197 dp->d_type = DT_DIR;
3198 dp->d_fileno = dotfileid;
3200 dp->d_name[0] = '.';
3201 dp->d_name[1] = '\0';
3202 dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
3204 * Just make these offset cookie 0.
3206 tl = (u_int32_t *)&dp->d_name[4];
3209 blksiz += dp->d_reclen;
3210 uio_uio_resid_add(uiop, -(dp->d_reclen));
3211 uiop->uio_offset += dp->d_reclen;
3212 uio_iov_base_add(uiop, dp->d_reclen);
3213 uio_iov_len_add(uiop, -(dp->d_reclen));
3214 dp = (struct dirent *)uio_iov_base(uiop);
3215 dp->d_type = DT_DIR;
3216 dp->d_fileno = dotdotfileid;
3218 dp->d_name[0] = '.';
3219 dp->d_name[1] = '.';
3220 dp->d_name[2] = '\0';
3221 dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
3223 * Just make these offset cookie 0.
3225 tl = (u_int32_t *)&dp->d_name[4];
3228 blksiz += dp->d_reclen;
3229 uio_uio_resid_add(uiop, -(dp->d_reclen));
3230 uiop->uio_offset += dp->d_reclen;
3231 uio_iov_base_add(uiop, dp->d_reclen);
3232 uio_iov_len_add(uiop, -(dp->d_reclen));
3234 NFSREADDIRPLUS_ATTRBIT(&attrbits);
3236 NFSSETBIT_ATTRBIT(&attrbits,
3237 NFSATTRBIT_MOUNTEDONFILEID);
3241 * Loop around doing readdir rpc's of size nm_readdirsize.
3242 * The stopping criteria is EOF or buffer full.
3244 while (more_dirs && bigenough) {
3246 NFSCL_REQSTART(nd, NFSPROC_READDIRPLUS, vp);
3247 NFSM_BUILD(tl, u_int32_t *, 6 * NFSX_UNSIGNED);
3248 *tl++ = cookie.lval[0];
3249 *tl++ = cookie.lval[1];
3250 if (cookie.qval == 0) {
3255 *tl++ = dnp->n_cookieverf.nfsuquad[0];
3256 *tl++ = dnp->n_cookieverf.nfsuquad[1];
3259 *tl++ = txdr_unsigned(nmp->nm_readdirsize);
3260 *tl = txdr_unsigned(nmp->nm_readdirsize);
3261 if (nd->nd_flag & ND_NFSV4) {
3262 (void) nfsrv_putattrbit(nd, &attrbits);
3263 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3264 *tl = txdr_unsigned(NFSV4OP_GETATTR);
3265 (void) nfsrv_putattrbit(nd, &dattrbits);
3267 error = nfscl_request(nd, vp, p, cred, stuff);
3270 if (nd->nd_flag & ND_NFSV3)
3271 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3272 if (nd->nd_repstat || error) {
3274 error = nd->nd_repstat;
3277 if ((nd->nd_flag & ND_NFSV3) != 0 && *attrflagp != 0)
3278 dctime = nap->na_ctime;
3279 NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3281 dnp->n_cookieverf.nfsuquad[0] = *tl++;
3282 dnp->n_cookieverf.nfsuquad[1] = *tl++;
3284 more_dirs = fxdr_unsigned(int, *tl);
3288 /* loop thru the dir entries, doctoring them to 4bsd form */
3289 while (more_dirs && bigenough) {
3290 NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3291 if (nd->nd_flag & ND_NFSV4) {
3292 ncookie.lval[0] = *tl++;
3293 ncookie.lval[1] = *tl++;
3295 fileno = fxdr_unsigned(long, *++tl);
3298 len = fxdr_unsigned(int, *tl);
3299 if (len <= 0 || len > NFS_MAXNAMLEN) {
3303 tlen = NFSM_RNDUP(len);
3305 tlen += 4; /* To ensure null termination */
3306 left = DIRBLKSIZ - blksiz;
3307 if ((tlen + DIRHDSIZ + NFSX_HYPER) > left) {
3308 dp->d_reclen += left;
3309 uio_iov_base_add(uiop, left);
3310 uio_iov_len_add(uiop, -(left));
3311 uio_uio_resid_add(uiop, -(left));
3312 uiop->uio_offset += left;
3315 if ((tlen + DIRHDSIZ + NFSX_HYPER) > uio_uio_resid(uiop))
3318 dp = (struct dirent *)uio_iov_base(uiop);
3320 dp->d_reclen = tlen + DIRHDSIZ + NFSX_HYPER;
3321 dp->d_type = DT_UNKNOWN;
3322 blksiz += dp->d_reclen;
3323 if (blksiz == DIRBLKSIZ)
3325 uio_uio_resid_add(uiop, -(DIRHDSIZ));
3326 uiop->uio_offset += DIRHDSIZ;
3327 uio_iov_base_add(uiop, DIRHDSIZ);
3328 uio_iov_len_add(uiop, -(DIRHDSIZ));
3329 cnp->cn_nameptr = uio_iov_base(uiop);
3330 cnp->cn_namelen = len;
3332 error = nfsm_mbufuio(nd, uiop, len);
3335 cp = uio_iov_base(uiop);
3338 cp += tlen; /* points to cookie storage */
3339 tl2 = (u_int32_t *)cp;
3340 if (len == 2 && cnp->cn_nameptr[0] == '.' &&
3341 cnp->cn_nameptr[1] == '.')
3345 uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
3346 uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
3347 uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
3348 uiop->uio_offset += (tlen + NFSX_HYPER);
3350 error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3355 if (nd->nd_flag & ND_NFSV3) {
3356 NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
3357 ncookie.lval[0] = *tl++;
3358 ncookie.lval[1] = *tl++;
3359 attrflag = fxdr_unsigned(int, *tl);
3361 error = nfsm_loadattr(nd, &nfsva);
3365 NFSM_DISSECT(tl,u_int32_t *,NFSX_UNSIGNED);
3367 error = nfsm_getfh(nd, &nfhp);
3371 if (!attrflag && nfhp != NULL) {
3372 FREE((caddr_t)nfhp, M_NFSFH);
3377 nfsva.na_mntonfileno = 0xffffffff;
3378 error = nfsv4_loadattr(nd, NULL, &nfsva, &nfhp,
3379 NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3380 NULL, NULL, &rderr, p, cred);
3386 if (nd->nd_flag & ND_NFSV4) {
3389 } else if (gotmnton) {
3390 if (nfsva.na_mntonfileno != 0xffffffff)
3391 dp->d_fileno = nfsva.na_mntonfileno;
3393 dp->d_fileno = nfsva.na_fileid;
3394 } else if (nfsva.na_filesid[0] ==
3395 dnp->n_vattr.na_filesid[0] &&
3396 nfsva.na_filesid[1] ==
3397 dnp->n_vattr.na_filesid[1]) {
3398 dp->d_fileno = nfsva.na_fileid;
3402 } while (fakefileno ==
3404 dp->d_fileno = fakefileno;
3407 dp->d_fileno = fileno;
3409 *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
3411 *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
3415 if (NFSRV_CMPFH(nfhp->nfh_fh, nfhp->nfh_len,
3416 dnp->n_fhp->nfh_fh, dnp->n_fhp->nfh_len)) {
3420 FREE((caddr_t)nfhp, M_NFSFH);
3422 } else if (isdotdot != 0) {
3424 * Skip doing a nfscl_nget() call for "..".
3425 * There's a race between acquiring the nfs
3426 * node here and lookups that look for the
3427 * directory being read (in the parent).
3428 * It would try to get a lock on ".." here,
3429 * owning the lock on the directory being
3430 * read. Lookup will hold the lock on ".."
3431 * and try to acquire the lock on the
3432 * directory being read.
3433 * If the directory is unlocked/relocked,
3434 * then there is a LOR with the buflock
3437 free(nfhp, M_NFSFH);
3439 error = nfscl_nget(vnode_mount(vp), vp,
3440 nfhp, cnp, p, &np, NULL, LK_EXCLUSIVE);
3447 if (newvp != NULLVP) {
3448 error = nfscl_loadattrcache(&newvp,
3449 &nfsva, NULL, NULL, 0, 0);
3458 vtonfs_dtype(np->n_vattr.na_type);
3460 NFSCNHASH(cnp, HASHINIT);
3461 if (cnp->cn_namelen <= NCHNAMLEN &&
3462 (newvp->v_type != VDIR ||
3463 dctime.tv_sec != 0)) {
3464 cache_enter_time(ndp->ni_dvp,
3467 newvp->v_type != VDIR ? NULL :
3477 } else if (nfhp != NULL) {
3478 FREE((caddr_t)nfhp, M_NFSFH);
3480 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3481 more_dirs = fxdr_unsigned(int, *tl);
3484 * If at end of rpc data, get the eof boolean
3487 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3488 eof = fxdr_unsigned(int, *tl);
3491 if (nd->nd_flag & ND_NFSV4) {
3492 error = nfscl_postop_attr(nd, nap, attrflagp,
3498 mbuf_freem(nd->nd_mrep);
3502 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3503 * by increasing d_reclen for the last record.
3506 left = DIRBLKSIZ - blksiz;
3507 dp->d_reclen += left;
3508 uio_iov_base_add(uiop, left);
3509 uio_iov_len_add(uiop, -(left));
3510 uio_uio_resid_add(uiop, -(left));
3511 uiop->uio_offset += left;
3515 * If returning no data, assume end of file.
3516 * If not bigenough, return not end of file, since you aren't
3517 * returning all the data
3518 * Otherwise, return the eof flag from the server.
3521 if (tresid == uio_uio_resid(uiop))
3523 else if (!bigenough)
3530 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3532 while (uio_uio_resid(uiop) > 0 && uio_uio_resid(uiop) != tresid) {
3533 dp = (struct dirent *)uio_iov_base(uiop);
3534 dp->d_type = DT_UNKNOWN;
3537 dp->d_name[0] = '\0';
3538 tl = (u_int32_t *)&dp->d_name[4];
3539 *tl++ = cookie.lval[0];
3540 *tl = cookie.lval[1];
3541 dp->d_reclen = DIRBLKSIZ;
3542 uio_iov_base_add(uiop, DIRBLKSIZ);
3543 uio_iov_len_add(uiop, -(DIRBLKSIZ));
3544 uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3545 uiop->uio_offset += DIRBLKSIZ;
3549 if (nd->nd_mrep != NULL)
3550 mbuf_freem(nd->nd_mrep);
3559 nfsrpc_commit(vnode_t vp, u_quad_t offset, int cnt, struct ucred *cred,
3560 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
3563 struct nfsrv_descript nfsd, *nd = &nfsd;
3564 nfsattrbit_t attrbits;
3566 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3569 NFSCL_REQSTART(nd, NFSPROC_COMMIT, vp);
3570 NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3571 txdr_hyper(offset, tl);
3573 *tl = txdr_unsigned(cnt);
3574 if (nd->nd_flag & ND_NFSV4) {
3576 * And do a Getattr op.
3578 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3579 *tl = txdr_unsigned(NFSV4OP_GETATTR);
3580 NFSGETATTR_ATTRBIT(&attrbits);
3581 (void) nfsrv_putattrbit(nd, &attrbits);
3583 error = nfscl_request(nd, vp, p, cred, stuff);
3586 error = nfscl_wcc_data(nd, vp, nap, attrflagp, NULL, stuff);
3587 if (!error && !nd->nd_repstat) {
3588 NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
3590 if (NFSBCMP(nmp->nm_verf, tl, NFSX_VERF)) {
3591 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
3592 nd->nd_repstat = NFSERR_STALEWRITEVERF;
3595 if (nd->nd_flag & ND_NFSV4)
3596 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3599 if (!error && nd->nd_repstat)
3600 error = nd->nd_repstat;
3601 mbuf_freem(nd->nd_mrep);
3606 * NFS byte range lock rpc.
3607 * (Mostly just calls one of the three lower level RPC routines.)
3610 nfsrpc_advlock(vnode_t vp, off_t size, int op, struct flock *fl,
3611 int reclaim, struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3613 struct nfscllockowner *lp;
3614 struct nfsclclient *clp;
3616 struct nfsrv_descript nfsd, *nd = &nfsd;
3617 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3620 u_int32_t clidrev = 0;
3621 int error = 0, newone = 0, expireret = 0, retrycnt, donelocally;
3625 * Convert the flock structure into a start and end and do POSIX
3628 switch (fl->l_whence) {
3632 * Caller is responsible for adding any necessary offset
3633 * when SEEK_CUR is used.
3635 start = fl->l_start;
3639 start = size + fl->l_start;
3640 off = size + fl->l_start;
3647 if (fl->l_len != 0) {
3648 end = start + fl->l_len - 1;
3659 if (op == F_GETLK) {
3660 error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3663 error = nfscl_lockt(vp, clp, off, len, fl, p, id, flags);
3665 clidrev = clp->nfsc_clientidrev;
3666 error = nfsrpc_lockt(nd, vp, clp, off, len, fl, cred,
3668 } else if (error == -1) {
3671 nfscl_clientrelease(clp);
3672 } else if (op == F_UNLCK && fl->l_type == F_UNLCK) {
3674 * We must loop around for all lockowner cases.
3677 error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3681 error = nfscl_relbytelock(vp, off, len, cred, p, callcnt,
3682 clp, id, flags, &lp, &dorpc);
3684 * If it returns a NULL lp, we're done.
3688 nfscl_clientrelease(clp);
3690 nfscl_releasealllocks(clp, vp, p, id, flags);
3693 if (nmp->nm_clp != NULL)
3694 clidrev = nmp->nm_clp->nfsc_clientidrev;
3698 * If the server doesn't support Posix lock semantics,
3699 * only allow locks on the entire file, since it won't
3700 * handle overlapping byte ranges.
3701 * There might still be a problem when a lock
3702 * upgrade/downgrade (read<->write) occurs, since the
3703 * server "might" expect an unlock first?
3705 if (dorpc && (lp->nfsl_open->nfso_posixlock ||
3706 (off == 0 && len == NFS64BITSSET))) {
3708 * Since the lock records will go away, we must
3709 * wait for grace and delay here.
3712 error = nfsrpc_locku(nd, nmp, lp, off, len,
3713 NFSV4LOCKT_READ, cred, p, 0);
3714 if ((nd->nd_repstat == NFSERR_GRACE ||
3715 nd->nd_repstat == NFSERR_DELAY) &&
3717 (void) nfs_catnap(PZERO, (int)nd->nd_repstat,
3719 } while ((nd->nd_repstat == NFSERR_GRACE ||
3720 nd->nd_repstat == NFSERR_DELAY) && error == 0);
3723 } while (error == 0 && nd->nd_repstat == 0);
3724 nfscl_releasealllocks(clp, vp, p, id, flags);
3725 } else if (op == F_SETLK) {
3726 error = nfscl_getbytelock(vp, off, len, fl->l_type, cred, p,
3727 NULL, 0, id, flags, NULL, NULL, &lp, &newone, &donelocally);
3728 if (error || donelocally) {
3731 if (nmp->nm_clp != NULL)
3732 clidrev = nmp->nm_clp->nfsc_clientidrev;
3735 nfhp = VTONFS(vp)->n_fhp;
3736 if (!lp->nfsl_open->nfso_posixlock &&
3737 (off != 0 || len != NFS64BITSSET)) {
3740 error = nfsrpc_lock(nd, nmp, vp, nfhp->nfh_fh,
3741 nfhp->nfh_len, lp, newone, reclaim, off,
3742 len, fl->l_type, cred, p, 0);
3745 error = nd->nd_repstat;
3746 nfscl_lockrelease(lp, error, newone);
3751 error = nd->nd_repstat;
3752 if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
3753 error == NFSERR_STALEDONTRECOVER ||
3754 error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3755 error == NFSERR_BADSESSION) {
3756 (void) nfs_catnap(PZERO, error, "nfs_advlock");
3757 } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
3759 expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
3762 } while (error == NFSERR_GRACE ||
3763 error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3764 error == NFSERR_STALEDONTRECOVER || error == NFSERR_STALESTATEID ||
3765 error == NFSERR_BADSESSION ||
3766 ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
3767 expireret == 0 && clidrev != 0 && retrycnt < 4));
3768 if (error && retrycnt >= 4)
3774 * The lower level routine for the LockT case.
3777 nfsrpc_lockt(struct nfsrv_descript *nd, vnode_t vp,
3778 struct nfsclclient *clp, u_int64_t off, u_int64_t len, struct flock *fl,
3779 struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3782 int error, type, size;
3783 uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
3785 struct nfsmount *nmp;
3787 nmp = VFSTONFS(vp->v_mount);
3788 NFSCL_REQSTART(nd, NFSPROC_LOCKT, vp);
3789 NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
3790 if (fl->l_type == F_RDLCK)
3791 *tl++ = txdr_unsigned(NFSV4LOCKT_READ);
3793 *tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
3794 txdr_hyper(off, tl);
3796 txdr_hyper(len, tl);
3798 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
3799 *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
3800 nfscl_filllockowner(id, own, flags);
3802 NFSBCOPY(np->n_fhp->nfh_fh, &own[NFSV4CL_LOCKNAMELEN],
3803 np->n_fhp->nfh_len);
3804 (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + np->n_fhp->nfh_len);
3805 error = nfscl_request(nd, vp, p, cred, NULL);
3808 if (nd->nd_repstat == 0) {
3809 fl->l_type = F_UNLCK;
3810 } else if (nd->nd_repstat == NFSERR_DENIED) {
3812 fl->l_whence = SEEK_SET;
3813 NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
3814 fl->l_start = fxdr_hyper(tl);
3816 len = fxdr_hyper(tl);
3818 if (len == NFS64BITSSET)
3822 type = fxdr_unsigned(int, *tl++);
3823 if (type == NFSV4LOCKT_WRITE)
3824 fl->l_type = F_WRLCK;
3826 fl->l_type = F_RDLCK;
3828 * XXX For now, I have no idea what to do with the
3829 * conflicting lock_owner, so I'll just set the pid == 0
3830 * and skip over the lock_owner.
3832 fl->l_pid = (pid_t)0;
3834 size = fxdr_unsigned(int, *tl);
3835 if (size < 0 || size > NFSV4_OPAQUELIMIT)
3838 error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
3839 } else if (nd->nd_repstat == NFSERR_STALECLIENTID ||
3840 nd->nd_repstat == NFSERR_BADSESSION)
3841 nfscl_initiate_recovery(clp);
3843 mbuf_freem(nd->nd_mrep);
3848 * Lower level function that performs the LockU RPC.
3851 nfsrpc_locku(struct nfsrv_descript *nd, struct nfsmount *nmp,
3852 struct nfscllockowner *lp, u_int64_t off, u_int64_t len,
3853 u_int32_t type, struct ucred *cred, NFSPROC_T *p, int syscred)
3858 nfscl_reqstart(nd, NFSPROC_LOCKU, nmp, lp->nfsl_open->nfso_fh,
3859 lp->nfsl_open->nfso_fhlen, NULL, NULL);
3860 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 6 * NFSX_UNSIGNED);
3861 *tl++ = txdr_unsigned(type);
3862 *tl = txdr_unsigned(lp->nfsl_seqid);
3863 if (nfstest_outofseq &&
3864 (arc4random() % nfstest_outofseq) == 0)
3865 *tl = txdr_unsigned(lp->nfsl_seqid + 1);
3867 if (NFSHASNFSV4N(nmp))
3870 *tl++ = lp->nfsl_stateid.seqid;
3871 *tl++ = lp->nfsl_stateid.other[0];
3872 *tl++ = lp->nfsl_stateid.other[1];
3873 *tl++ = lp->nfsl_stateid.other[2];
3874 txdr_hyper(off, tl);
3876 txdr_hyper(len, tl);
3878 nd->nd_flag |= ND_USEGSSNAME;
3879 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
3880 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
3881 NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
3884 if (nd->nd_repstat == 0) {
3885 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
3886 lp->nfsl_stateid.seqid = *tl++;
3887 lp->nfsl_stateid.other[0] = *tl++;
3888 lp->nfsl_stateid.other[1] = *tl++;
3889 lp->nfsl_stateid.other[2] = *tl;
3890 } else if (nd->nd_repstat == NFSERR_STALESTATEID ||
3891 nd->nd_repstat == NFSERR_BADSESSION)
3892 nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
3894 mbuf_freem(nd->nd_mrep);
3899 * The actual Lock RPC.
3902 nfsrpc_lock(struct nfsrv_descript *nd, struct nfsmount *nmp, vnode_t vp,
3903 u_int8_t *nfhp, int fhlen, struct nfscllockowner *lp, int newone,
3904 int reclaim, u_int64_t off, u_int64_t len, short type, struct ucred *cred,
3905 NFSPROC_T *p, int syscred)
3909 uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
3911 nfscl_reqstart(nd, NFSPROC_LOCK, nmp, nfhp, fhlen, NULL, NULL);
3912 NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
3913 if (type == F_RDLCK)
3914 *tl++ = txdr_unsigned(NFSV4LOCKT_READ);
3916 *tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
3917 *tl++ = txdr_unsigned(reclaim);
3918 txdr_hyper(off, tl);
3920 txdr_hyper(len, tl);
3924 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
3925 2 * NFSX_UNSIGNED + NFSX_HYPER);
3926 *tl++ = txdr_unsigned(lp->nfsl_open->nfso_own->nfsow_seqid);
3927 if (NFSHASNFSV4N(nmp))
3930 *tl++ = lp->nfsl_open->nfso_stateid.seqid;
3931 *tl++ = lp->nfsl_open->nfso_stateid.other[0];
3932 *tl++ = lp->nfsl_open->nfso_stateid.other[1];
3933 *tl++ = lp->nfsl_open->nfso_stateid.other[2];
3934 *tl++ = txdr_unsigned(lp->nfsl_seqid);
3935 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
3936 *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
3937 NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
3938 NFSBCOPY(nfhp, &own[NFSV4CL_LOCKNAMELEN], fhlen);
3939 (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
3942 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + NFSX_UNSIGNED);
3943 if (NFSHASNFSV4N(nmp))
3946 *tl++ = lp->nfsl_stateid.seqid;
3947 *tl++ = lp->nfsl_stateid.other[0];
3948 *tl++ = lp->nfsl_stateid.other[1];
3949 *tl++ = lp->nfsl_stateid.other[2];
3950 *tl = txdr_unsigned(lp->nfsl_seqid);
3951 if (nfstest_outofseq &&
3952 (arc4random() % nfstest_outofseq) == 0)
3953 *tl = txdr_unsigned(lp->nfsl_seqid + 1);
3956 nd->nd_flag |= ND_USEGSSNAME;
3957 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
3958 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
3962 NFSCL_INCRSEQID(lp->nfsl_open->nfso_own->nfsow_seqid, nd);
3963 NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
3964 if (nd->nd_repstat == 0) {
3965 NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
3966 lp->nfsl_stateid.seqid = *tl++;
3967 lp->nfsl_stateid.other[0] = *tl++;
3968 lp->nfsl_stateid.other[1] = *tl++;
3969 lp->nfsl_stateid.other[2] = *tl;
3970 } else if (nd->nd_repstat == NFSERR_DENIED) {
3971 NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
3972 size = fxdr_unsigned(int, *(tl + 7));
3973 if (size < 0 || size > NFSV4_OPAQUELIMIT)
3976 error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
3977 } else if (nd->nd_repstat == NFSERR_STALESTATEID ||
3978 nd->nd_repstat == NFSERR_BADSESSION)
3979 nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
3981 mbuf_freem(nd->nd_mrep);
3987 * (always called with the vp for the mount point)
3990 nfsrpc_statfs(vnode_t vp, struct nfsstatfs *sbp, struct nfsfsinfo *fsp,
3991 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
3994 u_int32_t *tl = NULL;
3995 struct nfsrv_descript nfsd, *nd = &nfsd;
3996 struct nfsmount *nmp;
3997 nfsattrbit_t attrbits;
4001 nmp = VFSTONFS(vnode_mount(vp));
4002 if (NFSHASNFSV4(nmp)) {
4004 * For V4, you actually do a getattr.
4006 NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4007 NFSSTATFS_GETATTRBIT(&attrbits);
4008 (void) nfsrv_putattrbit(nd, &attrbits);
4009 nd->nd_flag |= ND_USEGSSNAME;
4010 error = nfscl_request(nd, vp, p, cred, stuff);
4013 if (nd->nd_repstat == 0) {
4014 error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4015 NULL, NULL, sbp, fsp, NULL, 0, NULL, NULL, NULL, p,
4018 nmp->nm_fsid[0] = nap->na_filesid[0];
4019 nmp->nm_fsid[1] = nap->na_filesid[1];
4020 NFSSETHASSETFSID(nmp);
4024 error = nd->nd_repstat;
4029 NFSCL_REQSTART(nd, NFSPROC_FSSTAT, vp);
4030 error = nfscl_request(nd, vp, p, cred, stuff);
4033 if (nd->nd_flag & ND_NFSV3) {
4034 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4038 if (nd->nd_repstat) {
4039 error = nd->nd_repstat;
4042 NFSM_DISSECT(tl, u_int32_t *,
4043 NFSX_STATFS(nd->nd_flag & ND_NFSV3));
4045 if (NFSHASNFSV3(nmp)) {
4046 sbp->sf_tbytes = fxdr_hyper(tl); tl += 2;
4047 sbp->sf_fbytes = fxdr_hyper(tl); tl += 2;
4048 sbp->sf_abytes = fxdr_hyper(tl); tl += 2;
4049 sbp->sf_tfiles = fxdr_hyper(tl); tl += 2;
4050 sbp->sf_ffiles = fxdr_hyper(tl); tl += 2;
4051 sbp->sf_afiles = fxdr_hyper(tl); tl += 2;
4052 sbp->sf_invarsec = fxdr_unsigned(u_int32_t, *tl);
4053 } else if (NFSHASNFSV4(nmp) == 0) {
4054 sbp->sf_tsize = fxdr_unsigned(u_int32_t, *tl++);
4055 sbp->sf_bsize = fxdr_unsigned(u_int32_t, *tl++);
4056 sbp->sf_blocks = fxdr_unsigned(u_int32_t, *tl++);
4057 sbp->sf_bfree = fxdr_unsigned(u_int32_t, *tl++);
4058 sbp->sf_bavail = fxdr_unsigned(u_int32_t, *tl);
4061 mbuf_freem(nd->nd_mrep);
4069 nfsrpc_pathconf(vnode_t vp, struct nfsv3_pathconf *pc,
4070 struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
4073 struct nfsrv_descript nfsd, *nd = &nfsd;
4074 struct nfsmount *nmp;
4076 nfsattrbit_t attrbits;
4080 nmp = VFSTONFS(vnode_mount(vp));
4081 if (NFSHASNFSV4(nmp)) {
4083 * For V4, you actually do a getattr.
4085 NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4086 NFSPATHCONF_GETATTRBIT(&attrbits);
4087 (void) nfsrv_putattrbit(nd, &attrbits);
4088 nd->nd_flag |= ND_USEGSSNAME;
4089 error = nfscl_request(nd, vp, p, cred, stuff);
4092 if (nd->nd_repstat == 0) {
4093 error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4094 pc, NULL, NULL, NULL, NULL, 0, NULL, NULL, NULL, p,
4099 error = nd->nd_repstat;
4102 NFSCL_REQSTART(nd, NFSPROC_PATHCONF, vp);
4103 error = nfscl_request(nd, vp, p, cred, stuff);
4106 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4107 if (nd->nd_repstat && !error)
4108 error = nd->nd_repstat;
4110 NFSM_DISSECT(tl, u_int32_t *, NFSX_V3PATHCONF);
4111 pc->pc_linkmax = fxdr_unsigned(u_int32_t, *tl++);
4112 pc->pc_namemax = fxdr_unsigned(u_int32_t, *tl++);
4113 pc->pc_notrunc = fxdr_unsigned(u_int32_t, *tl++);
4114 pc->pc_chownrestricted =
4115 fxdr_unsigned(u_int32_t, *tl++);
4116 pc->pc_caseinsensitive =
4117 fxdr_unsigned(u_int32_t, *tl++);
4118 pc->pc_casepreserving = fxdr_unsigned(u_int32_t, *tl);
4122 mbuf_freem(nd->nd_mrep);
4127 * nfs version 3 fsinfo rpc call
4130 nfsrpc_fsinfo(vnode_t vp, struct nfsfsinfo *fsp, struct ucred *cred,
4131 NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
4134 struct nfsrv_descript nfsd, *nd = &nfsd;
4138 NFSCL_REQSTART(nd, NFSPROC_FSINFO, vp);
4139 error = nfscl_request(nd, vp, p, cred, stuff);
4142 error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4143 if (nd->nd_repstat && !error)
4144 error = nd->nd_repstat;
4146 NFSM_DISSECT(tl, u_int32_t *, NFSX_V3FSINFO);
4147 fsp->fs_rtmax = fxdr_unsigned(u_int32_t, *tl++);
4148 fsp->fs_rtpref = fxdr_unsigned(u_int32_t, *tl++);
4149 fsp->fs_rtmult = fxdr_unsigned(u_int32_t, *tl++);
4150 fsp->fs_wtmax = fxdr_unsigned(u_int32_t, *tl++);
4151 fsp->fs_wtpref = fxdr_unsigned(u_int32_t, *tl++);
4152 fsp->fs_wtmult = fxdr_unsigned(u_int32_t, *tl++);
4153 fsp->fs_dtpref = fxdr_unsigned(u_int32_t, *tl++);
4154 fsp->fs_maxfilesize = fxdr_hyper(tl);
4156 fxdr_nfsv3time(tl, &fsp->fs_timedelta);
4158 fsp->fs_properties = fxdr_unsigned(u_int32_t, *tl);
4161 mbuf_freem(nd->nd_mrep);
4166 * This function performs the Renew RPC.
4169 nfsrpc_renew(struct nfsclclient *clp, struct nfsclds *dsp, struct ucred *cred,
4173 struct nfsrv_descript nfsd;
4174 struct nfsrv_descript *nd = &nfsd;
4175 struct nfsmount *nmp;
4177 struct nfssockreq *nrp;
4179 nmp = clp->nfsc_nmp;
4182 nfscl_reqstart(nd, NFSPROC_RENEW, nmp, NULL, 0, NULL,
4183 &dsp->nfsclds_sess);
4184 if (!NFSHASNFSV4N(nmp)) {
4185 /* NFSv4.1 just uses a Sequence Op and not a Renew. */
4186 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4187 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4188 *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4190 nrp = dsp->nfsclds_sockp;
4192 /* If NULL, use the MDS socket. */
4193 nrp = &nmp->nm_sockreq;
4194 nd->nd_flag |= ND_USEGSSNAME;
4195 error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4196 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
4199 error = nd->nd_repstat;
4200 mbuf_freem(nd->nd_mrep);
4205 * This function performs the Releaselockowner RPC.
4208 nfsrpc_rellockown(struct nfsmount *nmp, struct nfscllockowner *lp,
4209 uint8_t *fh, int fhlen, struct ucred *cred, NFSPROC_T *p)
4211 struct nfsrv_descript nfsd, *nd = &nfsd;
4214 uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
4216 if (NFSHASNFSV4N(nmp)) {
4217 /* For NFSv4.1, do a FreeStateID. */
4218 nfscl_reqstart(nd, NFSPROC_FREESTATEID, nmp, NULL, 0, NULL,
4220 nfsm_stateidtom(nd, &lp->nfsl_stateid, NFSSTATEID_PUTSTATEID);
4222 nfscl_reqstart(nd, NFSPROC_RELEASELCKOWN, nmp, NULL, 0, NULL,
4224 NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4225 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4226 *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4227 NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
4228 NFSBCOPY(fh, &own[NFSV4CL_LOCKNAMELEN], fhlen);
4229 (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
4231 nd->nd_flag |= ND_USEGSSNAME;
4232 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4233 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4236 error = nd->nd_repstat;
4237 mbuf_freem(nd->nd_mrep);
4242 * This function performs the Compound to get the mount pt FH.
4245 nfsrpc_getdirpath(struct nfsmount *nmp, u_char *dirpath, struct ucred *cred,
4249 struct nfsrv_descript nfsd;
4250 struct nfsrv_descript *nd = &nfsd;
4252 int error, cnt, len, setnil;
4255 nfscl_reqstart(nd, NFSPROC_PUTROOTFH, nmp, NULL, 0, &opcntp, NULL);
4263 while (*cp2 != '\0' && *cp2 != '/')
4270 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4271 *tl = txdr_unsigned(NFSV4OP_LOOKUP);
4272 nfsm_strtom(nd, cp, strlen(cp));
4278 } while (*cp != '\0');
4279 if (NFSHASNFSV4N(nmp))
4280 /* Has a Sequence Op done by nfscl_reqstart(). */
4281 *opcntp = txdr_unsigned(3 + cnt);
4283 *opcntp = txdr_unsigned(2 + cnt);
4284 NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4285 *tl = txdr_unsigned(NFSV4OP_GETFH);
4286 nd->nd_flag |= ND_USEGSSNAME;
4287 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4288 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4291 if (nd->nd_repstat == 0) {
4292 NFSM_DISSECT(tl, u_int32_t *, (3 + 2 * cnt) * NFSX_UNSIGNED);
4293 tl += (2 + 2 * cnt);
4294 if ((len = fxdr_unsigned(int, *tl)) <= 0 ||
4296 nd->nd_repstat = NFSERR_BADXDR;
4298 nd->nd_repstat = nfsrv_mtostr(nd, nmp->nm_fh, len);
4299 if (nd->nd_repstat == 0)
4300 nmp->nm_fhsize = len;
4303 error = nd->nd_repstat;
4305 mbuf_freem(nd->nd_mrep);
4310 * This function performs the Delegreturn RPC.
4313 nfsrpc_delegreturn(struct nfscldeleg *dp, struct ucred *cred,
4314 struct nfsmount *nmp, NFSPROC_T *p, int syscred)
4317 struct nfsrv_descript nfsd;
4318 struct nfsrv_descript *nd = &nfsd;
4321 nfscl_reqstart(nd, NFSPROC_DELEGRETURN, nmp, dp->nfsdl_fh,
4322 dp->nfsdl_fhlen, NULL, NULL);
4323 NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
4324 if (NFSHASNFSV4N(nmp))
4327 *tl++ = dp->nfsdl_stateid.seqid;
4328 *tl++ = dp->nfsdl_stateid.other[0];
4329 *tl++ = dp->nfsdl_stateid.other[1];
4330 *tl = dp->nfsdl_stateid.other[2];
4332 nd->nd_flag |= ND_USEGSSNAME;
4333 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4334 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4337 error = nd->nd_repstat;
4338 mbuf_freem(nd->nd_mrep);
4346 nfsrpc_getacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4347 struct acl *aclp, void *stuff)
4349 struct nfsrv_descript nfsd, *nd = &nfsd;
4351 nfsattrbit_t attrbits;
4352 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4354 if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4355 return (EOPNOTSUPP);
4356 NFSCL_REQSTART(nd, NFSPROC_GETACL, vp);
4357 NFSZERO_ATTRBIT(&attrbits);
4358 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4359 (void) nfsrv_putattrbit(nd, &attrbits);
4360 error = nfscl_request(nd, vp, p, cred, stuff);
4363 if (!nd->nd_repstat)
4364 error = nfsv4_loadattr(nd, vp, NULL, NULL, NULL, 0, NULL,
4365 NULL, NULL, NULL, aclp, 0, NULL, NULL, NULL, p, cred);
4367 error = nd->nd_repstat;
4368 mbuf_freem(nd->nd_mrep);
4376 nfsrpc_setacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4377 struct acl *aclp, void *stuff)
4380 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4382 if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4383 return (EOPNOTSUPP);
4384 error = nfsrpc_setattr(vp, NULL, aclp, cred, p, NULL, NULL, stuff);
4392 nfsrpc_setaclrpc(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4393 struct acl *aclp, nfsv4stateid_t *stateidp, void *stuff)
4395 struct nfsrv_descript nfsd, *nd = &nfsd;
4397 nfsattrbit_t attrbits;
4398 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4400 if (!NFSHASNFSV4(nmp))
4401 return (EOPNOTSUPP);
4402 NFSCL_REQSTART(nd, NFSPROC_SETACL, vp);
4403 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
4404 NFSZERO_ATTRBIT(&attrbits);
4405 NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4406 (void) nfsv4_fillattr(nd, vnode_mount(vp), vp, aclp, NULL, NULL, 0,
4407 &attrbits, NULL, NULL, 0, 0, 0, 0, (uint64_t)0);
4408 error = nfscl_request(nd, vp, p, cred, stuff);
4411 /* Don't care about the pre/postop attributes */
4412 mbuf_freem(nd->nd_mrep);
4413 return (nd->nd_repstat);
4417 * Do the NFSv4.1 Exchange ID.
4420 nfsrpc_exchangeid(struct nfsmount *nmp, struct nfsclclient *clp,
4421 struct nfssockreq *nrp, uint32_t exchflags, struct nfsclds **dspp,
4422 struct ucred *cred, NFSPROC_T *p)
4424 uint32_t *tl, v41flags;
4425 struct nfsrv_descript nfsd;
4426 struct nfsrv_descript *nd = &nfsd;
4427 struct nfsclds *dsp;
4428 struct timespec verstime;
4432 nfscl_reqstart(nd, NFSPROC_EXCHANGEID, nmp, NULL, 0, NULL, NULL);
4433 NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4434 *tl++ = txdr_unsigned(nfsboottime.tv_sec); /* Client owner */
4435 *tl = txdr_unsigned(clp->nfsc_rev);
4436 (void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
4438 NFSM_BUILD(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4439 *tl++ = txdr_unsigned(exchflags);
4440 *tl++ = txdr_unsigned(NFSV4EXCH_SP4NONE);
4442 /* Set the implementation id4 */
4443 *tl = txdr_unsigned(1);
4444 (void) nfsm_strtom(nd, "freebsd.org", strlen("freebsd.org"));
4445 (void) nfsm_strtom(nd, version, strlen(version));
4446 NFSM_BUILD(tl, uint32_t *, NFSX_V4TIME);
4447 verstime.tv_sec = 1293840000; /* Jan 1, 2011 */
4448 verstime.tv_nsec = 0;
4449 txdr_nfsv4time(&verstime, tl);
4450 nd->nd_flag |= ND_USEGSSNAME;
4451 error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4452 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4453 NFSCL_DEBUG(1, "exchangeid err=%d reps=%d\n", error,
4454 (int)nd->nd_repstat);
4457 if (nd->nd_repstat == 0) {
4458 NFSM_DISSECT(tl, uint32_t *, 6 * NFSX_UNSIGNED + NFSX_HYPER);
4459 len = fxdr_unsigned(int, *(tl + 7));
4460 if (len < 0 || len > NFSV4_OPAQUELIMIT) {
4461 error = NFSERR_BADXDR;
4464 dsp = malloc(sizeof(struct nfsclds) + len, M_NFSCLDS,
4466 dsp->nfsclds_expire = NFSD_MONOSEC + clp->nfsc_renew;
4467 dsp->nfsclds_servownlen = len;
4468 dsp->nfsclds_sess.nfsess_clientid.lval[0] = *tl++;
4469 dsp->nfsclds_sess.nfsess_clientid.lval[1] = *tl++;
4470 dsp->nfsclds_sess.nfsess_sequenceid =
4471 fxdr_unsigned(uint32_t, *tl++);
4472 v41flags = fxdr_unsigned(uint32_t, *tl);
4473 if ((v41flags & NFSV4EXCH_USEPNFSMDS) != 0 &&
4474 NFSHASPNFSOPT(nmp)) {
4475 NFSCL_DEBUG(1, "set PNFS\n");
4477 nmp->nm_state |= NFSSTA_PNFS;
4479 dsp->nfsclds_flags |= NFSCLDS_MDS;
4481 if ((v41flags & NFSV4EXCH_USEPNFSDS) != 0)
4482 dsp->nfsclds_flags |= NFSCLDS_DS;
4484 nd->nd_repstat = nfsrv_mtostr(nd,
4485 dsp->nfsclds_serverown, len);
4486 if (nd->nd_repstat == 0) {
4487 mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
4488 mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession",
4490 nfscl_initsessionslots(&dsp->nfsclds_sess);
4493 free(dsp, M_NFSCLDS);
4495 error = nd->nd_repstat;
4497 mbuf_freem(nd->nd_mrep);
4502 * Do the NFSv4.1 Create Session.
4505 nfsrpc_createsession(struct nfsmount *nmp, struct nfsclsession *sep,
4506 struct nfssockreq *nrp, uint32_t sequenceid, int mds, struct ucred *cred,
4509 uint32_t crflags, *tl;
4510 struct nfsrv_descript nfsd;
4511 struct nfsrv_descript *nd = &nfsd;
4514 nfscl_reqstart(nd, NFSPROC_CREATESESSION, nmp, NULL, 0, NULL, NULL);
4515 NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
4516 *tl++ = sep->nfsess_clientid.lval[0];
4517 *tl++ = sep->nfsess_clientid.lval[1];
4518 *tl++ = txdr_unsigned(sequenceid);
4519 crflags = (NFSMNT_RDONLY(nmp->nm_mountp) ? 0 : NFSV4CRSESS_PERSIST);
4520 if (nfscl_enablecallb != 0 && nfs_numnfscbd > 0)
4521 crflags |= NFSV4CRSESS_CONNBACKCHAN;
4522 *tl = txdr_unsigned(crflags);
4524 /* Fill in fore channel attributes. */
4525 NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4526 *tl++ = 0; /* Header pad size */
4527 *tl++ = txdr_unsigned(100000); /* Max request size */
4528 *tl++ = txdr_unsigned(100000); /* Max response size */
4529 *tl++ = txdr_unsigned(4096); /* Max response size cached */
4530 *tl++ = txdr_unsigned(20); /* Max operations */
4531 *tl++ = txdr_unsigned(64); /* Max slots */
4532 *tl = 0; /* No rdma ird */
4534 /* Fill in back channel attributes. */
4535 NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4536 *tl++ = 0; /* Header pad size */
4537 *tl++ = txdr_unsigned(10000); /* Max request size */
4538 *tl++ = txdr_unsigned(10000); /* Max response size */
4539 *tl++ = txdr_unsigned(4096); /* Max response size cached */
4540 *tl++ = txdr_unsigned(4); /* Max operations */
4541 *tl++ = txdr_unsigned(NFSV4_CBSLOTS); /* Max slots */
4542 *tl = 0; /* No rdma ird */
4544 NFSM_BUILD(tl, uint32_t *, 8 * NFSX_UNSIGNED);
4545 *tl++ = txdr_unsigned(NFS_CALLBCKPROG); /* Call back prog # */
4547 /* Allow AUTH_SYS callbacks as uid, gid == 0. */
4548 *tl++ = txdr_unsigned(1); /* Auth_sys only */
4549 *tl++ = txdr_unsigned(AUTH_SYS); /* AUTH_SYS type */
4550 *tl++ = txdr_unsigned(nfsboottime.tv_sec); /* time stamp */
4551 *tl++ = 0; /* Null machine name */
4552 *tl++ = 0; /* Uid == 0 */
4553 *tl++ = 0; /* Gid == 0 */
4554 *tl = 0; /* No additional gids */
4555 nd->nd_flag |= ND_USEGSSNAME;
4556 error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred, NFS_PROG,
4557 NFS_VER4, NULL, 1, NULL, NULL);
4560 if (nd->nd_repstat == 0) {
4561 NFSM_DISSECT(tl, uint32_t *, NFSX_V4SESSIONID +
4563 bcopy(tl, sep->nfsess_sessionid, NFSX_V4SESSIONID);
4564 tl += NFSX_V4SESSIONID / NFSX_UNSIGNED;
4565 sep->nfsess_sequenceid = fxdr_unsigned(uint32_t, *tl++);
4566 crflags = fxdr_unsigned(uint32_t, *tl);
4567 if ((crflags & NFSV4CRSESS_PERSIST) != 0 && mds != 0) {
4569 nmp->nm_state |= NFSSTA_SESSPERSIST;
4573 /* Get the fore channel slot count. */
4574 NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4575 tl += 3; /* Skip the other counts. */
4576 sep->nfsess_maxcache = fxdr_unsigned(int, *tl++);
4578 sep->nfsess_foreslots = fxdr_unsigned(uint16_t, *tl++);
4579 NFSCL_DEBUG(4, "fore slots=%d\n", (int)sep->nfsess_foreslots);
4580 irdcnt = fxdr_unsigned(int, *tl);
4582 NFSM_DISSECT(tl, uint32_t *, irdcnt * NFSX_UNSIGNED);
4584 /* and the back channel slot count. */
4585 NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4587 sep->nfsess_backslots = fxdr_unsigned(uint16_t, *tl);
4588 NFSCL_DEBUG(4, "back slots=%d\n", (int)sep->nfsess_backslots);
4590 error = nd->nd_repstat;
4592 mbuf_freem(nd->nd_mrep);
4597 * Do the NFSv4.1 Destroy Session.
4600 nfsrpc_destroysession(struct nfsmount *nmp, struct nfsclclient *clp,
4601 struct ucred *cred, NFSPROC_T *p)
4604 struct nfsrv_descript nfsd;
4605 struct nfsrv_descript *nd = &nfsd;
4608 nfscl_reqstart(nd, NFSPROC_DESTROYSESSION, nmp, NULL, 0, NULL, NULL);
4609 NFSM_BUILD(tl, uint32_t *, NFSX_V4SESSIONID);
4610 bcopy(NFSMNT_MDSSESSION(nmp)->nfsess_sessionid, tl, NFSX_V4SESSIONID);
4611 nd->nd_flag |= ND_USEGSSNAME;
4612 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4613 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4616 error = nd->nd_repstat;
4617 mbuf_freem(nd->nd_mrep);
4622 * Do the NFSv4.1 Destroy Client.
4625 nfsrpc_destroyclient(struct nfsmount *nmp, struct nfsclclient *clp,
4626 struct ucred *cred, NFSPROC_T *p)
4629 struct nfsrv_descript nfsd;
4630 struct nfsrv_descript *nd = &nfsd;
4633 nfscl_reqstart(nd, NFSPROC_DESTROYCLIENT, nmp, NULL, 0, NULL, NULL);
4634 NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4635 *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4636 *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4637 nd->nd_flag |= ND_USEGSSNAME;
4638 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4639 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4642 error = nd->nd_repstat;
4643 mbuf_freem(nd->nd_mrep);
4648 * Do the NFSv4.1 LayoutGet.
4651 nfsrpc_layoutget(struct nfsmount *nmp, uint8_t *fhp, int fhlen, int iomode,
4652 uint64_t offset, uint64_t len, uint64_t minlen, int layoutlen,
4653 nfsv4stateid_t *stateidp, int *retonclosep, struct nfsclflayouthead *flhp,
4654 struct ucred *cred, NFSPROC_T *p, void *stuff)
4657 struct nfsrv_descript nfsd, *nd = &nfsd;
4659 struct nfsclflayout *flp, *prevflp, *tflp;
4660 int cnt, error, gotiomode, fhcnt, nfhlen, i, j;
4666 nfscl_reqstart(nd, NFSPROC_LAYOUTGET, nmp, fhp, fhlen, NULL, NULL);
4667 NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
4669 *tl++ = newnfs_false; /* Don't signal availability. */
4670 *tl++ = txdr_unsigned(NFSLAYOUT_NFSV4_1_FILES);
4671 *tl++ = txdr_unsigned(iomode);
4672 txdr_hyper(offset, tl);
4674 txdr_hyper(len, tl);
4676 txdr_hyper(minlen, tl);
4678 *tl++ = txdr_unsigned(stateidp->seqid);
4679 NFSCL_DEBUG(4, "layget seq=%d\n", (int)stateidp->seqid);
4680 *tl++ = stateidp->other[0];
4681 *tl++ = stateidp->other[1];
4682 *tl++ = stateidp->other[2];
4683 *tl = txdr_unsigned(layoutlen);
4684 nd->nd_flag |= ND_USEGSSNAME;
4685 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4686 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4689 if (nd->nd_repstat == 0) {
4690 NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_STATEID);
4695 stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
4696 NFSCL_DEBUG(4, "retoncls=%d stseq=%d\n", *retonclosep,
4697 (int)stateidp->seqid);
4698 stateidp->other[0] = *tl++;
4699 stateidp->other[1] = *tl++;
4700 stateidp->other[2] = *tl++;
4701 cnt = fxdr_unsigned(int, *tl);
4702 NFSCL_DEBUG(4, "layg cnt=%d\n", cnt);
4703 if (cnt <= 0 || cnt > 10000) {
4704 /* Don't accept more than 10000 layouts in reply. */
4705 error = NFSERR_BADXDR;
4708 for (i = 0; i < cnt; i++) {
4709 /* Dissect all the way to the file handle cnt. */
4710 NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_HYPER +
4711 6 * NFSX_UNSIGNED + NFSX_V4DEVICEID);
4712 fhcnt = fxdr_unsigned(int, *(tl + 11 +
4713 NFSX_V4DEVICEID / NFSX_UNSIGNED));
4714 NFSCL_DEBUG(4, "fhcnt=%d\n", fhcnt);
4715 if (fhcnt < 0 || fhcnt > 100) {
4716 /* Don't accept more than 100 file handles. */
4717 error = NFSERR_BADXDR;
4721 flp = malloc(sizeof(*flp) + (fhcnt - 1) *
4722 sizeof(struct nfsfh *),
4723 M_NFSFLAYOUT, M_WAITOK);
4725 flp = malloc(sizeof(*flp),
4726 M_NFSFLAYOUT, M_WAITOK);
4727 flp->nfsfl_flags = 0;
4728 flp->nfsfl_fhcnt = 0;
4729 flp->nfsfl_devp = NULL;
4730 flp->nfsfl_off = fxdr_hyper(tl); tl += 2;
4731 retlen = fxdr_hyper(tl); tl += 2;
4732 if (flp->nfsfl_off + retlen < flp->nfsfl_off)
4733 flp->nfsfl_end = UINT64_MAX - flp->nfsfl_off;
4735 flp->nfsfl_end = flp->nfsfl_off + retlen;
4736 flp->nfsfl_iomode = fxdr_unsigned(int, *tl++);
4737 if (gotiomode == -1)
4738 gotiomode = flp->nfsfl_iomode;
4739 NFSCL_DEBUG(4, "layg reqiom=%d retiom=%d\n", iomode,
4740 (int)flp->nfsfl_iomode);
4741 if (fxdr_unsigned(int, *tl++) !=
4742 NFSLAYOUT_NFSV4_1_FILES) {
4743 printf("NFSv4.1: got non-files layout\n");
4744 error = NFSERR_BADXDR;
4747 NFSBCOPY(++tl, flp->nfsfl_dev, NFSX_V4DEVICEID);
4748 tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4749 flp->nfsfl_util = fxdr_unsigned(uint32_t, *tl++);
4750 NFSCL_DEBUG(4, "flutil=0x%x\n", flp->nfsfl_util);
4751 flp->nfsfl_stripe1 = fxdr_unsigned(uint32_t, *tl++);
4752 flp->nfsfl_patoff = fxdr_hyper(tl); tl += 2;
4753 if (fxdr_unsigned(int, *tl) != fhcnt) {
4754 printf("EEK! bad fhcnt\n");
4755 error = NFSERR_BADXDR;
4758 for (j = 0; j < fhcnt; j++) {
4759 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4760 nfhlen = fxdr_unsigned(int, *tl);
4761 if (nfhlen <= 0 || nfhlen > NFSX_V4FHMAX) {
4762 error = NFSERR_BADXDR;
4765 nfhp = malloc(sizeof(*nfhp) + nfhlen - 1,
4767 flp->nfsfl_fh[j] = nfhp;
4769 nfhp->nfh_len = nfhlen;
4770 NFSM_DISSECT(cp, uint8_t *, NFSM_RNDUP(nfhlen));
4771 NFSBCOPY(cp, nfhp->nfh_fh, nfhlen);
4773 if (flp->nfsfl_iomode == gotiomode) {
4774 /* Keep the list in increasing offset order. */
4775 tflp = LIST_FIRST(flhp);
4777 while (tflp != NULL &&
4778 tflp->nfsfl_off < flp->nfsfl_off) {
4780 tflp = LIST_NEXT(tflp, nfsfl_list);
4782 if (prevflp == NULL)
4783 LIST_INSERT_HEAD(flhp, flp, nfsfl_list);
4785 LIST_INSERT_AFTER(prevflp, flp,
4788 printf("nfscl_layoutget(): got wrong iomode\n");
4789 nfscl_freeflayout(flp);
4794 if (nd->nd_repstat != 0 && error == 0)
4795 error = nd->nd_repstat;
4797 if (error != 0 && flp != NULL)
4798 nfscl_freeflayout(flp);
4799 mbuf_freem(nd->nd_mrep);
4804 * Do the NFSv4.1 Get Device Info.
4807 nfsrpc_getdeviceinfo(struct nfsmount *nmp, uint8_t *deviceid, int layouttype,
4808 uint32_t *notifybitsp, struct nfscldevinfo **ndip, struct ucred *cred,
4812 struct nfsrv_descript nfsd;
4813 struct nfsrv_descript *nd = &nfsd;
4814 struct sockaddr_storage ss;
4815 struct nfsclds *dsp = NULL, **dspp;
4816 struct nfscldevinfo *ndi;
4817 int addrcnt, bitcnt, error, i, isudp, j, pos, safilled, stripecnt;
4818 uint8_t stripeindex;
4822 nfscl_reqstart(nd, NFSPROC_GETDEVICEINFO, nmp, NULL, 0, NULL, NULL);
4823 NFSM_BUILD(tl, uint32_t *, NFSX_V4DEVICEID + 3 * NFSX_UNSIGNED);
4824 NFSBCOPY(deviceid, tl, NFSX_V4DEVICEID);
4825 tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4826 *tl++ = txdr_unsigned(layouttype);
4827 *tl++ = txdr_unsigned(100000);
4828 if (notifybitsp != NULL && *notifybitsp != 0) {
4829 *tl = txdr_unsigned(1); /* One word of bits. */
4830 NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
4831 *tl = txdr_unsigned(*notifybitsp);
4833 *tl = txdr_unsigned(0);
4834 nd->nd_flag |= ND_USEGSSNAME;
4835 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4836 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4839 if (nd->nd_repstat == 0) {
4840 NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4841 if (layouttype != fxdr_unsigned(int, *tl++))
4842 printf("EEK! devinfo layout type not same!\n");
4843 stripecnt = fxdr_unsigned(int, *++tl);
4844 NFSCL_DEBUG(4, "stripecnt=%d\n", stripecnt);
4845 if (stripecnt < 1 || stripecnt > 4096) {
4846 printf("NFS devinfo stripecnt %d: out of range\n",
4848 error = NFSERR_BADXDR;
4851 NFSM_DISSECT(tl, uint32_t *, (stripecnt + 1) * NFSX_UNSIGNED);
4852 addrcnt = fxdr_unsigned(int, *(tl + stripecnt));
4853 NFSCL_DEBUG(4, "addrcnt=%d\n", addrcnt);
4854 if (addrcnt < 1 || addrcnt > 128) {
4855 printf("NFS devinfo addrcnt %d: out of range\n",
4857 error = NFSERR_BADXDR;
4862 * Now we know how many stripe indices and addresses, so
4863 * we can allocate the structure the correct size.
4865 i = (stripecnt * sizeof(uint8_t)) / sizeof(struct nfsclds *)
4867 NFSCL_DEBUG(4, "stripeindices=%d\n", i);
4868 ndi = malloc(sizeof(*ndi) + (addrcnt + i) *
4869 sizeof(struct nfsclds *), M_NFSDEVINFO, M_WAITOK | M_ZERO);
4870 NFSBCOPY(deviceid, ndi->nfsdi_deviceid, NFSX_V4DEVICEID);
4871 ndi->nfsdi_refcnt = 0;
4872 ndi->nfsdi_stripecnt = stripecnt;
4873 ndi->nfsdi_addrcnt = addrcnt;
4874 /* Fill in the stripe indices. */
4875 for (i = 0; i < stripecnt; i++) {
4876 stripeindex = fxdr_unsigned(uint8_t, *tl++);
4877 NFSCL_DEBUG(4, "stripeind=%d\n", stripeindex);
4878 if (stripeindex >= addrcnt) {
4879 printf("NFS devinfo stripeindex %d: too big\n",
4881 error = NFSERR_BADXDR;
4884 nfsfldi_setstripeindex(ndi, i, stripeindex);
4887 /* Now, dissect the server address(es). */
4889 for (i = 0; i < addrcnt; i++) {
4890 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4891 cnt = fxdr_unsigned(uint32_t, *tl);
4893 printf("NFS devinfo 0 len addrlist\n");
4894 error = NFSERR_BADXDR;
4897 dspp = nfsfldi_addr(ndi, i);
4898 pos = arc4random() % cnt; /* Choose one. */
4900 for (j = 0; j < cnt; j++) {
4901 error = nfsv4_getipaddr(nd, &ss, &isudp);
4902 if (error != 0 && error != EPERM) {
4903 error = NFSERR_BADXDR;
4906 if (error == 0 && isudp == 0) {
4909 * - use "pos" entry if it is of the
4910 * same af_family or none of them
4911 * is of the same af_family
4913 * - use the first one of the same
4916 if ((safilled == 0 && ss.ss_family ==
4917 nmp->nm_nam->sa_family) ||
4919 (safilled == 0 || ss.ss_family ==
4920 nmp->nm_nam->sa_family)) ||
4921 (safilled == 1 && ss.ss_family ==
4922 nmp->nm_nam->sa_family)) {
4923 error = nfsrpc_fillsa(nmp, &ss,
4928 nmp->nm_nam->sa_family)
4940 /* And the notify bits. */
4941 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4942 if (safilled != 0) {
4943 bitcnt = fxdr_unsigned(int, *tl);
4945 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4946 if (notifybitsp != NULL)
4948 fxdr_unsigned(uint32_t, *tl);
4954 if (nd->nd_repstat != 0)
4955 error = nd->nd_repstat;
4957 if (error != 0 && ndi != NULL)
4958 nfscl_freedevinfo(ndi);
4959 mbuf_freem(nd->nd_mrep);
4964 * Do the NFSv4.1 LayoutCommit.
4967 nfsrpc_layoutcommit(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
4968 uint64_t off, uint64_t len, uint64_t lastbyte, nfsv4stateid_t *stateidp,
4969 int layouttype, int layoutupdatecnt, uint8_t *layp, struct ucred *cred,
4970 NFSPROC_T *p, void *stuff)
4973 struct nfsrv_descript nfsd, *nd = &nfsd;
4974 int error, outcnt, i;
4977 nfscl_reqstart(nd, NFSPROC_LAYOUTCOMMIT, nmp, fh, fhlen, NULL, NULL);
4978 NFSM_BUILD(tl, uint32_t *, 5 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
4980 txdr_hyper(off, tl);
4982 txdr_hyper(len, tl);
4985 *tl++ = newnfs_true;
4987 *tl++ = newnfs_false;
4988 *tl++ = txdr_unsigned(stateidp->seqid);
4989 *tl++ = stateidp->other[0];
4990 *tl++ = stateidp->other[1];
4991 *tl++ = stateidp->other[2];
4992 *tl++ = newnfs_true;
4995 else if (lastbyte >= (off + len))
4996 lastbyte = off + len - 1;
4997 txdr_hyper(lastbyte, tl);
4999 *tl++ = newnfs_false;
5000 *tl++ = txdr_unsigned(layouttype);
5001 *tl = txdr_unsigned(layoutupdatecnt);
5002 if (layoutupdatecnt > 0) {
5003 KASSERT(layouttype != NFSLAYOUT_NFSV4_1_FILES,
5004 ("Must be nil for Files Layout"));
5005 outcnt = NFSM_RNDUP(layoutupdatecnt);
5006 NFSM_BUILD(cp, uint8_t *, outcnt);
5007 NFSBCOPY(layp, cp, layoutupdatecnt);
5008 cp += layoutupdatecnt;
5009 for (i = 0; i < (outcnt - layoutupdatecnt); i++)
5012 nd->nd_flag |= ND_USEGSSNAME;
5013 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5014 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5017 error = nd->nd_repstat;
5018 mbuf_freem(nd->nd_mrep);
5023 * Do the NFSv4.1 LayoutReturn.
5026 nfsrpc_layoutreturn(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
5027 int layouttype, uint32_t iomode, int layoutreturn, uint64_t offset,
5028 uint64_t len, nfsv4stateid_t *stateidp, int layoutcnt, uint32_t *layp,
5029 struct ucred *cred, NFSPROC_T *p, void *stuff)
5032 struct nfsrv_descript nfsd, *nd = &nfsd;
5033 int error, outcnt, i;
5036 nfscl_reqstart(nd, NFSPROC_LAYOUTRETURN, nmp, fh, fhlen, NULL, NULL);
5037 NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
5039 *tl++ = newnfs_true;
5041 *tl++ = newnfs_false;
5042 *tl++ = txdr_unsigned(layouttype);
5043 *tl++ = txdr_unsigned(iomode);
5044 *tl = txdr_unsigned(layoutreturn);
5045 if (layoutreturn == NFSLAYOUTRETURN_FILE) {
5046 NFSM_BUILD(tl, uint32_t *, 2 * NFSX_HYPER + NFSX_STATEID +
5048 txdr_hyper(offset, tl);
5050 txdr_hyper(len, tl);
5052 NFSCL_DEBUG(4, "layoutret stseq=%d\n", (int)stateidp->seqid);
5053 *tl++ = txdr_unsigned(stateidp->seqid);
5054 *tl++ = stateidp->other[0];
5055 *tl++ = stateidp->other[1];
5056 *tl++ = stateidp->other[2];
5057 *tl = txdr_unsigned(layoutcnt);
5058 if (layoutcnt > 0) {
5059 outcnt = NFSM_RNDUP(layoutcnt);
5060 NFSM_BUILD(cp, uint8_t *, outcnt);
5061 NFSBCOPY(layp, cp, layoutcnt);
5063 for (i = 0; i < (outcnt - layoutcnt); i++)
5067 nd->nd_flag |= ND_USEGSSNAME;
5068 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5069 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5072 if (nd->nd_repstat == 0) {
5073 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5075 NFSM_DISSECT(tl, uint32_t *, NFSX_STATEID);
5076 stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
5077 stateidp->other[0] = *tl++;
5078 stateidp->other[1] = *tl++;
5079 stateidp->other[2] = *tl;
5082 error = nd->nd_repstat;
5084 mbuf_freem(nd->nd_mrep);
5089 * Acquire a layout and devinfo, if possible. The caller must have acquired
5090 * a reference count on the nfsclclient structure before calling this.
5091 * Return the layout in lypp with a reference count on it, if successful.
5094 nfsrpc_getlayout(struct nfsmount *nmp, vnode_t vp, struct nfsfh *nfhp,
5095 int iomode, uint32_t *notifybitsp, nfsv4stateid_t *stateidp, uint64_t off,
5096 struct nfscllayout **lypp, struct ucred *cred, NFSPROC_T *p)
5098 struct nfscllayout *lyp;
5099 struct nfsclflayout *flp, *tflp;
5100 struct nfscldevinfo *dip;
5101 struct nfsclflayouthead flh;
5102 int error = 0, islocked, layoutlen, recalled, retonclose;
5103 nfsv4stateid_t stateid;
5107 * If lyp is returned non-NULL, there will be a refcnt (shared lock)
5108 * on it, iff flp != NULL or a lock (exclusive lock) on it iff
5111 lyp = nfscl_getlayout(nmp->nm_clp, nfhp->nfh_fh, nfhp->nfh_len,
5112 off, &flp, &recalled);
5114 if (lyp == NULL || flp == NULL) {
5118 layoutlen = NFSMNT_MDSSESSION(nmp)->nfsess_maxcache -
5119 (NFSX_STATEID + 3 * NFSX_UNSIGNED);
5122 stateid.other[0] = stateidp->other[0];
5123 stateid.other[1] = stateidp->other[1];
5124 stateid.other[2] = stateidp->other[2];
5125 error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5126 nfhp->nfh_len, iomode, (uint64_t)0, INT64_MAX,
5127 (uint64_t)0, layoutlen, &stateid, &retonclose,
5128 &flh, cred, p, NULL);
5131 stateid.seqid = lyp->nfsly_stateid.seqid;
5132 stateid.other[0] = lyp->nfsly_stateid.other[0];
5133 stateid.other[1] = lyp->nfsly_stateid.other[1];
5134 stateid.other[2] = lyp->nfsly_stateid.other[2];
5135 error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5136 nfhp->nfh_len, iomode, off, INT64_MAX,
5137 (uint64_t)0, layoutlen, &stateid, &retonclose,
5138 &flh, cred, p, NULL);
5141 LIST_FOREACH(tflp, &flh, nfsfl_list) {
5142 error = nfscl_adddevinfo(nmp, NULL, tflp);
5144 error = nfsrpc_getdeviceinfo(nmp,
5146 NFSLAYOUT_NFSV4_1_FILES,
5147 notifybitsp, &dip, cred, p);
5150 error = nfscl_adddevinfo(nmp, dip,
5154 "getlayout: cannot add\n");
5159 * nfscl_layout() always returns with the nfsly_lock
5160 * set to a refcnt (shared lock).
5162 error = nfscl_layout(nmp, vp, nfhp->nfh_fh,
5163 nfhp->nfh_len, &stateid, retonclose, &flh, &lyp,
5167 } else if (islocked != 0)
5168 nfsv4_unlock(&lyp->nfsly_lock, 0);
5175 * Do a TCP connection plus exchange id and create session.
5176 * If successful, a "struct nfsclds" is linked into the list for the
5177 * mount point and a pointer to it is returned.
5180 nfsrpc_fillsa(struct nfsmount *nmp, struct sockaddr_storage *ssp,
5181 struct nfsclds **dspp, NFSPROC_T *p)
5183 struct sockaddr_in *msad, *sad, *ssd;
5184 struct sockaddr_in6 *msad6, *sad6, *ssd6;
5185 struct nfsclclient *clp;
5186 struct nfssockreq *nrp;
5187 struct nfsclds *dsp, *tdsp;
5189 enum nfsclds_state retv;
5190 uint32_t sequenceid;
5192 KASSERT(nmp->nm_sockreq.nr_cred != NULL,
5193 ("nfsrpc_fillsa: NULL nr_cred"));
5199 if (ssp->ss_family == AF_INET) {
5200 ssd = (struct sockaddr_in *)ssp;
5204 * Check to see if we already have a session for this
5205 * address that is usable for a DS.
5206 * Note that the MDS's address is in a different place
5207 * than the sessions already acquired for DS's.
5209 msad = (struct sockaddr_in *)nmp->nm_sockreq.nr_nam;
5210 tdsp = TAILQ_FIRST(&nmp->nm_sess);
5211 while (tdsp != NULL) {
5212 if (msad != NULL && msad->sin_family == AF_INET &&
5213 ssd->sin_addr.s_addr == msad->sin_addr.s_addr &&
5214 ssd->sin_port == msad->sin_port &&
5215 (tdsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5218 NFSCL_DEBUG(4, "fnd same addr\n");
5221 tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5222 if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5223 msad = (struct sockaddr_in *)
5224 tdsp->nfsclds_sockp->nr_nam;
5230 /* No IP address match, so look for new/trunked one. */
5231 sad = malloc(sizeof(*sad), M_SONAME, M_WAITOK | M_ZERO);
5232 sad->sin_len = sizeof(*sad);
5233 sad->sin_family = AF_INET;
5234 sad->sin_port = ssd->sin_port;
5235 sad->sin_addr.s_addr = ssd->sin_addr.s_addr;
5236 nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5237 nrp->nr_nam = (struct sockaddr *)sad;
5238 } else if (ssp->ss_family == AF_INET6) {
5239 ssd6 = (struct sockaddr_in6 *)ssp;
5243 * Check to see if we already have a session for this
5244 * address that is usable for a DS.
5245 * Note that the MDS's address is in a different place
5246 * than the sessions already acquired for DS's.
5248 msad6 = (struct sockaddr_in6 *)nmp->nm_sockreq.nr_nam;
5249 tdsp = TAILQ_FIRST(&nmp->nm_sess);
5250 while (tdsp != NULL) {
5251 if (msad6 != NULL && msad6->sin6_family == AF_INET6 &&
5252 IN6_ARE_ADDR_EQUAL(&ssd6->sin6_addr,
5253 &msad6->sin6_addr) &&
5254 ssd6->sin6_port == msad6->sin6_port &&
5255 (tdsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5260 tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5261 if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5262 msad6 = (struct sockaddr_in6 *)
5263 tdsp->nfsclds_sockp->nr_nam;
5269 /* No IP address match, so look for new/trunked one. */
5270 sad6 = malloc(sizeof(*sad6), M_SONAME, M_WAITOK | M_ZERO);
5271 sad6->sin6_len = sizeof(*sad6);
5272 sad6->sin6_family = AF_INET6;
5273 sad6->sin6_port = ssd6->sin6_port;
5274 NFSBCOPY(&ssd6->sin6_addr, &sad6->sin6_addr,
5275 sizeof(struct in6_addr));
5276 nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5277 nrp->nr_nam = (struct sockaddr *)sad6;
5281 nrp->nr_sotype = SOCK_STREAM;
5282 mtx_init(&nrp->nr_mtx, "nfssock", NULL, MTX_DEF);
5283 nrp->nr_prog = NFS_PROG;
5284 nrp->nr_vers = NFS_VER4;
5287 * Use the credentials that were used for the mount, which are
5288 * in nmp->nm_sockreq.nr_cred for newnfs_connect() etc.
5289 * Ref. counting the credentials with crhold() is probably not
5290 * necessary, since nm_sockreq.nr_cred won't be crfree()'d until
5291 * unmount, but I did it anyhow.
5293 nrp->nr_cred = crhold(nmp->nm_sockreq.nr_cred);
5294 error = newnfs_connect(nmp, nrp, NULL, p, 0);
5295 NFSCL_DEBUG(3, "DS connect=%d\n", error);
5297 /* Now, do the exchangeid and create session. */
5299 error = nfsrpc_exchangeid(nmp, clp, nrp, NFSV4EXCH_USEPNFSDS,
5300 &dsp, nrp->nr_cred, p);
5301 NFSCL_DEBUG(3, "DS exchangeid=%d\n", error);
5303 dsp->nfsclds_sockp = nrp;
5305 retv = nfscl_getsameserver(nmp, dsp, &tdsp);
5306 NFSCL_DEBUG(3, "getsame ret=%d\n", retv);
5307 if (retv == NFSDSP_USETHISSESSION) {
5310 * If there is already a session for this server,
5313 (void)newnfs_disconnect(nrp);
5314 nfscl_freenfsclds(dsp);
5318 if (retv == NFSDSP_SEQTHISSESSION)
5319 sequenceid = tdsp->nfsclds_sess.nfsess_sequenceid;
5321 sequenceid = dsp->nfsclds_sess.nfsess_sequenceid;
5323 error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
5324 nrp, sequenceid, 0, nrp->nr_cred, p);
5325 NFSCL_DEBUG(3, "DS createsess=%d\n", error);
5327 NFSFREECRED(nrp->nr_cred);
5328 NFSFREEMUTEX(&nrp->nr_mtx);
5329 free(nrp->nr_nam, M_SONAME);
5330 free(nrp, M_NFSSOCKREQ);
5333 NFSCL_DEBUG(3, "add DS session\n");
5335 * Put it at the end of the list. That way the list
5336 * is ordered by when the entry was added. This matters
5337 * since the one done first is the one that should be
5338 * used for sequencid'ing any subsequent create sessions.
5341 TAILQ_INSERT_TAIL(&nmp->nm_sess, dsp, nfsclds_list);
5344 } else if (dsp != NULL)
5345 nfscl_freenfsclds(dsp);
5350 * Do the NFSv4.1 Reclaim Complete.
5353 nfsrpc_reclaimcomplete(struct nfsmount *nmp, struct ucred *cred, NFSPROC_T *p)
5356 struct nfsrv_descript nfsd;
5357 struct nfsrv_descript *nd = &nfsd;
5360 nfscl_reqstart(nd, NFSPROC_RECLAIMCOMPL, nmp, NULL, 0, NULL, NULL);
5361 NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
5363 nd->nd_flag |= ND_USEGSSNAME;
5364 error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5365 NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5368 error = nd->nd_repstat;
5369 mbuf_freem(nd->nd_mrep);
5374 * Initialize the slot tables for a session.
5377 nfscl_initsessionslots(struct nfsclsession *sep)
5381 for (i = 0; i < NFSV4_CBSLOTS; i++) {
5382 if (sep->nfsess_cbslots[i].nfssl_reply != NULL)
5383 m_freem(sep->nfsess_cbslots[i].nfssl_reply);
5384 NFSBZERO(&sep->nfsess_cbslots[i], sizeof(struct nfsslot));
5386 for (i = 0; i < 64; i++)
5387 sep->nfsess_slotseq[i] = 0;
5388 sep->nfsess_slots = 0;
5392 * Called to try and do an I/O operation via an NFSv4.1 Data Server (DS).
5395 nfscl_doiods(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5396 uint32_t rwaccess, struct ucred *cred, NFSPROC_T *p)
5398 struct nfsnode *np = VTONFS(vp);
5399 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5400 struct nfscllayout *layp;
5401 struct nfscldevinfo *dip;
5402 struct nfsclflayout *rflp;
5403 nfsv4stateid_t stateid;
5404 struct ucred *newcred;
5405 uint64_t lastbyte, len, off, oresid, xfer;
5406 int eof, error, iolaymode, recalled;
5409 if (!NFSHASPNFS(nmp) || nfscl_enablecallb == 0 || nfs_numnfscbd == 0 ||
5410 (np->n_flag & NNOLAYOUT) != 0)
5412 /* Now, get a reference cnt on the clientid for this mount. */
5413 if (nfscl_getref(nmp) == 0)
5416 /* Find an appropriate stateid. */
5417 newcred = NFSNEWCRED(cred);
5418 error = nfscl_getstateid(vp, np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
5419 rwaccess, 1, newcred, p, &stateid, &lckp);
5421 NFSFREECRED(newcred);
5425 /* Search for a layout for this file. */
5426 off = uiop->uio_offset;
5427 layp = nfscl_getlayout(nmp->nm_clp, np->n_fhp->nfh_fh,
5428 np->n_fhp->nfh_len, off, &rflp, &recalled);
5429 if (layp == NULL || rflp == NULL) {
5430 if (recalled != 0) {
5431 NFSFREECRED(newcred);
5436 nfscl_rellayout(layp, (rflp == NULL) ? 1 : 0);
5439 /* Try and get a Layout, if it is supported. */
5440 if (rwaccess == NFSV4OPEN_ACCESSWRITE ||
5441 (np->n_flag & NWRITEOPENED) != 0)
5442 iolaymode = NFSLAYOUTIOMODE_RW;
5444 iolaymode = NFSLAYOUTIOMODE_READ;
5445 error = nfsrpc_getlayout(nmp, vp, np->n_fhp, iolaymode,
5446 NULL, &stateid, off, &layp, newcred, p);
5449 np->n_flag |= NNOLAYOUT;
5452 nfscl_lockderef(lckp);
5453 NFSFREECRED(newcred);
5455 nfscl_rellayout(layp, 0);
5462 * Loop around finding a layout that works for the first part of
5463 * this I/O operation, and then call the function that actually
5467 len = (uint64_t)uiop->uio_resid;
5468 while (len > 0 && error == 0 && eof == 0) {
5469 off = uiop->uio_offset;
5470 error = nfscl_findlayoutforio(layp, off, rwaccess, &rflp);
5472 oresid = xfer = (uint64_t)uiop->uio_resid;
5473 if (xfer > (rflp->nfsfl_end - rflp->nfsfl_off))
5474 xfer = rflp->nfsfl_end - rflp->nfsfl_off;
5475 dip = nfscl_getdevinfo(nmp->nm_clp, rflp->nfsfl_dev,
5478 error = nfscl_doflayoutio(vp, uiop, iomode,
5479 must_commit, &eof, &stateid, rwaccess, dip,
5480 layp, rflp, off, xfer, newcred, p);
5481 nfscl_reldevinfo(dip);
5482 lastbyte = off + xfer - 1;
5485 if (lastbyte > layp->nfsly_lastbyte)
5486 layp->nfsly_lastbyte = lastbyte;
5492 len -= (oresid - (uint64_t)uiop->uio_resid);
5496 nfscl_lockderef(lckp);
5497 NFSFREECRED(newcred);
5498 nfscl_rellayout(layp, 0);
5504 * Find a file layout that will handle the first bytes of the requested
5505 * range and return the information from it needed to to the I/O operation.
5508 nfscl_findlayoutforio(struct nfscllayout *lyp, uint64_t off, uint32_t rwaccess,
5509 struct nfsclflayout **retflpp)
5511 struct nfsclflayout *flp, *nflp, *rflp;
5516 /* For reading, do the Read list first and then the Write list. */
5518 if (rw == NFSV4OPEN_ACCESSREAD)
5519 flp = LIST_FIRST(&lyp->nfsly_flayread);
5521 flp = LIST_FIRST(&lyp->nfsly_flayrw);
5522 while (flp != NULL) {
5523 nflp = LIST_NEXT(flp, nfsfl_list);
5524 if (flp->nfsfl_off > off)
5526 if (flp->nfsfl_end > off &&
5527 (rflp == NULL || rflp->nfsfl_end < flp->nfsfl_end))
5531 if (rw == NFSV4OPEN_ACCESSREAD)
5532 rw = NFSV4OPEN_ACCESSWRITE;
5537 /* This one covers the most bytes starting at off. */
5545 * Do I/O using an NFSv4.1 file layout.
5548 nfscl_doflayoutio(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5549 int *eofp, nfsv4stateid_t *stateidp, int rwflag, struct nfscldevinfo *dp,
5550 struct nfscllayout *lyp, struct nfsclflayout *flp, uint64_t off,
5551 uint64_t len, struct ucred *cred, NFSPROC_T *p)
5553 uint64_t io_off, rel_off, stripe_unit_size, transfer, xfer;
5554 int commit_thru_mds, error = 0, stripe_index, stripe_pos;
5557 struct nfsclds **dspp;
5560 rel_off = off - flp->nfsfl_patoff;
5561 stripe_unit_size = (flp->nfsfl_util >> 6) & 0x3ffffff;
5562 stripe_pos = (rel_off / stripe_unit_size + flp->nfsfl_stripe1) %
5563 dp->nfsdi_stripecnt;
5564 transfer = stripe_unit_size - (rel_off % stripe_unit_size);
5566 /* Loop around, doing I/O for each stripe unit. */
5567 while (len > 0 && error == 0) {
5568 stripe_index = nfsfldi_stripeindex(dp, stripe_pos);
5569 dspp = nfsfldi_addr(dp, stripe_index);
5574 if ((flp->nfsfl_util & NFSFLAYUTIL_DENSE) != 0) {
5576 if (stripe_pos >= flp->nfsfl_fhcnt)
5578 fhp = flp->nfsfl_fh[stripe_pos];
5579 io_off = (rel_off / (stripe_unit_size *
5580 dp->nfsdi_stripecnt)) * stripe_unit_size +
5581 rel_off % stripe_unit_size;
5583 /* Sparse layout. */
5584 if (flp->nfsfl_fhcnt > 1) {
5585 if (stripe_index >= flp->nfsfl_fhcnt)
5587 fhp = flp->nfsfl_fh[stripe_index];
5588 } else if (flp->nfsfl_fhcnt == 1)
5589 fhp = flp->nfsfl_fh[0];
5594 if ((flp->nfsfl_util & NFSFLAYUTIL_COMMIT_THRU_MDS) != 0)
5595 commit_thru_mds = 1;
5597 commit_thru_mds = 0;
5598 if (rwflag == FREAD)
5599 error = nfsrpc_readds(vp, uiop, stateidp, eofp, *dspp,
5600 io_off, xfer, fhp, cred, p);
5602 error = nfsrpc_writeds(vp, uiop, iomode, must_commit,
5603 stateidp, *dspp, io_off, xfer, fhp, commit_thru_mds,
5607 lyp->nfsly_flags |= NFSLY_WRITTEN;
5612 transfer = stripe_unit_size;
5613 stripe_pos = (stripe_pos + 1) % dp->nfsdi_stripecnt;
5622 * The actual read RPC done to a DS.
5625 nfsrpc_readds(vnode_t vp, struct uio *uiop, nfsv4stateid_t *stateidp, int *eofp,
5626 struct nfsclds *dsp, uint64_t io_off, int len, struct nfsfh *fhp,
5627 struct ucred *cred, NFSPROC_T *p)
5631 struct nfsrv_descript nfsd;
5632 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5633 struct nfsrv_descript *nd = &nfsd;
5634 struct nfssockreq *nrp;
5637 nfscl_reqstart(nd, NFSPROC_READDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5638 NULL, &dsp->nfsclds_sess);
5639 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
5640 NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED * 3);
5641 txdr_hyper(io_off, tl);
5642 *(tl + 2) = txdr_unsigned(len);
5643 nrp = dsp->nfsclds_sockp;
5645 /* If NULL, use the MDS socket. */
5646 nrp = &nmp->nm_sockreq;
5647 error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5648 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5651 if (nd->nd_repstat != 0) {
5652 error = nd->nd_repstat;
5655 NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5656 *eofp = fxdr_unsigned(int, *tl);
5657 NFSM_STRSIZ(retlen, len);
5658 error = nfsm_mbufuio(nd, uiop, retlen);
5660 if (nd->nd_mrep != NULL)
5661 mbuf_freem(nd->nd_mrep);
5666 * The actual write RPC done to a DS.
5669 nfsrpc_writeds(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5670 nfsv4stateid_t *stateidp, struct nfsclds *dsp, uint64_t io_off, int len,
5671 struct nfsfh *fhp, int commit_thru_mds, struct ucred *cred, NFSPROC_T *p)
5674 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5675 int error, rlen, commit, committed = NFSWRITE_FILESYNC;
5677 struct nfsrv_descript nfsd;
5678 struct nfsrv_descript *nd = &nfsd;
5679 struct nfssockreq *nrp;
5681 KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
5683 nfscl_reqstart(nd, NFSPROC_WRITEDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5684 NULL, &dsp->nfsclds_sess);
5685 nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
5686 NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + 2 * NFSX_UNSIGNED);
5687 txdr_hyper(io_off, tl);
5689 *tl++ = txdr_unsigned(*iomode);
5690 *tl = txdr_unsigned(len);
5691 nfsm_uiombuf(nd, uiop, len);
5692 nrp = dsp->nfsclds_sockp;
5694 /* If NULL, use the MDS socket. */
5695 nrp = &nmp->nm_sockreq;
5696 error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5697 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5700 if (nd->nd_repstat != 0) {
5702 * In case the rpc gets retried, roll
5703 * the uio fileds changed by nfsm_uiombuf()
5706 uiop->uio_offset -= len;
5707 uio_uio_resid_add(uiop, len);
5708 uio_iov_base_add(uiop, -len);
5709 uio_iov_len_add(uiop, len);
5710 error = nd->nd_repstat;
5712 NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_VERF);
5713 rlen = fxdr_unsigned(int, *tl++);
5717 } else if (rlen < len) {
5718 backup = len - rlen;
5719 uio_iov_base_add(uiop, -(backup));
5720 uio_iov_len_add(uiop, backup);
5721 uiop->uio_offset -= backup;
5722 uio_uio_resid_add(uiop, backup);
5725 commit = fxdr_unsigned(int, *tl++);
5728 * Return the lowest committment level
5729 * obtained by any of the RPCs.
5731 if (committed == NFSWRITE_FILESYNC)
5733 else if (committed == NFSWRITE_DATASYNC &&
5734 commit == NFSWRITE_UNSTABLE)
5736 if (commit_thru_mds != 0) {
5738 if (!NFSHASWRITEVERF(nmp)) {
5739 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5740 NFSSETWRITEVERF(nmp);
5741 } else if (NFSBCMP(tl, nmp->nm_verf, NFSX_VERF)) {
5743 NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5748 if ((dsp->nfsclds_flags & NFSCLDS_HASWRITEVERF) == 0) {
5749 NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5750 dsp->nfsclds_flags |= NFSCLDS_HASWRITEVERF;
5751 } else if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
5753 NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5759 if (nd->nd_mrep != NULL)
5760 mbuf_freem(nd->nd_mrep);
5761 *iomode = committed;
5762 if (nd->nd_repstat != 0 && error == 0)
5763 error = nd->nd_repstat;
5768 * Free up the nfsclds structure.
5771 nfscl_freenfsclds(struct nfsclds *dsp)
5777 if (dsp->nfsclds_sockp != NULL) {
5778 NFSFREECRED(dsp->nfsclds_sockp->nr_cred);
5779 NFSFREEMUTEX(&dsp->nfsclds_sockp->nr_mtx);
5780 free(dsp->nfsclds_sockp->nr_nam, M_SONAME);
5781 free(dsp->nfsclds_sockp, M_NFSSOCKREQ);
5783 NFSFREEMUTEX(&dsp->nfsclds_mtx);
5784 NFSFREEMUTEX(&dsp->nfsclds_sess.nfsess_mtx);
5785 for (i = 0; i < NFSV4_CBSLOTS; i++) {
5786 if (dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply != NULL)
5788 dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply);
5790 free(dsp, M_NFSCLDS);
5793 static enum nfsclds_state
5794 nfscl_getsameserver(struct nfsmount *nmp, struct nfsclds *newdsp,
5795 struct nfsclds **retdspp)
5797 struct nfsclds *dsp, *cur_dsp;
5800 * Search the list of nfsclds structures for one with the same
5804 TAILQ_FOREACH(dsp, &nmp->nm_sess, nfsclds_list) {
5805 if (dsp->nfsclds_servownlen == newdsp->nfsclds_servownlen &&
5806 dsp->nfsclds_servownlen != 0 &&
5807 !NFSBCMP(dsp->nfsclds_serverown, newdsp->nfsclds_serverown,
5808 dsp->nfsclds_servownlen)) {
5809 NFSCL_DEBUG(4, "fnd same fdsp=%p dsp=%p flg=0x%x\n",
5810 TAILQ_FIRST(&nmp->nm_sess), dsp,
5811 dsp->nfsclds_flags);
5812 /* Server major id matches. */
5813 if ((dsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5815 return (NFSDSP_USETHISSESSION);
5819 * Note the first match, so it can be used for
5820 * sequence'ing new sessions.
5822 if (cur_dsp == NULL)
5826 if (cur_dsp != NULL) {
5828 return (NFSDSP_SEQTHISSESSION);
5830 return (NFSDSP_NOTFOUND);
5835 * NFS commit rpc to a DS.
5838 nfsrpc_commitds(vnode_t vp, uint64_t offset, int cnt, struct nfsclds *dsp,
5839 struct nfsfh *fhp, struct ucred *cred, NFSPROC_T *p, void *stuff)
5842 struct nfsrv_descript nfsd, *nd = &nfsd;
5843 struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5844 struct nfssockreq *nrp;
5847 nfscl_reqstart(nd, NFSPROC_COMMITDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5848 NULL, &dsp->nfsclds_sess);
5849 NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + NFSX_UNSIGNED);
5850 txdr_hyper(offset, tl);
5852 *tl = txdr_unsigned(cnt);
5853 nrp = dsp->nfsclds_sockp;
5855 /* If NULL, use the MDS socket. */
5856 nrp = &nmp->nm_sockreq;
5857 error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5858 NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5861 if (nd->nd_repstat == 0) {
5862 NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
5864 if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
5865 NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5866 error = NFSERR_STALEWRITEVERF;
5871 if (error == 0 && nd->nd_repstat != 0)
5872 error = nd->nd_repstat;
5873 mbuf_freem(nd->nd_mrep);