nfs_clrpcops.c revision 265466
1/*-
2 * Copyright (c) 1989, 1993
3 *	The Regents of the University of California.  All rights reserved.
4 *
5 * This code is derived from software contributed to Berkeley by
6 * Rick Macklem at The University of Guelph.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 *    notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 *    notice, this list of conditions and the following disclaimer in the
15 *    documentation and/or other materials provided with the distribution.
16 * 4. Neither the name of the University nor the names of its contributors
17 *    may be used to endorse or promote products derived from this software
18 *    without specific prior written permission.
19 *
20 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30 * SUCH DAMAGE.
31 *
32 */
33
34#include <sys/cdefs.h>
35__FBSDID("$FreeBSD: stable/10/sys/fs/nfsclient/nfs_clrpcops.c 265466 2014-05-06 21:47:43Z rmacklem $");
36
37/*
38 * Rpc op calls, generally called from the vnode op calls or through the
39 * buffer cache, for NFS v2, 3 and 4.
40 * These do not normally make any changes to vnode arguments or use
41 * structures that might change between the VFS variants. The returned
42 * arguments are all at the end, after the NFSPROC_T *p one.
43 */
44
45#ifndef APPLEKEXT
46#include "opt_inet6.h"
47
48#include <fs/nfs/nfsport.h>
49
/*
 * Global variables
 *
 * The extern objects are defined in other files; the initialized ones
 * below are defined here.
 */
/* nfsrpc_setclient() only advertises a callback address when this is > 0. */
extern int nfs_numnfscbd;
/*
 * Set by nfsrpc_setclient() via NFSSETBOOTTIME() while tv_sec is still 0;
 * tv_sec is the first word put on the wire in the SetClientID request.
 */
extern struct timeval nfsboottime;
extern u_int32_t newnfs_false, newnfs_true;
extern nfstype nfsv34_type[9];
extern int nfsrv_useacl;
/*
 * When this string is non-empty, nfsrpc_setclient() uses it as the host
 * part of the callback address instead of calling nfscl_getmyip().
 */
extern char nfsv4_callbackaddr[INET6_ADDRSTRLEN];
extern int nfscl_debuglevel;
NFSCLSTATEMUTEX;
int nfstest_outofseq = 0;
/*
 * When non-zero, nfsrpc_openrpc() sets nfso_posixlock on every open,
 * whether or not the reply has NFSV4OPEN_LOCKTYPEPOSIX set.
 */
int nfscl_assumeposixlocks = 1;
/* Must be non-zero for nfsrpc_setclient() to advertise a callback address. */
int nfscl_enablecallb = 0;
/* Port encoded (via htons()) into the advertised callback address. */
short nfsv4_cbport = NFSV4_CBPORT;
int nfstest_openallsetattr = 0;
66#endif	/* !APPLEKEXT */
67
/*
 * Size of a struct dirent less (MAXNAMLEN + 1) bytes.
 * NOTE(review): presumably the fixed header that precedes d_name[] --
 * confirm against the struct dirent definition in use.
 */
#define	DIRHDSIZ	(sizeof (struct dirent) - (MAXNAMLEN + 1))
69
/*
 * Result of nfscl_getsameserver().  The enumerators rely on the default
 * numbering, i.e. 0, 1 and 2 in the order listed.
 */
enum nfsclds_state {
	/* Use this session for the DS. */
	NFSDSP_USETHISSESSION,
	/* Use the nfsclds_sequence field of this dsp for a new session. */
	NFSDSP_SEQTHISSESSION,
	/* No matching server was found. */
	NFSDSP_NOTFOUND
};
82
/*
 * Prototypes for the file-local (static) helper functions, so that they
 * can be called ahead of their definitions.
 */
static int nfsrpc_setattrrpc(vnode_t , struct vattr *, nfsv4stateid_t *,
    struct ucred *, NFSPROC_T *, struct nfsvattr *, int *, void *);
static int nfsrpc_readrpc(vnode_t , struct uio *, struct ucred *,
    nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *, void *);
static int nfsrpc_writerpc(vnode_t , struct uio *, int *, int *,
    struct ucred *, nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *,
    void *);
static int nfsrpc_createv23(vnode_t , char *, int, struct vattr *,
    nfsquad_t, int, struct ucred *, NFSPROC_T *, struct nfsvattr *,
    struct nfsvattr *, struct nfsfh **, int *, int *, void *);
static int nfsrpc_createv4(vnode_t , char *, int, struct vattr *,
    nfsquad_t, int, struct nfsclowner *, struct nfscldeleg **, struct ucred *,
    NFSPROC_T *, struct nfsvattr *, struct nfsvattr *, struct nfsfh **, int *,
    int *, void *, int *);
/* Used by nfsrpc_doclose() to release byte range locks before the close. */
static int nfsrpc_locku(struct nfsrv_descript *, struct nfsmount *,
    struct nfscllockowner *, u_int64_t, u_int64_t,
    u_int32_t, struct ucred *, NFSPROC_T *, int);
static int nfsrpc_setaclrpc(vnode_t, struct ucred *, NFSPROC_T *,
    struct acl *, nfsv4stateid_t *, void *);
static int nfsrpc_getlayout(struct nfsmount *, vnode_t, struct nfsfh *, int,
    uint32_t *, nfsv4stateid_t *, uint64_t, struct nfscllayout **,
    struct ucred *, NFSPROC_T *);
static int nfsrpc_fillsa(struct nfsmount *, struct sockaddr_storage *,
    struct nfsclds **, NFSPROC_T *);
static void nfscl_initsessionslots(struct nfsclsession *);
static int nfscl_doflayoutio(vnode_t, struct uio *, int *, int *, int *,
    nfsv4stateid_t *, int, struct nfscldevinfo *, struct nfscllayout *,
    struct nfsclflayout *, uint64_t, uint64_t, struct ucred *, NFSPROC_T *);
static int nfsrpc_readds(vnode_t, struct uio *, nfsv4stateid_t *, int *,
    struct nfsclds *, uint64_t, int, struct nfsfh *, struct ucred *,
    NFSPROC_T *);
static int nfsrpc_writeds(vnode_t, struct uio *, int *, int *,
    nfsv4stateid_t *, struct nfsclds *, uint64_t, int,
    struct nfsfh *, int, struct ucred *, NFSPROC_T *);
static enum nfsclds_state nfscl_getsameserver(struct nfsmount *,
    struct nfsclds *, struct nfsclds **);
/* Only declared when "notyet" is defined. */
#ifdef notyet
static int nfsrpc_commitds(vnode_t, uint64_t, int, struct nfsclds *,
    struct nfsfh *, struct ucred *, NFSPROC_T *, void *);
#endif
123
124/*
125 * nfs null call from vfs.
126 */
127APPLESTATIC int
128nfsrpc_null(vnode_t vp, struct ucred *cred, NFSPROC_T *p)
129{
130	int error;
131	struct nfsrv_descript nfsd, *nd = &nfsd;
132
133	NFSCL_REQSTART(nd, NFSPROC_NULL, vp);
134	error = nfscl_request(nd, vp, p, cred, NULL);
135	if (nd->nd_repstat && !error)
136		error = nd->nd_repstat;
137	mbuf_freem(nd->nd_mrep);
138	return (error);
139}
140
141/*
142 * nfs access rpc op.
143 * For nfs version 3 and 4, use the access rpc to check accessibility. If file
144 * modes are changed on the server, accesses might still fail later.
145 */
146APPLESTATIC int
147nfsrpc_access(vnode_t vp, int acmode, struct ucred *cred,
148    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp)
149{
150	int error;
151	u_int32_t mode, rmode;
152
153	if (acmode & VREAD)
154		mode = NFSACCESS_READ;
155	else
156		mode = 0;
157	if (vnode_vtype(vp) == VDIR) {
158		if (acmode & VWRITE)
159			mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND |
160				 NFSACCESS_DELETE);
161		if (acmode & VEXEC)
162			mode |= NFSACCESS_LOOKUP;
163	} else {
164		if (acmode & VWRITE)
165			mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND);
166		if (acmode & VEXEC)
167			mode |= NFSACCESS_EXECUTE;
168	}
169
170	/*
171	 * Now, just call nfsrpc_accessrpc() to do the actual RPC.
172	 */
173	error = nfsrpc_accessrpc(vp, mode, cred, p, nap, attrflagp, &rmode,
174	    NULL);
175
176	/*
177	 * The NFS V3 spec does not clarify whether or not
178	 * the returned access bits can be a superset of
179	 * the ones requested, so...
180	 */
181	if (!error && (rmode & mode) != mode)
182		error = EACCES;
183	return (error);
184}
185
186/*
187 * The actual rpc, separated out for Darwin.
188 */
189APPLESTATIC int
190nfsrpc_accessrpc(vnode_t vp, u_int32_t mode, struct ucred *cred,
191    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, u_int32_t *rmodep,
192    void *stuff)
193{
194	u_int32_t *tl;
195	u_int32_t supported, rmode;
196	int error;
197	struct nfsrv_descript nfsd, *nd = &nfsd;
198	nfsattrbit_t attrbits;
199
200	*attrflagp = 0;
201	supported = mode;
202	NFSCL_REQSTART(nd, NFSPROC_ACCESS, vp);
203	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
204	*tl = txdr_unsigned(mode);
205	if (nd->nd_flag & ND_NFSV4) {
206		/*
207		 * And do a Getattr op.
208		 */
209		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
210		*tl = txdr_unsigned(NFSV4OP_GETATTR);
211		NFSGETATTR_ATTRBIT(&attrbits);
212		(void) nfsrv_putattrbit(nd, &attrbits);
213	}
214	error = nfscl_request(nd, vp, p, cred, stuff);
215	if (error)
216		return (error);
217	if (nd->nd_flag & ND_NFSV3) {
218		error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
219		if (error)
220			goto nfsmout;
221	}
222	if (!nd->nd_repstat) {
223		if (nd->nd_flag & ND_NFSV4) {
224			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
225			supported = fxdr_unsigned(u_int32_t, *tl++);
226		} else {
227			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
228		}
229		rmode = fxdr_unsigned(u_int32_t, *tl);
230		if (nd->nd_flag & ND_NFSV4)
231			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
232
233		/*
234		 * It's not obvious what should be done about
235		 * unsupported access modes. For now, be paranoid
236		 * and clear the unsupported ones.
237		 */
238		rmode &= supported;
239		*rmodep = rmode;
240	} else
241		error = nd->nd_repstat;
242nfsmout:
243	mbuf_freem(nd->nd_mrep);
244	return (error);
245}
246
247/*
248 * nfs open rpc
249 */
250APPLESTATIC int
251nfsrpc_open(vnode_t vp, int amode, struct ucred *cred, NFSPROC_T *p)
252{
253	struct nfsclopen *op;
254	struct nfscldeleg *dp;
255	struct nfsfh *nfhp;
256	struct nfsnode *np = VTONFS(vp);
257	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
258	u_int32_t mode, clidrev;
259	int ret, newone, error, expireret = 0, retrycnt;
260
261	/*
262	 * For NFSv4, Open Ops are only done on Regular Files.
263	 */
264	if (vnode_vtype(vp) != VREG)
265		return (0);
266	mode = 0;
267	if (amode & FREAD)
268		mode |= NFSV4OPEN_ACCESSREAD;
269	if (amode & FWRITE)
270		mode |= NFSV4OPEN_ACCESSWRITE;
271	nfhp = np->n_fhp;
272
273	retrycnt = 0;
274#ifdef notdef
275{ char name[100]; int namel;
276namel = (np->n_v4->n4_namelen < 100) ? np->n_v4->n4_namelen : 99;
277bcopy(NFS4NODENAME(np->n_v4), name, namel);
278name[namel] = '\0';
279printf("rpcopen p=0x%x name=%s",p->p_pid,name);
280if (nfhp->nfh_len > 0) printf(" fh=0x%x\n",nfhp->nfh_fh[12]);
281else printf(" fhl=0\n");
282}
283#endif
284	do {
285	    dp = NULL;
286	    error = nfscl_open(vp, nfhp->nfh_fh, nfhp->nfh_len, mode, 1,
287		cred, p, NULL, &op, &newone, &ret, 1);
288	    if (error) {
289		return (error);
290	    }
291	    if (nmp->nm_clp != NULL)
292		clidrev = nmp->nm_clp->nfsc_clientidrev;
293	    else
294		clidrev = 0;
295	    if (ret == NFSCLOPEN_DOOPEN) {
296		if (np->n_v4 != NULL) {
297			error = nfsrpc_openrpc(nmp, vp, np->n_v4->n4_data,
298			   np->n_v4->n4_fhlen, np->n_fhp->nfh_fh,
299			   np->n_fhp->nfh_len, mode, op,
300			   NFS4NODENAME(np->n_v4), np->n_v4->n4_namelen, &dp,
301			   0, 0x0, cred, p, 0, 0);
302			if (dp != NULL) {
303#ifdef APPLE
304				OSBitAndAtomic((int32_t)~NDELEGMOD, (UInt32 *)&np->n_flag);
305#else
306				NFSLOCKNODE(np);
307				np->n_flag &= ~NDELEGMOD;
308				/*
309				 * Invalidate the attribute cache, so that
310				 * attributes that pre-date the issue of a
311				 * delegation are not cached, since the
312				 * cached attributes will remain valid while
313				 * the delegation is held.
314				 */
315				NFSINVALATTRCACHE(np);
316				NFSUNLOCKNODE(np);
317#endif
318				(void) nfscl_deleg(nmp->nm_mountp,
319				    op->nfso_own->nfsow_clp,
320				    nfhp->nfh_fh, nfhp->nfh_len, cred, p, &dp);
321			}
322		} else {
323			error = EIO;
324		}
325		newnfs_copyincred(cred, &op->nfso_cred);
326	    } else if (ret == NFSCLOPEN_SETCRED)
327		/*
328		 * This is a new local open on a delegation. It needs
329		 * to have credentials so that an open can be done
330		 * against the server during recovery.
331		 */
332		newnfs_copyincred(cred, &op->nfso_cred);
333
334	    /*
335	     * nfso_opencnt is the count of how many VOP_OPEN()s have
336	     * been done on this Open successfully and a VOP_CLOSE()
337	     * is expected for each of these.
338	     * If error is non-zero, don't increment it, since the Open
339	     * hasn't succeeded yet.
340	     */
341	    if (!error)
342		op->nfso_opencnt++;
343	    nfscl_openrelease(op, error, newone);
344	    if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
345		error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
346		error == NFSERR_BADSESSION) {
347		(void) nfs_catnap(PZERO, error, "nfs_open");
348	    } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
349		&& clidrev != 0) {
350		expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
351		retrycnt++;
352	    }
353	} while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
354	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
355	    error == NFSERR_BADSESSION ||
356	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
357	     expireret == 0 && clidrev != 0 && retrycnt < 4));
358	if (error && retrycnt >= 4)
359		error = EIO;
360	return (error);
361}
362
363/*
364 * the actual open rpc
365 */
366APPLESTATIC int
367nfsrpc_openrpc(struct nfsmount *nmp, vnode_t vp, u_int8_t *nfhp, int fhlen,
368    u_int8_t *newfhp, int newfhlen, u_int32_t mode, struct nfsclopen *op,
369    u_int8_t *name, int namelen, struct nfscldeleg **dpp,
370    int reclaim, u_int32_t delegtype, struct ucred *cred, NFSPROC_T *p,
371    int syscred, int recursed)
372{
373	u_int32_t *tl;
374	struct nfsrv_descript nfsd, *nd = &nfsd;
375	struct nfscldeleg *dp, *ndp = NULL;
376	struct nfsvattr nfsva;
377	u_int32_t rflags, deleg;
378	nfsattrbit_t attrbits;
379	int error, ret, acesize, limitby;
380
381	dp = *dpp;
382	*dpp = NULL;
383	nfscl_reqstart(nd, NFSPROC_OPEN, nmp, nfhp, fhlen, NULL, NULL);
384	NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
385	*tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
386	*tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
387	*tl++ = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
388	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
389	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
390	(void) nfsm_strtom(nd, op->nfso_own->nfsow_owner, NFSV4CL_LOCKNAMELEN);
391	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
392	*tl++ = txdr_unsigned(NFSV4OPEN_NOCREATE);
393	if (reclaim) {
394		*tl = txdr_unsigned(NFSV4OPEN_CLAIMPREVIOUS);
395		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
396		*tl = txdr_unsigned(delegtype);
397	} else {
398		if (dp != NULL) {
399			*tl = txdr_unsigned(NFSV4OPEN_CLAIMDELEGATECUR);
400			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
401			if (NFSHASNFSV4N(nmp))
402				*tl++ = 0;
403			else
404				*tl++ = dp->nfsdl_stateid.seqid;
405			*tl++ = dp->nfsdl_stateid.other[0];
406			*tl++ = dp->nfsdl_stateid.other[1];
407			*tl = dp->nfsdl_stateid.other[2];
408		} else {
409			*tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
410		}
411		(void) nfsm_strtom(nd, name, namelen);
412	}
413	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
414	*tl = txdr_unsigned(NFSV4OP_GETATTR);
415	NFSZERO_ATTRBIT(&attrbits);
416	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_CHANGE);
417	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TIMEMODIFY);
418	(void) nfsrv_putattrbit(nd, &attrbits);
419	if (syscred)
420		nd->nd_flag |= ND_USEGSSNAME;
421	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
422	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
423	if (error)
424		return (error);
425	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
426	if (!nd->nd_repstat) {
427		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
428		    6 * NFSX_UNSIGNED);
429		op->nfso_stateid.seqid = *tl++;
430		op->nfso_stateid.other[0] = *tl++;
431		op->nfso_stateid.other[1] = *tl++;
432		op->nfso_stateid.other[2] = *tl;
433		rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
434		error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
435		if (error)
436			goto nfsmout;
437		NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
438		deleg = fxdr_unsigned(u_int32_t, *tl);
439		if (deleg == NFSV4OPEN_DELEGATEREAD ||
440		    deleg == NFSV4OPEN_DELEGATEWRITE) {
441			if (!(op->nfso_own->nfsow_clp->nfsc_flags &
442			      NFSCLFLAGS_FIRSTDELEG))
443				op->nfso_own->nfsow_clp->nfsc_flags |=
444				  (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
445			MALLOC(ndp, struct nfscldeleg *,
446			    sizeof (struct nfscldeleg) + newfhlen,
447			    M_NFSCLDELEG, M_WAITOK);
448			LIST_INIT(&ndp->nfsdl_owner);
449			LIST_INIT(&ndp->nfsdl_lock);
450			ndp->nfsdl_clp = op->nfso_own->nfsow_clp;
451			ndp->nfsdl_fhlen = newfhlen;
452			NFSBCOPY(newfhp, ndp->nfsdl_fh, newfhlen);
453			newnfs_copyincred(cred, &ndp->nfsdl_cred);
454			nfscl_lockinit(&ndp->nfsdl_rwlock);
455			NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
456			    NFSX_UNSIGNED);
457			ndp->nfsdl_stateid.seqid = *tl++;
458			ndp->nfsdl_stateid.other[0] = *tl++;
459			ndp->nfsdl_stateid.other[1] = *tl++;
460			ndp->nfsdl_stateid.other[2] = *tl++;
461			ret = fxdr_unsigned(int, *tl);
462			if (deleg == NFSV4OPEN_DELEGATEWRITE) {
463				ndp->nfsdl_flags = NFSCLDL_WRITE;
464				/*
465				 * Indicates how much the file can grow.
466				 */
467				NFSM_DISSECT(tl, u_int32_t *,
468				    3 * NFSX_UNSIGNED);
469				limitby = fxdr_unsigned(int, *tl++);
470				switch (limitby) {
471				case NFSV4OPEN_LIMITSIZE:
472					ndp->nfsdl_sizelimit = fxdr_hyper(tl);
473					break;
474				case NFSV4OPEN_LIMITBLOCKS:
475					ndp->nfsdl_sizelimit =
476					    fxdr_unsigned(u_int64_t, *tl++);
477					ndp->nfsdl_sizelimit *=
478					    fxdr_unsigned(u_int64_t, *tl);
479					break;
480				default:
481					error = NFSERR_BADXDR;
482					goto nfsmout;
483				};
484			} else {
485				ndp->nfsdl_flags = NFSCLDL_READ;
486			}
487			if (ret)
488				ndp->nfsdl_flags |= NFSCLDL_RECALL;
489			error = nfsrv_dissectace(nd, &ndp->nfsdl_ace, &ret,
490			    &acesize, p);
491			if (error)
492				goto nfsmout;
493		} else if (deleg != NFSV4OPEN_DELEGATENONE) {
494			error = NFSERR_BADXDR;
495			goto nfsmout;
496		}
497		NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
498		error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
499		    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
500		    NULL, NULL, NULL, p, cred);
501		if (error)
502			goto nfsmout;
503		if (ndp != NULL) {
504			ndp->nfsdl_change = nfsva.na_filerev;
505			ndp->nfsdl_modtime = nfsva.na_mtime;
506			ndp->nfsdl_flags |= NFSCLDL_MODTIMESET;
507		}
508		if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM)) {
509		    do {
510			ret = nfsrpc_openconfirm(vp, newfhp, newfhlen, op,
511			    cred, p);
512			if (ret == NFSERR_DELAY)
513			    (void) nfs_catnap(PZERO, ret, "nfs_open");
514		    } while (ret == NFSERR_DELAY);
515		    error = ret;
516		}
517		if ((rflags & NFSV4OPEN_LOCKTYPEPOSIX) ||
518		    nfscl_assumeposixlocks)
519		    op->nfso_posixlock = 1;
520		else
521		    op->nfso_posixlock = 0;
522
523		/*
524		 * If the server is handing out delegations, but we didn't
525		 * get one because an OpenConfirm was required, try the
526		 * Open again, to get a delegation. This is a harmless no-op,
527		 * from a server's point of view.
528		 */
529		if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM) &&
530		    (op->nfso_own->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG)
531		    && !error && dp == NULL && ndp == NULL && !recursed) {
532		    do {
533			ret = nfsrpc_openrpc(nmp, vp, nfhp, fhlen, newfhp,
534			    newfhlen, mode, op, name, namelen, &ndp, 0, 0x0,
535			    cred, p, syscred, 1);
536			if (ret == NFSERR_DELAY)
537			    (void) nfs_catnap(PZERO, ret, "nfs_open2");
538		    } while (ret == NFSERR_DELAY);
539		    if (ret) {
540			if (ndp != NULL)
541				FREE((caddr_t)ndp, M_NFSCLDELEG);
542			if (ret == NFSERR_STALECLIENTID ||
543			    ret == NFSERR_STALEDONTRECOVER ||
544			    ret == NFSERR_BADSESSION)
545				error = ret;
546		    }
547		}
548	}
549	if (nd->nd_repstat != 0 && error == 0)
550		error = nd->nd_repstat;
551	if (error == NFSERR_STALECLIENTID || error == NFSERR_BADSESSION)
552		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
553nfsmout:
554	if (!error)
555		*dpp = ndp;
556	else if (ndp != NULL)
557		FREE((caddr_t)ndp, M_NFSCLDELEG);
558	mbuf_freem(nd->nd_mrep);
559	return (error);
560}
561
562/*
563 * open downgrade rpc
564 */
565APPLESTATIC int
566nfsrpc_opendowngrade(vnode_t vp, u_int32_t mode, struct nfsclopen *op,
567    struct ucred *cred, NFSPROC_T *p)
568{
569	u_int32_t *tl;
570	struct nfsrv_descript nfsd, *nd = &nfsd;
571	int error;
572
573	NFSCL_REQSTART(nd, NFSPROC_OPENDOWNGRADE, vp);
574	NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 3 * NFSX_UNSIGNED);
575	if (NFSHASNFSV4N(VFSTONFS(vnode_mount(vp))))
576		*tl++ = 0;
577	else
578		*tl++ = op->nfso_stateid.seqid;
579	*tl++ = op->nfso_stateid.other[0];
580	*tl++ = op->nfso_stateid.other[1];
581	*tl++ = op->nfso_stateid.other[2];
582	*tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
583	*tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
584	*tl = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
585	error = nfscl_request(nd, vp, p, cred, NULL);
586	if (error)
587		return (error);
588	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
589	if (!nd->nd_repstat) {
590		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
591		op->nfso_stateid.seqid = *tl++;
592		op->nfso_stateid.other[0] = *tl++;
593		op->nfso_stateid.other[1] = *tl++;
594		op->nfso_stateid.other[2] = *tl;
595	}
596	if (nd->nd_repstat && error == 0)
597		error = nd->nd_repstat;
598	if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
599		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
600nfsmout:
601	mbuf_freem(nd->nd_mrep);
602	return (error);
603}
604
605/*
606 * V4 Close operation.
607 */
608APPLESTATIC int
609nfsrpc_close(vnode_t vp, int doclose, NFSPROC_T *p)
610{
611	struct nfsclclient *clp;
612	int error;
613
614	if (vnode_vtype(vp) != VREG)
615		return (0);
616	if (doclose)
617		error = nfscl_doclose(vp, &clp, p);
618	else
619		error = nfscl_getclose(vp, &clp);
620	if (error)
621		return (error);
622
623	nfscl_clientrelease(clp);
624	return (0);
625}
626
627/*
628 * Close the open.
629 */
630APPLESTATIC void
631nfsrpc_doclose(struct nfsmount *nmp, struct nfsclopen *op, NFSPROC_T *p)
632{
633	struct nfsrv_descript nfsd, *nd = &nfsd;
634	struct nfscllockowner *lp, *nlp;
635	struct nfscllock *lop, *nlop;
636	struct ucred *tcred;
637	u_int64_t off = 0, len = 0;
638	u_int32_t type = NFSV4LOCKT_READ;
639	int error, do_unlock, trycnt;
640
641	tcred = newnfs_getcred();
642	newnfs_copycred(&op->nfso_cred, tcred);
643	/*
644	 * (Theoretically this could be done in the same
645	 *  compound as the close, but having multiple
646	 *  sequenced Ops in the same compound might be
647	 *  too scary for some servers.)
648	 */
649	if (op->nfso_posixlock) {
650		off = 0;
651		len = NFS64BITSSET;
652		type = NFSV4LOCKT_READ;
653	}
654
655	/*
656	 * Since this function is only called from VOP_INACTIVE(), no
657	 * other thread will be manipulating this Open. As such, the
658	 * lock lists are not being changed by other threads, so it should
659	 * be safe to do this without locking.
660	 */
661	LIST_FOREACH(lp, &op->nfso_lock, nfsl_list) {
662		do_unlock = 1;
663		LIST_FOREACH_SAFE(lop, &lp->nfsl_lock, nfslo_list, nlop) {
664			if (op->nfso_posixlock == 0) {
665				off = lop->nfslo_first;
666				len = lop->nfslo_end - lop->nfslo_first;
667				if (lop->nfslo_type == F_WRLCK)
668					type = NFSV4LOCKT_WRITE;
669				else
670					type = NFSV4LOCKT_READ;
671			}
672			if (do_unlock) {
673				trycnt = 0;
674				do {
675					error = nfsrpc_locku(nd, nmp, lp, off,
676					    len, type, tcred, p, 0);
677					if ((nd->nd_repstat == NFSERR_GRACE ||
678					    nd->nd_repstat == NFSERR_DELAY) &&
679					    error == 0)
680						(void) nfs_catnap(PZERO,
681						    (int)nd->nd_repstat,
682						    "nfs_close");
683				} while ((nd->nd_repstat == NFSERR_GRACE ||
684				    nd->nd_repstat == NFSERR_DELAY) &&
685				    error == 0 && trycnt++ < 5);
686				if (op->nfso_posixlock)
687					do_unlock = 0;
688			}
689			nfscl_freelock(lop, 0);
690		}
691		/*
692		 * Do a ReleaseLockOwner.
693		 * The lock owner name nfsl_owner may be used by other opens for
694		 * other files but the lock_owner4 name that nfsrpc_rellockown()
695		 * puts on the wire has the file handle for this file appended
696		 * to it, so it can be done now.
697		 */
698		(void)nfsrpc_rellockown(nmp, lp, lp->nfsl_open->nfso_fh,
699		    lp->nfsl_open->nfso_fhlen, tcred, p);
700	}
701
702	/*
703	 * There could be other Opens for different files on the same
704	 * OpenOwner, so locking is required.
705	 */
706	NFSLOCKCLSTATE();
707	nfscl_lockexcl(&op->nfso_own->nfsow_rwlock, NFSCLSTATEMUTEXPTR);
708	NFSUNLOCKCLSTATE();
709	do {
710		error = nfscl_tryclose(op, tcred, nmp, p);
711		if (error == NFSERR_GRACE)
712			(void) nfs_catnap(PZERO, error, "nfs_close");
713	} while (error == NFSERR_GRACE);
714	NFSLOCKCLSTATE();
715	nfscl_lockunlock(&op->nfso_own->nfsow_rwlock);
716
717	LIST_FOREACH_SAFE(lp, &op->nfso_lock, nfsl_list, nlp)
718		nfscl_freelockowner(lp, 0);
719	nfscl_freeopen(op, 0);
720	NFSUNLOCKCLSTATE();
721	NFSFREECRED(tcred);
722}
723
724/*
725 * The actual Close RPC.
726 */
727APPLESTATIC int
728nfsrpc_closerpc(struct nfsrv_descript *nd, struct nfsmount *nmp,
729    struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p,
730    int syscred)
731{
732	u_int32_t *tl;
733	int error;
734
735	nfscl_reqstart(nd, NFSPROC_CLOSE, nmp, op->nfso_fh,
736	    op->nfso_fhlen, NULL, NULL);
737	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
738	*tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
739	if (NFSHASNFSV4N(nmp))
740		*tl++ = 0;
741	else
742		*tl++ = op->nfso_stateid.seqid;
743	*tl++ = op->nfso_stateid.other[0];
744	*tl++ = op->nfso_stateid.other[1];
745	*tl = op->nfso_stateid.other[2];
746	if (syscred)
747		nd->nd_flag |= ND_USEGSSNAME;
748	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
749	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
750	if (error)
751		return (error);
752	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
753	if (nd->nd_repstat == 0)
754		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
755	error = nd->nd_repstat;
756	if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
757		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
758nfsmout:
759	mbuf_freem(nd->nd_mrep);
760	return (error);
761}
762
763/*
764 * V4 Open Confirm RPC.
765 */
766APPLESTATIC int
767nfsrpc_openconfirm(vnode_t vp, u_int8_t *nfhp, int fhlen,
768    struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p)
769{
770	u_int32_t *tl;
771	struct nfsrv_descript nfsd, *nd = &nfsd;
772	struct nfsmount *nmp;
773	int error;
774
775	nmp = VFSTONFS(vnode_mount(vp));
776	if (NFSHASNFSV4N(nmp))
777		return (0);		/* No confirmation for NFSv4.1. */
778	nfscl_reqstart(nd, NFSPROC_OPENCONFIRM, nmp, nfhp, fhlen, NULL, NULL);
779	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
780	*tl++ = op->nfso_stateid.seqid;
781	*tl++ = op->nfso_stateid.other[0];
782	*tl++ = op->nfso_stateid.other[1];
783	*tl++ = op->nfso_stateid.other[2];
784	*tl = txdr_unsigned(op->nfso_own->nfsow_seqid);
785	error = nfscl_request(nd, vp, p, cred, NULL);
786	if (error)
787		return (error);
788	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
789	if (!nd->nd_repstat) {
790		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
791		op->nfso_stateid.seqid = *tl++;
792		op->nfso_stateid.other[0] = *tl++;
793		op->nfso_stateid.other[1] = *tl++;
794		op->nfso_stateid.other[2] = *tl;
795	}
796	error = nd->nd_repstat;
797	if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
798		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
799nfsmout:
800	mbuf_freem(nd->nd_mrep);
801	return (error);
802}
803
804/*
805 * Do the setclientid and setclientid confirm RPCs. Called from nfs_statfs()
806 * when a mount has just occurred and when the server replies NFSERR_EXPIRED.
807 */
808APPLESTATIC int
809nfsrpc_setclient(struct nfsmount *nmp, struct nfsclclient *clp, int reclaim,
810    struct ucred *cred, NFSPROC_T *p)
811{
812	u_int32_t *tl;
813	struct nfsrv_descript nfsd;
814	struct nfsrv_descript *nd = &nfsd;
815	nfsattrbit_t attrbits;
816	u_int8_t *cp = NULL, *cp2, addr[INET6_ADDRSTRLEN + 9];
817	u_short port;
818	int error, isinet6 = 0, callblen;
819	nfsquad_t confirm;
820	u_int32_t lease;
821	static u_int32_t rev = 0;
822	struct nfsclds *dsp, *ndsp, *tdsp;
823
824	if (nfsboottime.tv_sec == 0)
825		NFSSETBOOTTIME(nfsboottime);
826	clp->nfsc_rev = rev++;
827	if (NFSHASNFSV4N(nmp)) {
828		error = nfsrpc_exchangeid(nmp, clp, &nmp->nm_sockreq,
829		    NFSV4EXCH_USEPNFSMDS | NFSV4EXCH_USENONPNFS, &dsp, cred, p);
830		NFSCL_DEBUG(1, "aft exch=%d\n", error);
831		if (error == 0) {
832			error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
833			    &nmp->nm_sockreq,
834			    dsp->nfsclds_sess.nfsess_sequenceid, 1, cred, p);
835			if (error == 0) {
836				NFSLOCKMNT(nmp);
837				TAILQ_FOREACH_SAFE(tdsp, &nmp->nm_sess,
838				    nfsclds_list, ndsp)
839					nfscl_freenfsclds(tdsp);
840				TAILQ_INIT(&nmp->nm_sess);
841				TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp,
842				    nfsclds_list);
843				NFSUNLOCKMNT(nmp);
844			} else
845				nfscl_freenfsclds(dsp);
846			NFSCL_DEBUG(1, "aft createsess=%d\n", error);
847		}
848		if (error == 0 && reclaim == 0) {
849			error = nfsrpc_reclaimcomplete(nmp, cred, p);
850			NFSCL_DEBUG(1, "aft reclaimcomp=%d\n", error);
851			if (error == NFSERR_COMPLETEALREADY ||
852			    error == NFSERR_NOTSUPP)
853				/* Ignore this error. */
854				error = 0;
855		}
856		return (error);
857	}
858
859	/*
860	 * Allocate a single session structure for NFSv4.0, because some of
861	 * the fields are used by NFSv4.0 although it doesn't do a session.
862	 */
863	dsp = malloc(sizeof(struct nfsclds), M_NFSCLDS, M_WAITOK | M_ZERO);
864	mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
865	mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession", NULL, MTX_DEF);
866	NFSLOCKMNT(nmp);
867	TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp, nfsclds_list);
868	NFSUNLOCKMNT(nmp);
869
870	nfscl_reqstart(nd, NFSPROC_SETCLIENTID, nmp, NULL, 0, NULL, NULL);
871	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
872	*tl++ = txdr_unsigned(nfsboottime.tv_sec);
873	*tl = txdr_unsigned(clp->nfsc_rev);
874	(void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
875
876	/*
877	 * set up the callback address
878	 */
879	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
880	*tl = txdr_unsigned(NFS_CALLBCKPROG);
881	callblen = strlen(nfsv4_callbackaddr);
882	if (callblen == 0)
883		cp = nfscl_getmyip(nmp, &isinet6);
884	if (nfscl_enablecallb && nfs_numnfscbd > 0 &&
885	    (callblen > 0 || cp != NULL)) {
886		port = htons(nfsv4_cbport);
887		cp2 = (u_int8_t *)&port;
888#ifdef INET6
889		if ((callblen > 0 &&
890		     strchr(nfsv4_callbackaddr, ':')) || isinet6) {
891			char ip6buf[INET6_ADDRSTRLEN], *ip6add;
892
893			(void) nfsm_strtom(nd, "tcp6", 4);
894			if (callblen == 0) {
895				ip6_sprintf(ip6buf, (struct in6_addr *)cp);
896				ip6add = ip6buf;
897			} else {
898				ip6add = nfsv4_callbackaddr;
899			}
900			snprintf(addr, INET6_ADDRSTRLEN + 9, "%s.%d.%d",
901			    ip6add, cp2[0], cp2[1]);
902		} else
903#endif
904		{
905			(void) nfsm_strtom(nd, "tcp", 3);
906			if (callblen == 0)
907				snprintf(addr, INET6_ADDRSTRLEN + 9,
908				    "%d.%d.%d.%d.%d.%d", cp[0], cp[1],
909				    cp[2], cp[3], cp2[0], cp2[1]);
910			else
911				snprintf(addr, INET6_ADDRSTRLEN + 9,
912				    "%s.%d.%d", nfsv4_callbackaddr,
913				    cp2[0], cp2[1]);
914		}
915		(void) nfsm_strtom(nd, addr, strlen(addr));
916	} else {
917		(void) nfsm_strtom(nd, "tcp", 3);
918		(void) nfsm_strtom(nd, "0.0.0.0.0.0", 11);
919	}
920	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
921	*tl = txdr_unsigned(clp->nfsc_cbident);
922	nd->nd_flag |= ND_USEGSSNAME;
923	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
924		NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
925	if (error)
926		return (error);
927	if (nd->nd_repstat == 0) {
928	    NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
929	    NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0] = *tl++;
930	    NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1] = *tl++;
931	    confirm.lval[0] = *tl++;
932	    confirm.lval[1] = *tl;
933	    mbuf_freem(nd->nd_mrep);
934	    nd->nd_mrep = NULL;
935
936	    /*
937	     * and confirm it.
938	     */
939	    nfscl_reqstart(nd, NFSPROC_SETCLIENTIDCFRM, nmp, NULL, 0, NULL,
940		NULL);
941	    NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
942	    *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
943	    *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
944	    *tl++ = confirm.lval[0];
945	    *tl = confirm.lval[1];
946	    nd->nd_flag |= ND_USEGSSNAME;
947	    error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
948		cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
949	    if (error)
950		return (error);
951	    mbuf_freem(nd->nd_mrep);
952	    nd->nd_mrep = NULL;
953	    if (nd->nd_repstat == 0) {
954		nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, nmp->nm_fh,
955		    nmp->nm_fhsize, NULL, NULL);
956		NFSZERO_ATTRBIT(&attrbits);
957		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
958		(void) nfsrv_putattrbit(nd, &attrbits);
959		nd->nd_flag |= ND_USEGSSNAME;
960		error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
961		    cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
962		if (error)
963		    return (error);
964		if (nd->nd_repstat == 0) {
965		    error = nfsv4_loadattr(nd, NULL, NULL, NULL, NULL, 0, NULL,
966			NULL, NULL, NULL, NULL, 0, NULL, &lease, NULL, p, cred);
967		    if (error)
968			goto nfsmout;
969		    clp->nfsc_renew = NFSCL_RENEW(lease);
970		    clp->nfsc_expire = NFSD_MONOSEC + clp->nfsc_renew;
971		    clp->nfsc_clientidrev++;
972		    if (clp->nfsc_clientidrev == 0)
973			clp->nfsc_clientidrev++;
974		}
975	    }
976	}
977	error = nd->nd_repstat;
978nfsmout:
979	mbuf_freem(nd->nd_mrep);
980	return (error);
981}
982
983/*
984 * nfs getattr call.
985 */
986APPLESTATIC int
987nfsrpc_getattr(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
988    struct nfsvattr *nap, void *stuff)
989{
990	struct nfsrv_descript nfsd, *nd = &nfsd;
991	int error;
992	nfsattrbit_t attrbits;
993
994	NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
995	if (nd->nd_flag & ND_NFSV4) {
996		NFSGETATTR_ATTRBIT(&attrbits);
997		(void) nfsrv_putattrbit(nd, &attrbits);
998	}
999	error = nfscl_request(nd, vp, p, cred, stuff);
1000	if (error)
1001		return (error);
1002	if (!nd->nd_repstat)
1003		error = nfsm_loadattr(nd, nap);
1004	else
1005		error = nd->nd_repstat;
1006	mbuf_freem(nd->nd_mrep);
1007	return (error);
1008}
1009
1010/*
1011 * nfs getattr call with non-vnode arguemnts.
1012 */
1013APPLESTATIC int
1014nfsrpc_getattrnovp(struct nfsmount *nmp, u_int8_t *fhp, int fhlen, int syscred,
1015    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, u_int64_t *xidp,
1016    uint32_t *leasep)
1017{
1018	struct nfsrv_descript nfsd, *nd = &nfsd;
1019	int error, vers = NFS_VER2;
1020	nfsattrbit_t attrbits;
1021
1022	nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, fhp, fhlen, NULL, NULL);
1023	if (nd->nd_flag & ND_NFSV4) {
1024		vers = NFS_VER4;
1025		NFSGETATTR_ATTRBIT(&attrbits);
1026		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
1027		(void) nfsrv_putattrbit(nd, &attrbits);
1028	} else if (nd->nd_flag & ND_NFSV3) {
1029		vers = NFS_VER3;
1030	}
1031	if (syscred)
1032		nd->nd_flag |= ND_USEGSSNAME;
1033	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
1034	    NFS_PROG, vers, NULL, 1, xidp, NULL);
1035	if (error)
1036		return (error);
1037	if (nd->nd_repstat == 0) {
1038		if ((nd->nd_flag & ND_NFSV4) != 0)
1039			error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
1040			    NULL, NULL, NULL, NULL, NULL, 0, NULL, leasep, NULL,
1041			    NULL, NULL);
1042		else
1043			error = nfsm_loadattr(nd, nap);
1044	} else
1045		error = nd->nd_repstat;
1046	mbuf_freem(nd->nd_mrep);
1047	return (error);
1048}
1049
1050/*
1051 * Do an nfs setattr operation.
1052 */
1053APPLESTATIC int
1054nfsrpc_setattr(vnode_t vp, struct vattr *vap, NFSACL_T *aclp,
1055    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *rnap, int *attrflagp,
1056    void *stuff)
1057{
1058	int error, expireret = 0, openerr, retrycnt;
1059	u_int32_t clidrev = 0, mode;
1060	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1061	struct nfsfh *nfhp;
1062	nfsv4stateid_t stateid;
1063	void *lckp;
1064
1065	if (nmp->nm_clp != NULL)
1066		clidrev = nmp->nm_clp->nfsc_clientidrev;
1067	if (vap != NULL && NFSATTRISSET(u_quad_t, vap, va_size))
1068		mode = NFSV4OPEN_ACCESSWRITE;
1069	else
1070		mode = NFSV4OPEN_ACCESSREAD;
1071	retrycnt = 0;
1072	do {
1073		lckp = NULL;
1074		openerr = 1;
1075		if (NFSHASNFSV4(nmp)) {
1076			nfhp = VTONFS(vp)->n_fhp;
1077			error = nfscl_getstateid(vp, nfhp->nfh_fh,
1078			    nfhp->nfh_len, mode, 0, cred, p, &stateid, &lckp);
1079			if (error && vnode_vtype(vp) == VREG &&
1080			    (mode == NFSV4OPEN_ACCESSWRITE ||
1081			     nfstest_openallsetattr)) {
1082				/*
1083				 * No Open stateid, so try and open the file
1084				 * now.
1085				 */
1086				if (mode == NFSV4OPEN_ACCESSWRITE)
1087					openerr = nfsrpc_open(vp, FWRITE, cred,
1088					    p);
1089				else
1090					openerr = nfsrpc_open(vp, FREAD, cred,
1091					    p);
1092				if (!openerr)
1093					(void) nfscl_getstateid(vp,
1094					    nfhp->nfh_fh, nfhp->nfh_len,
1095					    mode, 0, cred, p, &stateid, &lckp);
1096			}
1097		}
1098		if (vap != NULL)
1099			error = nfsrpc_setattrrpc(vp, vap, &stateid, cred, p,
1100			    rnap, attrflagp, stuff);
1101		else
1102			error = nfsrpc_setaclrpc(vp, cred, p, aclp, &stateid,
1103			    stuff);
1104		if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1105			nfscl_initiate_recovery(nmp->nm_clp);
1106		if (lckp != NULL)
1107			nfscl_lockderef(lckp);
1108		if (!openerr)
1109			(void) nfsrpc_close(vp, 0, p);
1110		if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1111		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1112		    error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1113			(void) nfs_catnap(PZERO, error, "nfs_setattr");
1114		} else if ((error == NFSERR_EXPIRED ||
1115		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1116			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1117		}
1118		retrycnt++;
1119	} while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1120	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1121	    error == NFSERR_BADSESSION ||
1122	    (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1123	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1124	     expireret == 0 && clidrev != 0 && retrycnt < 4));
1125	if (error && retrycnt >= 4)
1126		error = EIO;
1127	return (error);
1128}
1129
1130static int
1131nfsrpc_setattrrpc(vnode_t vp, struct vattr *vap,
1132    nfsv4stateid_t *stateidp, struct ucred *cred, NFSPROC_T *p,
1133    struct nfsvattr *rnap, int *attrflagp, void *stuff)
1134{
1135	u_int32_t *tl;
1136	struct nfsrv_descript nfsd, *nd = &nfsd;
1137	int error;
1138	nfsattrbit_t attrbits;
1139
1140	*attrflagp = 0;
1141	NFSCL_REQSTART(nd, NFSPROC_SETATTR, vp);
1142	if (nd->nd_flag & ND_NFSV4)
1143		nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1144	vap->va_type = vnode_vtype(vp);
1145	nfscl_fillsattr(nd, vap, vp, NFSSATTR_FULL, 0);
1146	if (nd->nd_flag & ND_NFSV3) {
1147		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1148		*tl = newnfs_false;
1149	} else if (nd->nd_flag & ND_NFSV4) {
1150		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1151		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1152		NFSGETATTR_ATTRBIT(&attrbits);
1153		(void) nfsrv_putattrbit(nd, &attrbits);
1154	}
1155	error = nfscl_request(nd, vp, p, cred, stuff);
1156	if (error)
1157		return (error);
1158	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1159		error = nfscl_wcc_data(nd, vp, rnap, attrflagp, NULL, stuff);
1160	if ((nd->nd_flag & ND_NFSV4) && !error)
1161		error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
1162	if (!(nd->nd_flag & ND_NFSV3) && !nd->nd_repstat && !error)
1163		error = nfscl_postop_attr(nd, rnap, attrflagp, stuff);
1164	mbuf_freem(nd->nd_mrep);
1165	if (nd->nd_repstat && !error)
1166		error = nd->nd_repstat;
1167	return (error);
1168}
1169
1170/*
1171 * nfs lookup rpc
1172 */
1173APPLESTATIC int
1174nfsrpc_lookup(vnode_t dvp, char *name, int len, struct ucred *cred,
1175    NFSPROC_T *p, struct nfsvattr *dnap, struct nfsvattr *nap,
1176    struct nfsfh **nfhpp, int *attrflagp, int *dattrflagp, void *stuff)
1177{
1178	u_int32_t *tl;
1179	struct nfsrv_descript nfsd, *nd = &nfsd;
1180	struct nfsmount *nmp;
1181	struct nfsnode *np;
1182	struct nfsfh *nfhp;
1183	nfsattrbit_t attrbits;
1184	int error = 0, lookupp = 0;
1185
1186	*attrflagp = 0;
1187	*dattrflagp = 0;
1188	if (vnode_vtype(dvp) != VDIR)
1189		return (ENOTDIR);
1190	nmp = VFSTONFS(vnode_mount(dvp));
1191	if (len > NFS_MAXNAMLEN)
1192		return (ENAMETOOLONG);
1193	if (NFSHASNFSV4(nmp) && len == 1 &&
1194		name[0] == '.') {
1195		/*
1196		 * Just return the current dir's fh.
1197		 */
1198		np = VTONFS(dvp);
1199		MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1200			np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1201		nfhp->nfh_len = np->n_fhp->nfh_len;
1202		NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1203		*nfhpp = nfhp;
1204		return (0);
1205	}
1206	if (NFSHASNFSV4(nmp) && len == 2 &&
1207		name[0] == '.' && name[1] == '.') {
1208		lookupp = 1;
1209		NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, dvp);
1210	} else {
1211		NFSCL_REQSTART(nd, NFSPROC_LOOKUP, dvp);
1212		(void) nfsm_strtom(nd, name, len);
1213	}
1214	if (nd->nd_flag & ND_NFSV4) {
1215		NFSGETATTR_ATTRBIT(&attrbits);
1216		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1217		*tl++ = txdr_unsigned(NFSV4OP_GETFH);
1218		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1219		(void) nfsrv_putattrbit(nd, &attrbits);
1220	}
1221	error = nfscl_request(nd, dvp, p, cred, stuff);
1222	if (error)
1223		return (error);
1224	if (nd->nd_repstat) {
1225		/*
1226		 * When an NFSv4 Lookupp returns ENOENT, it means that
1227		 * the lookup is at the root of an fs, so return this dir.
1228		 */
1229		if (nd->nd_repstat == NFSERR_NOENT && lookupp) {
1230		    np = VTONFS(dvp);
1231		    MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1232			np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1233		    nfhp->nfh_len = np->n_fhp->nfh_len;
1234		    NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1235		    *nfhpp = nfhp;
1236		    mbuf_freem(nd->nd_mrep);
1237		    return (0);
1238		}
1239		if (nd->nd_flag & ND_NFSV3)
1240		    error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1241		else if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
1242		    ND_NFSV4) {
1243			/* Load the directory attributes. */
1244			error = nfsm_loadattr(nd, dnap);
1245			if (error == 0)
1246				*dattrflagp = 1;
1247		}
1248		goto nfsmout;
1249	}
1250	if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
1251		/* Load the directory attributes. */
1252		error = nfsm_loadattr(nd, dnap);
1253		if (error != 0)
1254			goto nfsmout;
1255		*dattrflagp = 1;
1256		/* Skip over the Lookup and GetFH operation status values. */
1257		NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
1258	}
1259	error = nfsm_getfh(nd, nfhpp);
1260	if (error)
1261		goto nfsmout;
1262
1263	error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1264	if ((nd->nd_flag & ND_NFSV3) && !error)
1265		error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1266nfsmout:
1267	mbuf_freem(nd->nd_mrep);
1268	if (!error && nd->nd_repstat)
1269		error = nd->nd_repstat;
1270	return (error);
1271}
1272
1273/*
1274 * Do a readlink rpc.
1275 */
1276APPLESTATIC int
1277nfsrpc_readlink(vnode_t vp, struct uio *uiop, struct ucred *cred,
1278    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1279{
1280	u_int32_t *tl;
1281	struct nfsrv_descript nfsd, *nd = &nfsd;
1282	struct nfsnode *np = VTONFS(vp);
1283	nfsattrbit_t attrbits;
1284	int error, len, cangetattr = 1;
1285
1286	*attrflagp = 0;
1287	NFSCL_REQSTART(nd, NFSPROC_READLINK, vp);
1288	if (nd->nd_flag & ND_NFSV4) {
1289		/*
1290		 * And do a Getattr op.
1291		 */
1292		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1293		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1294		NFSGETATTR_ATTRBIT(&attrbits);
1295		(void) nfsrv_putattrbit(nd, &attrbits);
1296	}
1297	error = nfscl_request(nd, vp, p, cred, stuff);
1298	if (error)
1299		return (error);
1300	if (nd->nd_flag & ND_NFSV3)
1301		error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1302	if (!nd->nd_repstat && !error) {
1303		NFSM_STRSIZ(len, NFS_MAXPATHLEN);
1304		/*
1305		 * This seems weird to me, but must have been added to
1306		 * FreeBSD for some reason. The only thing I can think of
1307		 * is that there was/is some server that replies with
1308		 * more link data than it should?
1309		 */
1310		if (len == NFS_MAXPATHLEN) {
1311			NFSLOCKNODE(np);
1312			if (np->n_size > 0 && np->n_size < NFS_MAXPATHLEN) {
1313				len = np->n_size;
1314				cangetattr = 0;
1315			}
1316			NFSUNLOCKNODE(np);
1317		}
1318		error = nfsm_mbufuio(nd, uiop, len);
1319		if ((nd->nd_flag & ND_NFSV4) && !error && cangetattr)
1320			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1321	}
1322	if (nd->nd_repstat && !error)
1323		error = nd->nd_repstat;
1324nfsmout:
1325	mbuf_freem(nd->nd_mrep);
1326	return (error);
1327}
1328
1329/*
1330 * Read operation.
1331 */
1332APPLESTATIC int
1333nfsrpc_read(vnode_t vp, struct uio *uiop, struct ucred *cred,
1334    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1335{
1336	int error, expireret = 0, retrycnt;
1337	u_int32_t clidrev = 0;
1338	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1339	struct nfsnode *np = VTONFS(vp);
1340	struct ucred *newcred;
1341	struct nfsfh *nfhp = NULL;
1342	nfsv4stateid_t stateid;
1343	void *lckp;
1344
1345	if (nmp->nm_clp != NULL)
1346		clidrev = nmp->nm_clp->nfsc_clientidrev;
1347	newcred = cred;
1348	if (NFSHASNFSV4(nmp)) {
1349		nfhp = np->n_fhp;
1350		newcred = NFSNEWCRED(cred);
1351	}
1352	retrycnt = 0;
1353	do {
1354		lckp = NULL;
1355		if (NFSHASNFSV4(nmp))
1356			(void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1357			    NFSV4OPEN_ACCESSREAD, 0, newcred, p, &stateid,
1358			    &lckp);
1359		error = nfsrpc_readrpc(vp, uiop, newcred, &stateid, p, nap,
1360		    attrflagp, stuff);
1361		if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1362			nfscl_initiate_recovery(nmp->nm_clp);
1363		if (lckp != NULL)
1364			nfscl_lockderef(lckp);
1365		if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1366		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1367		    error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1368			(void) nfs_catnap(PZERO, error, "nfs_read");
1369		} else if ((error == NFSERR_EXPIRED ||
1370		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1371			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1372		}
1373		retrycnt++;
1374	} while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1375	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1376	    error == NFSERR_BADSESSION ||
1377	    (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1378	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1379	     expireret == 0 && clidrev != 0 && retrycnt < 4));
1380	if (error && retrycnt >= 4)
1381		error = EIO;
1382	if (NFSHASNFSV4(nmp))
1383		NFSFREECRED(newcred);
1384	return (error);
1385}
1386
1387/*
1388 * The actual read RPC.
1389 */
1390static int
1391nfsrpc_readrpc(vnode_t vp, struct uio *uiop, struct ucred *cred,
1392    nfsv4stateid_t *stateidp, NFSPROC_T *p, struct nfsvattr *nap,
1393    int *attrflagp, void *stuff)
1394{
1395	u_int32_t *tl;
1396	int error = 0, len, retlen, tsiz, eof = 0;
1397	struct nfsrv_descript nfsd;
1398	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1399	struct nfsrv_descript *nd = &nfsd;
1400	int rsize;
1401	off_t tmp_off;
1402
1403	*attrflagp = 0;
1404	tsiz = uio_uio_resid(uiop);
1405	tmp_off = uiop->uio_offset + tsiz;
1406	NFSLOCKMNT(nmp);
1407	if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1408		NFSUNLOCKMNT(nmp);
1409		return (EFBIG);
1410	}
1411	rsize = nmp->nm_rsize;
1412	NFSUNLOCKMNT(nmp);
1413	nd->nd_mrep = NULL;
1414	while (tsiz > 0) {
1415		*attrflagp = 0;
1416		len = (tsiz > rsize) ? rsize : tsiz;
1417		NFSCL_REQSTART(nd, NFSPROC_READ, vp);
1418		if (nd->nd_flag & ND_NFSV4)
1419			nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1420		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED * 3);
1421		if (nd->nd_flag & ND_NFSV2) {
1422			*tl++ = txdr_unsigned(uiop->uio_offset);
1423			*tl++ = txdr_unsigned(len);
1424			*tl = 0;
1425		} else {
1426			txdr_hyper(uiop->uio_offset, tl);
1427			*(tl + 2) = txdr_unsigned(len);
1428		}
1429		/*
1430		 * Since I can't do a Getattr for NFSv4 for Write, there
1431		 * doesn't seem any point in doing one here, either.
1432		 * (See the comment in nfsrpc_writerpc() for more info.)
1433		 */
1434		error = nfscl_request(nd, vp, p, cred, stuff);
1435		if (error)
1436			return (error);
1437		if (nd->nd_flag & ND_NFSV3) {
1438			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1439		} else if (!nd->nd_repstat && (nd->nd_flag & ND_NFSV2)) {
1440			error = nfsm_loadattr(nd, nap);
1441			if (!error)
1442				*attrflagp = 1;
1443		}
1444		if (nd->nd_repstat || error) {
1445			if (!error)
1446				error = nd->nd_repstat;
1447			goto nfsmout;
1448		}
1449		if (nd->nd_flag & ND_NFSV3) {
1450			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1451			eof = fxdr_unsigned(int, *(tl + 1));
1452		} else if (nd->nd_flag & ND_NFSV4) {
1453			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
1454			eof = fxdr_unsigned(int, *tl);
1455		}
1456		NFSM_STRSIZ(retlen, len);
1457		error = nfsm_mbufuio(nd, uiop, retlen);
1458		if (error)
1459			goto nfsmout;
1460		mbuf_freem(nd->nd_mrep);
1461		nd->nd_mrep = NULL;
1462		tsiz -= retlen;
1463		if (!(nd->nd_flag & ND_NFSV2)) {
1464			if (eof || retlen == 0)
1465				tsiz = 0;
1466		} else if (retlen < len)
1467			tsiz = 0;
1468	}
1469	return (0);
1470nfsmout:
1471	if (nd->nd_mrep != NULL)
1472		mbuf_freem(nd->nd_mrep);
1473	return (error);
1474}
1475
1476/*
1477 * nfs write operation
1478 * When called_from_strategy != 0, it should return EIO for an error that
1479 * indicates recovery is in progress, so that the buffer will be left
1480 * dirty and be written back to the server later. If it loops around,
1481 * the recovery thread could get stuck waiting for the buffer and recovery
1482 * will then deadlock.
1483 */
1484APPLESTATIC int
1485nfsrpc_write(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
1486    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
1487    void *stuff, int called_from_strategy)
1488{
1489	int error, expireret = 0, retrycnt, nostateid;
1490	u_int32_t clidrev = 0;
1491	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1492	struct nfsnode *np = VTONFS(vp);
1493	struct ucred *newcred;
1494	struct nfsfh *nfhp = NULL;
1495	nfsv4stateid_t stateid;
1496	void *lckp;
1497
1498	*must_commit = 0;
1499	if (nmp->nm_clp != NULL)
1500		clidrev = nmp->nm_clp->nfsc_clientidrev;
1501	newcred = cred;
1502	if (NFSHASNFSV4(nmp)) {
1503		newcred = NFSNEWCRED(cred);
1504		nfhp = np->n_fhp;
1505	}
1506	retrycnt = 0;
1507	do {
1508		lckp = NULL;
1509		nostateid = 0;
1510		if (NFSHASNFSV4(nmp)) {
1511			(void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1512			    NFSV4OPEN_ACCESSWRITE, 0, newcred, p, &stateid,
1513			    &lckp);
1514			if (stateid.other[0] == 0 && stateid.other[1] == 0 &&
1515			    stateid.other[2] == 0) {
1516				nostateid = 1;
1517				NFSCL_DEBUG(1, "stateid0 in write\n");
1518			}
1519		}
1520
1521		/*
1522		 * If there is no stateid for NFSv4, it means this is an
1523		 * extraneous write after close. Basically a poorly
1524		 * implemented buffer cache. Just don't do the write.
1525		 */
1526		if (nostateid)
1527			error = 0;
1528		else
1529			error = nfsrpc_writerpc(vp, uiop, iomode, must_commit,
1530			    newcred, &stateid, p, nap, attrflagp, stuff);
1531		if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1532			nfscl_initiate_recovery(nmp->nm_clp);
1533		if (lckp != NULL)
1534			nfscl_lockderef(lckp);
1535		if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1536		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1537		    error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1538			(void) nfs_catnap(PZERO, error, "nfs_write");
1539		} else if ((error == NFSERR_EXPIRED ||
1540		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1541			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1542		}
1543		retrycnt++;
1544	} while (error == NFSERR_GRACE || error == NFSERR_DELAY ||
1545	    ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1546	      error == NFSERR_STALEDONTRECOVER) && called_from_strategy == 0) ||
1547	    (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1548	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1549	     expireret == 0 && clidrev != 0 && retrycnt < 4));
1550	if (error != 0 && (retrycnt >= 4 ||
1551	    ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1552	      error == NFSERR_STALEDONTRECOVER) && called_from_strategy != 0)))
1553		error = EIO;
1554	if (NFSHASNFSV4(nmp))
1555		NFSFREECRED(newcred);
1556	return (error);
1557}
1558
1559/*
1560 * The actual write RPC.
1561 */
1562static int
1563nfsrpc_writerpc(vnode_t vp, struct uio *uiop, int *iomode,
1564    int *must_commit, struct ucred *cred, nfsv4stateid_t *stateidp,
1565    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1566{
1567	u_int32_t *tl;
1568	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1569	struct nfsnode *np = VTONFS(vp);
1570	int error = 0, len, tsiz, rlen, commit, committed = NFSWRITE_FILESYNC;
1571	int wccflag = 0, wsize;
1572	int32_t backup;
1573	struct nfsrv_descript nfsd;
1574	struct nfsrv_descript *nd = &nfsd;
1575	nfsattrbit_t attrbits;
1576	off_t tmp_off;
1577
1578	KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
1579	*attrflagp = 0;
1580	tsiz = uio_uio_resid(uiop);
1581	tmp_off = uiop->uio_offset + tsiz;
1582	NFSLOCKMNT(nmp);
1583	if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1584		NFSUNLOCKMNT(nmp);
1585		return (EFBIG);
1586	}
1587	wsize = nmp->nm_wsize;
1588	NFSUNLOCKMNT(nmp);
1589	nd->nd_mrep = NULL;	/* NFSv2 sometimes does a write with */
1590	nd->nd_repstat = 0;	/* uio_resid == 0, so the while is not done */
1591	while (tsiz > 0) {
1592		*attrflagp = 0;
1593		len = (tsiz > wsize) ? wsize : tsiz;
1594		NFSCL_REQSTART(nd, NFSPROC_WRITE, vp);
1595		if (nd->nd_flag & ND_NFSV4) {
1596			nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1597			NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+2*NFSX_UNSIGNED);
1598			txdr_hyper(uiop->uio_offset, tl);
1599			tl += 2;
1600			*tl++ = txdr_unsigned(*iomode);
1601			*tl = txdr_unsigned(len);
1602		} else if (nd->nd_flag & ND_NFSV3) {
1603			NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+3*NFSX_UNSIGNED);
1604			txdr_hyper(uiop->uio_offset, tl);
1605			tl += 2;
1606			*tl++ = txdr_unsigned(len);
1607			*tl++ = txdr_unsigned(*iomode);
1608			*tl = txdr_unsigned(len);
1609		} else {
1610			u_int32_t x;
1611
1612			NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
1613			/*
1614			 * Not sure why someone changed this, since the
1615			 * RFC clearly states that "beginoffset" and
1616			 * "totalcount" are ignored, but it wouldn't
1617			 * surprise me if there's a busted server out there.
1618			 */
1619			/* Set both "begin" and "current" to non-garbage. */
1620			x = txdr_unsigned((u_int32_t)uiop->uio_offset);
1621			*tl++ = x;      /* "begin offset" */
1622			*tl++ = x;      /* "current offset" */
1623			x = txdr_unsigned(len);
1624			*tl++ = x;      /* total to this offset */
1625			*tl = x;        /* size of this write */
1626
1627		}
1628		nfsm_uiombuf(nd, uiop, len);
1629		/*
1630		 * Although it is tempting to do a normal Getattr Op in the
1631		 * NFSv4 compound, the result can be a nearly hung client
1632		 * system if the Getattr asks for Owner and/or OwnerGroup.
1633		 * It occurs when the client can't map either the Owner or
1634		 * Owner_group name in the Getattr reply to a uid/gid. When
1635		 * there is a cache miss, the kernel does an upcall to the
1636		 * nfsuserd. Then, it can try and read the local /etc/passwd
1637		 * or /etc/group file. It can then block in getnewbuf(),
1638		 * waiting for dirty writes to be pushed to the NFS server.
1639		 * The only reason this doesn't result in a complete
1640		 * deadlock, is that the upcall times out and allows
1641		 * the write to complete. However, progress is so slow
1642		 * that it might just as well be deadlocked.
1643		 * As such, we get the rest of the attributes, but not
1644		 * Owner or Owner_group.
1645		 * nb: nfscl_loadattrcache() needs to be told that these
1646		 *     partial attributes from a write rpc are being
1647		 *     passed in, via a argument flag.
1648		 */
1649		if (nd->nd_flag & ND_NFSV4) {
1650			NFSWRITEGETATTR_ATTRBIT(&attrbits);
1651			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1652			*tl = txdr_unsigned(NFSV4OP_GETATTR);
1653			(void) nfsrv_putattrbit(nd, &attrbits);
1654		}
1655		error = nfscl_request(nd, vp, p, cred, stuff);
1656		if (error)
1657			return (error);
1658		if (nd->nd_repstat) {
1659			/*
1660			 * In case the rpc gets retried, roll
1661			 * the uio fileds changed by nfsm_uiombuf()
1662			 * back.
1663			 */
1664			uiop->uio_offset -= len;
1665			uio_uio_resid_add(uiop, len);
1666			uio_iov_base_add(uiop, -len);
1667			uio_iov_len_add(uiop, len);
1668		}
1669		if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1670			error = nfscl_wcc_data(nd, vp, nap, attrflagp,
1671			    &wccflag, stuff);
1672			if (error)
1673				goto nfsmout;
1674		}
1675		if (!nd->nd_repstat) {
1676			if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1677				NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED
1678					+ NFSX_VERF);
1679				rlen = fxdr_unsigned(int, *tl++);
1680				if (rlen == 0) {
1681					error = NFSERR_IO;
1682					goto nfsmout;
1683				} else if (rlen < len) {
1684					backup = len - rlen;
1685					uio_iov_base_add(uiop, -(backup));
1686					uio_iov_len_add(uiop, backup);
1687					uiop->uio_offset -= backup;
1688					uio_uio_resid_add(uiop, backup);
1689					len = rlen;
1690				}
1691				commit = fxdr_unsigned(int, *tl++);
1692
1693				/*
1694				 * Return the lowest committment level
1695				 * obtained by any of the RPCs.
1696				 */
1697				if (committed == NFSWRITE_FILESYNC)
1698					committed = commit;
1699				else if (committed == NFSWRITE_DATASYNC &&
1700					commit == NFSWRITE_UNSTABLE)
1701					committed = commit;
1702				NFSLOCKMNT(nmp);
1703				if (!NFSHASWRITEVERF(nmp)) {
1704					NFSBCOPY((caddr_t)tl,
1705					    (caddr_t)&nmp->nm_verf[0],
1706					    NFSX_VERF);
1707					NFSSETWRITEVERF(nmp);
1708	    			} else if (NFSBCMP(tl, nmp->nm_verf,
1709				    NFSX_VERF)) {
1710					*must_commit = 1;
1711					NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
1712				}
1713				NFSUNLOCKMNT(nmp);
1714			}
1715			if (nd->nd_flag & ND_NFSV4)
1716				NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1717			if (nd->nd_flag & (ND_NFSV2 | ND_NFSV4)) {
1718				error = nfsm_loadattr(nd, nap);
1719				if (!error)
1720					*attrflagp = NFS_LATTR_NOSHRINK;
1721			}
1722		} else {
1723			error = nd->nd_repstat;
1724		}
1725		if (error)
1726			goto nfsmout;
1727		NFSWRITERPC_SETTIME(wccflag, np, (nd->nd_flag & ND_NFSV4));
1728		mbuf_freem(nd->nd_mrep);
1729		nd->nd_mrep = NULL;
1730		tsiz -= len;
1731	}
1732nfsmout:
1733	if (nd->nd_mrep != NULL)
1734		mbuf_freem(nd->nd_mrep);
1735	*iomode = committed;
1736	if (nd->nd_repstat && !error)
1737		error = nd->nd_repstat;
1738	return (error);
1739}
1740
1741/*
1742 * nfs mknod rpc
1743 * For NFS v2 this is a kludge. Use a create rpc but with the IFMT bits of the
1744 * mode set to specify the file type and the size field for rdev.
1745 */
1746APPLESTATIC int
1747nfsrpc_mknod(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1748    u_int32_t rdev, enum vtype vtyp, struct ucred *cred, NFSPROC_T *p,
1749    struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1750    int *attrflagp, int *dattrflagp, void *dstuff)
1751{
1752	u_int32_t *tl;
1753	int error = 0;
1754	struct nfsrv_descript nfsd, *nd = &nfsd;
1755	nfsattrbit_t attrbits;
1756
1757	*nfhpp = NULL;
1758	*attrflagp = 0;
1759	*dattrflagp = 0;
1760	if (namelen > NFS_MAXNAMLEN)
1761		return (ENAMETOOLONG);
1762	NFSCL_REQSTART(nd, NFSPROC_MKNOD, dvp);
1763	if (nd->nd_flag & ND_NFSV4) {
1764		if (vtyp == VBLK || vtyp == VCHR) {
1765			NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
1766			*tl++ = vtonfsv34_type(vtyp);
1767			*tl++ = txdr_unsigned(NFSMAJOR(rdev));
1768			*tl = txdr_unsigned(NFSMINOR(rdev));
1769		} else {
1770			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1771			*tl = vtonfsv34_type(vtyp);
1772		}
1773	}
1774	(void) nfsm_strtom(nd, name, namelen);
1775	if (nd->nd_flag & ND_NFSV3) {
1776		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1777		*tl = vtonfsv34_type(vtyp);
1778	}
1779	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1780		nfscl_fillsattr(nd, vap, dvp, 0, 0);
1781	if ((nd->nd_flag & ND_NFSV3) &&
1782	    (vtyp == VCHR || vtyp == VBLK)) {
1783		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1784		*tl++ = txdr_unsigned(NFSMAJOR(rdev));
1785		*tl = txdr_unsigned(NFSMINOR(rdev));
1786	}
1787	if (nd->nd_flag & ND_NFSV4) {
1788		NFSGETATTR_ATTRBIT(&attrbits);
1789		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1790		*tl++ = txdr_unsigned(NFSV4OP_GETFH);
1791		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1792		(void) nfsrv_putattrbit(nd, &attrbits);
1793	}
1794	if (nd->nd_flag & ND_NFSV2)
1795		nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZERDEV, rdev);
1796	error = nfscl_request(nd, dvp, p, cred, dstuff);
1797	if (error)
1798		return (error);
1799	if (nd->nd_flag & ND_NFSV4)
1800		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1801	if (!nd->nd_repstat) {
1802		if (nd->nd_flag & ND_NFSV4) {
1803			NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
1804			error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
1805			if (error)
1806				goto nfsmout;
1807		}
1808		error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1809		if (error)
1810			goto nfsmout;
1811	}
1812	if (nd->nd_flag & ND_NFSV3)
1813		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1814	if (!error && nd->nd_repstat)
1815		error = nd->nd_repstat;
1816nfsmout:
1817	mbuf_freem(nd->nd_mrep);
1818	return (error);
1819}
1820
1821/*
1822 * nfs file create call
1823 * Mostly just call the approriate routine. (I separated out v4, so that
1824 * error recovery wouldn't be as difficult.)
1825 */
1826APPLESTATIC int
1827nfsrpc_create(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1828    nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1829    struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1830    int *attrflagp, int *dattrflagp, void *dstuff)
1831{
1832	int error = 0, newone, expireret = 0, retrycnt, unlocked;
1833	struct nfsclowner *owp;
1834	struct nfscldeleg *dp;
1835	struct nfsmount *nmp = VFSTONFS(vnode_mount(dvp));
1836	u_int32_t clidrev;
1837
1838	if (NFSHASNFSV4(nmp)) {
1839	    retrycnt = 0;
1840	    do {
1841		dp = NULL;
1842		error = nfscl_open(dvp, NULL, 0, (NFSV4OPEN_ACCESSWRITE |
1843		    NFSV4OPEN_ACCESSREAD), 0, cred, p, &owp, NULL, &newone,
1844		    NULL, 1);
1845		if (error)
1846			return (error);
1847		if (nmp->nm_clp != NULL)
1848			clidrev = nmp->nm_clp->nfsc_clientidrev;
1849		else
1850			clidrev = 0;
1851		error = nfsrpc_createv4(dvp, name, namelen, vap, cverf, fmode,
1852		  owp, &dp, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1853		  dstuff, &unlocked);
1854		/*
1855		 * There is no need to invalidate cached attributes here,
1856		 * since new post-delegation issue attributes are always
1857		 * returned by nfsrpc_createv4() and these will update the
1858		 * attribute cache.
1859		 */
1860		if (dp != NULL)
1861			(void) nfscl_deleg(nmp->nm_mountp, owp->nfsow_clp,
1862			    (*nfhpp)->nfh_fh, (*nfhpp)->nfh_len, cred, p, &dp);
1863		nfscl_ownerrelease(owp, error, newone, unlocked);
1864		if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1865		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1866		    error == NFSERR_BADSESSION) {
1867			(void) nfs_catnap(PZERO, error, "nfs_open");
1868		} else if ((error == NFSERR_EXPIRED ||
1869		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1870			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1871			retrycnt++;
1872		}
1873	    } while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1874		error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1875		error == NFSERR_BADSESSION ||
1876		((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1877		 expireret == 0 && clidrev != 0 && retrycnt < 4));
1878	    if (error && retrycnt >= 4)
1879		    error = EIO;
1880	} else {
1881		error = nfsrpc_createv23(dvp, name, namelen, vap, cverf,
1882		    fmode, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1883		    dstuff);
1884	}
1885	return (error);
1886}
1887
1888/*
1889 * The create rpc for v2 and 3.
1890 */
1891static int
1892nfsrpc_createv23(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1893    nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1894    struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1895    int *attrflagp, int *dattrflagp, void *dstuff)
1896{
1897	u_int32_t *tl;
1898	int error = 0;
1899	struct nfsrv_descript nfsd, *nd = &nfsd;
1900
1901	*nfhpp = NULL;
1902	*attrflagp = 0;
1903	*dattrflagp = 0;
1904	if (namelen > NFS_MAXNAMLEN)
1905		return (ENAMETOOLONG);
1906	NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
1907	(void) nfsm_strtom(nd, name, namelen);
1908	if (nd->nd_flag & ND_NFSV3) {
1909		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1910		if (fmode & O_EXCL) {
1911			*tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
1912			NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1913			*tl++ = cverf.lval[0];
1914			*tl = cverf.lval[1];
1915		} else {
1916			*tl = txdr_unsigned(NFSCREATE_UNCHECKED);
1917			nfscl_fillsattr(nd, vap, dvp, 0, 0);
1918		}
1919	} else {
1920		nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZE0, 0);
1921	}
1922	error = nfscl_request(nd, dvp, p, cred, dstuff);
1923	if (error)
1924		return (error);
1925	if (nd->nd_repstat == 0) {
1926		error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1927		if (error)
1928			goto nfsmout;
1929	}
1930	if (nd->nd_flag & ND_NFSV3)
1931		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1932	if (nd->nd_repstat != 0 && error == 0)
1933		error = nd->nd_repstat;
1934nfsmout:
1935	mbuf_freem(nd->nd_mrep);
1936	return (error);
1937}
1938
1939static int
1940nfsrpc_createv4(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1941    nfsquad_t cverf, int fmode, struct nfsclowner *owp, struct nfscldeleg **dpp,
1942    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
1943    struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
1944    int *dattrflagp, void *dstuff, int *unlockedp)
1945{
1946	u_int32_t *tl;
1947	int error = 0, deleg, newone, ret, acesize, limitby;
1948	struct nfsrv_descript nfsd, *nd = &nfsd;
1949	struct nfsclopen *op;
1950	struct nfscldeleg *dp = NULL;
1951	struct nfsnode *np;
1952	struct nfsfh *nfhp;
1953	nfsattrbit_t attrbits;
1954	nfsv4stateid_t stateid;
1955	u_int32_t rflags;
1956	struct nfsmount *nmp;
1957
1958	nmp = VFSTONFS(dvp->v_mount);
1959	np = VTONFS(dvp);
1960	*unlockedp = 0;
1961	*nfhpp = NULL;
1962	*dpp = NULL;
1963	*attrflagp = 0;
1964	*dattrflagp = 0;
1965	if (namelen > NFS_MAXNAMLEN)
1966		return (ENAMETOOLONG);
1967	NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
1968	/*
1969	 * For V4, this is actually an Open op.
1970	 */
1971	NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
1972	*tl++ = txdr_unsigned(owp->nfsow_seqid);
1973	*tl++ = txdr_unsigned(NFSV4OPEN_ACCESSWRITE |
1974	    NFSV4OPEN_ACCESSREAD);
1975	*tl++ = txdr_unsigned(NFSV4OPEN_DENYNONE);
1976	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
1977	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
1978	(void) nfsm_strtom(nd, owp->nfsow_owner, NFSV4CL_LOCKNAMELEN);
1979	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1980	*tl++ = txdr_unsigned(NFSV4OPEN_CREATE);
1981	if (fmode & O_EXCL) {
1982		if (NFSHASNFSV4N(nmp)) {
1983			if (NFSHASSESSPERSIST(nmp)) {
1984				/* Use GUARDED for persistent sessions. */
1985				*tl = txdr_unsigned(NFSCREATE_GUARDED);
1986				nfscl_fillsattr(nd, vap, dvp, 0, 0);
1987			} else {
1988				/* Otherwise, use EXCLUSIVE4_1. */
1989				*tl = txdr_unsigned(NFSCREATE_EXCLUSIVE41);
1990				NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1991				*tl++ = cverf.lval[0];
1992				*tl = cverf.lval[1];
1993				nfscl_fillsattr(nd, vap, dvp, 0, 0);
1994			}
1995		} else {
1996			/* NFSv4.0 */
1997			*tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
1998			NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1999			*tl++ = cverf.lval[0];
2000			*tl = cverf.lval[1];
2001		}
2002	} else {
2003		*tl = txdr_unsigned(NFSCREATE_UNCHECKED);
2004		nfscl_fillsattr(nd, vap, dvp, 0, 0);
2005	}
2006	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2007	*tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
2008	(void) nfsm_strtom(nd, name, namelen);
2009	/* Get the new file's handle and attributes. */
2010	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2011	*tl++ = txdr_unsigned(NFSV4OP_GETFH);
2012	*tl = txdr_unsigned(NFSV4OP_GETATTR);
2013	NFSGETATTR_ATTRBIT(&attrbits);
2014	(void) nfsrv_putattrbit(nd, &attrbits);
2015	/* Get the directory's post-op attributes. */
2016	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2017	*tl = txdr_unsigned(NFSV4OP_PUTFH);
2018	(void) nfsm_fhtom(nd, np->n_fhp->nfh_fh, np->n_fhp->nfh_len, 0);
2019	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2020	*tl = txdr_unsigned(NFSV4OP_GETATTR);
2021	(void) nfsrv_putattrbit(nd, &attrbits);
2022	error = nfscl_request(nd, dvp, p, cred, dstuff);
2023	if (error)
2024		return (error);
2025	NFSCL_INCRSEQID(owp->nfsow_seqid, nd);
2026	if (nd->nd_repstat == 0) {
2027		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
2028		    6 * NFSX_UNSIGNED);
2029		stateid.seqid = *tl++;
2030		stateid.other[0] = *tl++;
2031		stateid.other[1] = *tl++;
2032		stateid.other[2] = *tl;
2033		rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
2034		(void) nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2035		NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2036		deleg = fxdr_unsigned(int, *tl);
2037		if (deleg == NFSV4OPEN_DELEGATEREAD ||
2038		    deleg == NFSV4OPEN_DELEGATEWRITE) {
2039			if (!(owp->nfsow_clp->nfsc_flags &
2040			      NFSCLFLAGS_FIRSTDELEG))
2041				owp->nfsow_clp->nfsc_flags |=
2042				  (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
2043			MALLOC(dp, struct nfscldeleg *,
2044			    sizeof (struct nfscldeleg) + NFSX_V4FHMAX,
2045			    M_NFSCLDELEG, M_WAITOK);
2046			LIST_INIT(&dp->nfsdl_owner);
2047			LIST_INIT(&dp->nfsdl_lock);
2048			dp->nfsdl_clp = owp->nfsow_clp;
2049			newnfs_copyincred(cred, &dp->nfsdl_cred);
2050			nfscl_lockinit(&dp->nfsdl_rwlock);
2051			NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
2052			    NFSX_UNSIGNED);
2053			dp->nfsdl_stateid.seqid = *tl++;
2054			dp->nfsdl_stateid.other[0] = *tl++;
2055			dp->nfsdl_stateid.other[1] = *tl++;
2056			dp->nfsdl_stateid.other[2] = *tl++;
2057			ret = fxdr_unsigned(int, *tl);
2058			if (deleg == NFSV4OPEN_DELEGATEWRITE) {
2059				dp->nfsdl_flags = NFSCLDL_WRITE;
2060				/*
2061				 * Indicates how much the file can grow.
2062				 */
2063				NFSM_DISSECT(tl, u_int32_t *,
2064				    3 * NFSX_UNSIGNED);
2065				limitby = fxdr_unsigned(int, *tl++);
2066				switch (limitby) {
2067				case NFSV4OPEN_LIMITSIZE:
2068					dp->nfsdl_sizelimit = fxdr_hyper(tl);
2069					break;
2070				case NFSV4OPEN_LIMITBLOCKS:
2071					dp->nfsdl_sizelimit =
2072					    fxdr_unsigned(u_int64_t, *tl++);
2073					dp->nfsdl_sizelimit *=
2074					    fxdr_unsigned(u_int64_t, *tl);
2075					break;
2076				default:
2077					error = NFSERR_BADXDR;
2078					goto nfsmout;
2079				};
2080			} else {
2081				dp->nfsdl_flags = NFSCLDL_READ;
2082			}
2083			if (ret)
2084				dp->nfsdl_flags |= NFSCLDL_RECALL;
2085			error = nfsrv_dissectace(nd, &dp->nfsdl_ace, &ret,
2086			    &acesize, p);
2087			if (error)
2088				goto nfsmout;
2089		} else if (deleg != NFSV4OPEN_DELEGATENONE) {
2090			error = NFSERR_BADXDR;
2091			goto nfsmout;
2092		}
2093		error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2094		if (error)
2095			goto nfsmout;
2096		/* Get rid of the PutFH and Getattr status values. */
2097		NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
2098		/* Load the directory attributes. */
2099		error = nfsm_loadattr(nd, dnap);
2100		if (error)
2101			goto nfsmout;
2102		*dattrflagp = 1;
2103		if (dp != NULL && *attrflagp) {
2104			dp->nfsdl_change = nnap->na_filerev;
2105			dp->nfsdl_modtime = nnap->na_mtime;
2106			dp->nfsdl_flags |= NFSCLDL_MODTIMESET;
2107		}
2108		/*
2109		 * We can now complete the Open state.
2110		 */
2111		nfhp = *nfhpp;
2112		if (dp != NULL) {
2113			dp->nfsdl_fhlen = nfhp->nfh_len;
2114			NFSBCOPY(nfhp->nfh_fh, dp->nfsdl_fh, nfhp->nfh_len);
2115		}
2116		/*
2117		 * Get an Open structure that will be
2118		 * attached to the OpenOwner, acquired already.
2119		 */
2120		error = nfscl_open(dvp, nfhp->nfh_fh, nfhp->nfh_len,
2121		    (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), 0,
2122		    cred, p, NULL, &op, &newone, NULL, 0);
2123		if (error)
2124			goto nfsmout;
2125		op->nfso_stateid = stateid;
2126		newnfs_copyincred(cred, &op->nfso_cred);
2127		if ((rflags & NFSV4OPEN_RESULTCONFIRM)) {
2128		    do {
2129			ret = nfsrpc_openconfirm(dvp, nfhp->nfh_fh,
2130			    nfhp->nfh_len, op, cred, p);
2131			if (ret == NFSERR_DELAY)
2132			    (void) nfs_catnap(PZERO, ret, "nfs_create");
2133		    } while (ret == NFSERR_DELAY);
2134		    error = ret;
2135		}
2136
2137		/*
2138		 * If the server is handing out delegations, but we didn't
2139		 * get one because an OpenConfirm was required, try the
2140		 * Open again, to get a delegation. This is a harmless no-op,
2141		 * from a server's point of view.
2142		 */
2143		if ((rflags & NFSV4OPEN_RESULTCONFIRM) &&
2144		    (owp->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG) &&
2145		    !error && dp == NULL) {
2146		    do {
2147			ret = nfsrpc_openrpc(VFSTONFS(vnode_mount(dvp)), dvp,
2148			    np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
2149			    nfhp->nfh_fh, nfhp->nfh_len,
2150			    (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), op,
2151			    name, namelen, &dp, 0, 0x0, cred, p, 0, 1);
2152			if (ret == NFSERR_DELAY)
2153			    (void) nfs_catnap(PZERO, ret, "nfs_crt2");
2154		    } while (ret == NFSERR_DELAY);
2155		    if (ret) {
2156			if (dp != NULL)
2157				FREE((caddr_t)dp, M_NFSCLDELEG);
2158			if (ret == NFSERR_STALECLIENTID ||
2159			    ret == NFSERR_STALEDONTRECOVER ||
2160			    ret == NFSERR_BADSESSION)
2161				error = ret;
2162		    }
2163		}
2164		nfscl_openrelease(op, error, newone);
2165		*unlockedp = 1;
2166	}
2167	if (nd->nd_repstat != 0 && error == 0)
2168		error = nd->nd_repstat;
2169	if (error == NFSERR_STALECLIENTID || error == NFSERR_BADSESSION)
2170		nfscl_initiate_recovery(owp->nfsow_clp);
2171nfsmout:
2172	if (!error)
2173		*dpp = dp;
2174	else if (dp != NULL)
2175		FREE((caddr_t)dp, M_NFSCLDELEG);
2176	mbuf_freem(nd->nd_mrep);
2177	return (error);
2178}
2179
2180/*
2181 * Nfs remove rpc
2182 */
2183APPLESTATIC int
2184nfsrpc_remove(vnode_t dvp, char *name, int namelen, vnode_t vp,
2185    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp,
2186    void *dstuff)
2187{
2188	u_int32_t *tl;
2189	struct nfsrv_descript nfsd, *nd = &nfsd;
2190	struct nfsnode *np;
2191	struct nfsmount *nmp;
2192	nfsv4stateid_t dstateid;
2193	int error, ret = 0, i;
2194
2195	*dattrflagp = 0;
2196	if (namelen > NFS_MAXNAMLEN)
2197		return (ENAMETOOLONG);
2198	nmp = VFSTONFS(vnode_mount(dvp));
2199tryagain:
2200	if (NFSHASNFSV4(nmp) && ret == 0) {
2201		ret = nfscl_removedeleg(vp, p, &dstateid);
2202		if (ret == 1) {
2203			NFSCL_REQSTART(nd, NFSPROC_RETDELEGREMOVE, vp);
2204			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
2205			    NFSX_UNSIGNED);
2206			if (NFSHASNFSV4N(nmp))
2207				*tl++ = 0;
2208			else
2209				*tl++ = dstateid.seqid;
2210			*tl++ = dstateid.other[0];
2211			*tl++ = dstateid.other[1];
2212			*tl++ = dstateid.other[2];
2213			*tl = txdr_unsigned(NFSV4OP_PUTFH);
2214			np = VTONFS(dvp);
2215			(void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2216			    np->n_fhp->nfh_len, 0);
2217			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2218			*tl = txdr_unsigned(NFSV4OP_REMOVE);
2219		}
2220	} else {
2221		ret = 0;
2222	}
2223	if (ret == 0)
2224		NFSCL_REQSTART(nd, NFSPROC_REMOVE, dvp);
2225	(void) nfsm_strtom(nd, name, namelen);
2226	error = nfscl_request(nd, dvp, p, cred, dstuff);
2227	if (error)
2228		return (error);
2229	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2230		/* For NFSv4, parse out any Delereturn replies. */
2231		if (ret > 0 && nd->nd_repstat != 0 &&
2232		    (nd->nd_flag & ND_NOMOREDATA)) {
2233			/*
2234			 * If the Delegreturn failed, try again without
2235			 * it. The server will Recall, as required.
2236			 */
2237			mbuf_freem(nd->nd_mrep);
2238			goto tryagain;
2239		}
2240		for (i = 0; i < (ret * 2); i++) {
2241			if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2242			    ND_NFSV4) {
2243			    NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2244			    if (*(tl + 1))
2245				nd->nd_flag |= ND_NOMOREDATA;
2246			}
2247		}
2248		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2249	}
2250	if (nd->nd_repstat && !error)
2251		error = nd->nd_repstat;
2252nfsmout:
2253	mbuf_freem(nd->nd_mrep);
2254	return (error);
2255}
2256
2257/*
2258 * Do an nfs rename rpc.
2259 */
2260APPLESTATIC int
2261nfsrpc_rename(vnode_t fdvp, vnode_t fvp, char *fnameptr, int fnamelen,
2262    vnode_t tdvp, vnode_t tvp, char *tnameptr, int tnamelen, struct ucred *cred,
2263    NFSPROC_T *p, struct nfsvattr *fnap, struct nfsvattr *tnap,
2264    int *fattrflagp, int *tattrflagp, void *fstuff, void *tstuff)
2265{
2266	u_int32_t *tl;
2267	struct nfsrv_descript nfsd, *nd = &nfsd;
2268	struct nfsmount *nmp;
2269	struct nfsnode *np;
2270	nfsattrbit_t attrbits;
2271	nfsv4stateid_t fdstateid, tdstateid;
2272	int error = 0, ret = 0, gottd = 0, gotfd = 0, i;
2273
2274	*fattrflagp = 0;
2275	*tattrflagp = 0;
2276	nmp = VFSTONFS(vnode_mount(fdvp));
2277	if (fnamelen > NFS_MAXNAMLEN || tnamelen > NFS_MAXNAMLEN)
2278		return (ENAMETOOLONG);
2279tryagain:
2280	if (NFSHASNFSV4(nmp) && ret == 0) {
2281		ret = nfscl_renamedeleg(fvp, &fdstateid, &gotfd, tvp,
2282		    &tdstateid, &gottd, p);
2283		if (gotfd && gottd) {
2284			NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME2, fvp);
2285		} else if (gotfd) {
2286			NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, fvp);
2287		} else if (gottd) {
2288			NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, tvp);
2289		}
2290		if (gotfd) {
2291			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2292			if (NFSHASNFSV4N(nmp))
2293				*tl++ = 0;
2294			else
2295				*tl++ = fdstateid.seqid;
2296			*tl++ = fdstateid.other[0];
2297			*tl++ = fdstateid.other[1];
2298			*tl = fdstateid.other[2];
2299			if (gottd) {
2300				NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2301				*tl = txdr_unsigned(NFSV4OP_PUTFH);
2302				np = VTONFS(tvp);
2303				(void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2304				    np->n_fhp->nfh_len, 0);
2305				NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2306				*tl = txdr_unsigned(NFSV4OP_DELEGRETURN);
2307			}
2308		}
2309		if (gottd) {
2310			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2311			if (NFSHASNFSV4N(nmp))
2312				*tl++ = 0;
2313			else
2314				*tl++ = tdstateid.seqid;
2315			*tl++ = tdstateid.other[0];
2316			*tl++ = tdstateid.other[1];
2317			*tl = tdstateid.other[2];
2318		}
2319		if (ret > 0) {
2320			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2321			*tl = txdr_unsigned(NFSV4OP_PUTFH);
2322			np = VTONFS(fdvp);
2323			(void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2324			    np->n_fhp->nfh_len, 0);
2325			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2326			*tl = txdr_unsigned(NFSV4OP_SAVEFH);
2327		}
2328	} else {
2329		ret = 0;
2330	}
2331	if (ret == 0)
2332		NFSCL_REQSTART(nd, NFSPROC_RENAME, fdvp);
2333	if (nd->nd_flag & ND_NFSV4) {
2334		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2335		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2336		NFSWCCATTR_ATTRBIT(&attrbits);
2337		(void) nfsrv_putattrbit(nd, &attrbits);
2338		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2339		*tl = txdr_unsigned(NFSV4OP_PUTFH);
2340		(void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2341		    VTONFS(tdvp)->n_fhp->nfh_len, 0);
2342		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2343		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2344		(void) nfsrv_putattrbit(nd, &attrbits);
2345		nd->nd_flag |= ND_V4WCCATTR;
2346		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2347		*tl = txdr_unsigned(NFSV4OP_RENAME);
2348	}
2349	(void) nfsm_strtom(nd, fnameptr, fnamelen);
2350	if (!(nd->nd_flag & ND_NFSV4))
2351		(void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2352			VTONFS(tdvp)->n_fhp->nfh_len, 0);
2353	(void) nfsm_strtom(nd, tnameptr, tnamelen);
2354	error = nfscl_request(nd, fdvp, p, cred, fstuff);
2355	if (error)
2356		return (error);
2357	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2358		/* For NFSv4, parse out any Delereturn replies. */
2359		if (ret > 0 && nd->nd_repstat != 0 &&
2360		    (nd->nd_flag & ND_NOMOREDATA)) {
2361			/*
2362			 * If the Delegreturn failed, try again without
2363			 * it. The server will Recall, as required.
2364			 */
2365			mbuf_freem(nd->nd_mrep);
2366			goto tryagain;
2367		}
2368		for (i = 0; i < (ret * 2); i++) {
2369			if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2370			    ND_NFSV4) {
2371			    NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2372			    if (*(tl + 1)) {
2373				if (i == 0 && ret > 1) {
2374				    /*
2375				     * If the Delegreturn failed, try again
2376				     * without it. The server will Recall, as
2377				     * required.
2378				     * If ret > 1, the first iteration of this
2379				     * loop is the second DelegReturn result.
2380				     */
2381				    mbuf_freem(nd->nd_mrep);
2382				    goto tryagain;
2383				} else {
2384				    nd->nd_flag |= ND_NOMOREDATA;
2385				}
2386			    }
2387			}
2388		}
2389		/* Now, the first wcc attribute reply. */
2390		if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2391			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2392			if (*(tl + 1))
2393				nd->nd_flag |= ND_NOMOREDATA;
2394		}
2395		error = nfscl_wcc_data(nd, fdvp, fnap, fattrflagp, NULL,
2396		    fstuff);
2397		/* and the second wcc attribute reply. */
2398		if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4 &&
2399		    !error) {
2400			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2401			if (*(tl + 1))
2402				nd->nd_flag |= ND_NOMOREDATA;
2403		}
2404		if (!error)
2405			error = nfscl_wcc_data(nd, tdvp, tnap, tattrflagp,
2406			    NULL, tstuff);
2407	}
2408	if (nd->nd_repstat && !error)
2409		error = nd->nd_repstat;
2410nfsmout:
2411	mbuf_freem(nd->nd_mrep);
2412	return (error);
2413}
2414
2415/*
2416 * nfs hard link create rpc
2417 */
2418APPLESTATIC int
2419nfsrpc_link(vnode_t dvp, vnode_t vp, char *name, int namelen,
2420    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2421    struct nfsvattr *nap, int *attrflagp, int *dattrflagp, void *dstuff)
2422{
2423	u_int32_t *tl;
2424	struct nfsrv_descript nfsd, *nd = &nfsd;
2425	nfsattrbit_t attrbits;
2426	int error = 0;
2427
2428	*attrflagp = 0;
2429	*dattrflagp = 0;
2430	if (namelen > NFS_MAXNAMLEN)
2431		return (ENAMETOOLONG);
2432	NFSCL_REQSTART(nd, NFSPROC_LINK, vp);
2433	if (nd->nd_flag & ND_NFSV4) {
2434		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2435		*tl = txdr_unsigned(NFSV4OP_PUTFH);
2436	}
2437	(void) nfsm_fhtom(nd, VTONFS(dvp)->n_fhp->nfh_fh,
2438		VTONFS(dvp)->n_fhp->nfh_len, 0);
2439	if (nd->nd_flag & ND_NFSV4) {
2440		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2441		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2442		NFSWCCATTR_ATTRBIT(&attrbits);
2443		(void) nfsrv_putattrbit(nd, &attrbits);
2444		nd->nd_flag |= ND_V4WCCATTR;
2445		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2446		*tl = txdr_unsigned(NFSV4OP_LINK);
2447	}
2448	(void) nfsm_strtom(nd, name, namelen);
2449	error = nfscl_request(nd, vp, p, cred, dstuff);
2450	if (error)
2451		return (error);
2452	if (nd->nd_flag & ND_NFSV3) {
2453		error = nfscl_postop_attr(nd, nap, attrflagp, dstuff);
2454		if (!error)
2455			error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
2456			    NULL, dstuff);
2457	} else if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2458		/*
2459		 * First, parse out the PutFH and Getattr result.
2460		 */
2461		NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2462		if (!(*(tl + 1)))
2463			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2464		if (*(tl + 1))
2465			nd->nd_flag |= ND_NOMOREDATA;
2466		/*
2467		 * Get the pre-op attributes.
2468		 */
2469		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2470	}
2471	if (nd->nd_repstat && !error)
2472		error = nd->nd_repstat;
2473nfsmout:
2474	mbuf_freem(nd->nd_mrep);
2475	return (error);
2476}
2477
2478/*
2479 * nfs symbolic link create rpc
2480 */
2481APPLESTATIC int
2482nfsrpc_symlink(vnode_t dvp, char *name, int namelen, char *target,
2483    struct vattr *vap, struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2484    struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2485    int *dattrflagp, void *dstuff)
2486{
2487	u_int32_t *tl;
2488	struct nfsrv_descript nfsd, *nd = &nfsd;
2489	struct nfsmount *nmp;
2490	int slen, error = 0;
2491
2492	*nfhpp = NULL;
2493	*attrflagp = 0;
2494	*dattrflagp = 0;
2495	nmp = VFSTONFS(vnode_mount(dvp));
2496	slen = strlen(target);
2497	if (slen > NFS_MAXPATHLEN || namelen > NFS_MAXNAMLEN)
2498		return (ENAMETOOLONG);
2499	NFSCL_REQSTART(nd, NFSPROC_SYMLINK, dvp);
2500	if (nd->nd_flag & ND_NFSV4) {
2501		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2502		*tl = txdr_unsigned(NFLNK);
2503		(void) nfsm_strtom(nd, target, slen);
2504	}
2505	(void) nfsm_strtom(nd, name, namelen);
2506	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2507		nfscl_fillsattr(nd, vap, dvp, 0, 0);
2508	if (!(nd->nd_flag & ND_NFSV4))
2509		(void) nfsm_strtom(nd, target, slen);
2510	if (nd->nd_flag & ND_NFSV2)
2511		nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
2512	error = nfscl_request(nd, dvp, p, cred, dstuff);
2513	if (error)
2514		return (error);
2515	if (nd->nd_flag & ND_NFSV4)
2516		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2517	if ((nd->nd_flag & ND_NFSV3) && !error) {
2518		if (!nd->nd_repstat)
2519			error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2520		if (!error)
2521			error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
2522			    NULL, dstuff);
2523	}
2524	if (nd->nd_repstat && !error)
2525		error = nd->nd_repstat;
2526	mbuf_freem(nd->nd_mrep);
2527	/*
2528	 * Kludge: Map EEXIST => 0 assuming that it is a reply to a retry.
2529	 */
2530	if (error == EEXIST)
2531		error = 0;
2532	return (error);
2533}
2534
2535/*
2536 * nfs make dir rpc
2537 */
2538APPLESTATIC int
2539nfsrpc_mkdir(vnode_t dvp, char *name, int namelen, struct vattr *vap,
2540    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2541    struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2542    int *dattrflagp, void *dstuff)
2543{
2544	u_int32_t *tl;
2545	struct nfsrv_descript nfsd, *nd = &nfsd;
2546	nfsattrbit_t attrbits;
2547	int error = 0;
2548
2549	*nfhpp = NULL;
2550	*attrflagp = 0;
2551	*dattrflagp = 0;
2552	if (namelen > NFS_MAXNAMLEN)
2553		return (ENAMETOOLONG);
2554	NFSCL_REQSTART(nd, NFSPROC_MKDIR, dvp);
2555	if (nd->nd_flag & ND_NFSV4) {
2556		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2557		*tl = txdr_unsigned(NFDIR);
2558	}
2559	(void) nfsm_strtom(nd, name, namelen);
2560	nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
2561	if (nd->nd_flag & ND_NFSV4) {
2562		NFSGETATTR_ATTRBIT(&attrbits);
2563		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2564		*tl++ = txdr_unsigned(NFSV4OP_GETFH);
2565		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2566		(void) nfsrv_putattrbit(nd, &attrbits);
2567	}
2568	error = nfscl_request(nd, dvp, p, cred, dstuff);
2569	if (error)
2570		return (error);
2571	if (nd->nd_flag & ND_NFSV4)
2572		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2573	if (!nd->nd_repstat && !error) {
2574		if (nd->nd_flag & ND_NFSV4) {
2575			NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
2576			error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2577		}
2578		if (!error)
2579			error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2580	}
2581	if ((nd->nd_flag & ND_NFSV3) && !error)
2582		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2583	if (nd->nd_repstat && !error)
2584		error = nd->nd_repstat;
2585nfsmout:
2586	mbuf_freem(nd->nd_mrep);
2587	/*
2588	 * Kludge: Map EEXIST => 0 assuming that you have a reply to a retry.
2589	 */
2590	if (error == EEXIST)
2591		error = 0;
2592	return (error);
2593}
2594
2595/*
2596 * nfs remove directory call
2597 */
2598APPLESTATIC int
2599nfsrpc_rmdir(vnode_t dvp, char *name, int namelen, struct ucred *cred,
2600    NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp, void *dstuff)
2601{
2602	struct nfsrv_descript nfsd, *nd = &nfsd;
2603	int error = 0;
2604
2605	*dattrflagp = 0;
2606	if (namelen > NFS_MAXNAMLEN)
2607		return (ENAMETOOLONG);
2608	NFSCL_REQSTART(nd, NFSPROC_RMDIR, dvp);
2609	(void) nfsm_strtom(nd, name, namelen);
2610	error = nfscl_request(nd, dvp, p, cred, dstuff);
2611	if (error)
2612		return (error);
2613	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2614		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2615	if (nd->nd_repstat && !error)
2616		error = nd->nd_repstat;
2617	mbuf_freem(nd->nd_mrep);
2618	/*
2619	 * Kludge: Map ENOENT => 0 assuming that you have a reply to a retry.
2620	 */
2621	if (error == ENOENT)
2622		error = 0;
2623	return (error);
2624}
2625
2626/*
2627 * Readdir rpc.
2628 * Always returns with either uio_resid unchanged, if you are at the
2629 * end of the directory, or uio_resid == 0, with all DIRBLKSIZ chunks
2630 * filled in.
2631 * I felt this would allow caching of directory blocks more easily
2632 * than returning a partially filled block.
2633 * Directory offset cookies:
2634 * Oh my, what to do with them...
2635 * I can think of three ways to deal with them:
2636 * 1 - have the layer above these RPCs maintain a map between logical
2637 *     directory byte offsets and the NFS directory offset cookies
2638 * 2 - pass the opaque directory offset cookies up into userland
2639 *     and let the libc functions deal with them, via the system call
2640 * 3 - return them to userland in the "struct dirent", so future versions
2641 *     of libc can use them and do whatever is necessary to make things work
2642 *     above these rpc calls, in the meantime
2643 * For now, I do #3 by "hiding" the directory offset cookies after the
2644 * d_name field in struct dirent. This is space inside d_reclen that
2645 * will be ignored by anything that doesn't know about them.
2646 * The directory offset cookies are filled in as the last 8 bytes of
2647 * each directory entry, after d_name. Someday, the userland libc
2648 * functions may be able to use these. In the meantime, it satisfies
2649 * OpenBSD's requirements for cookies being returned.
2650 * It expects the directory offset cookie for the read to be in uio_offset
2651 * and returns the one for the next entry after this directory block in
2652 * there, as well.
2653 */
2654APPLESTATIC int
2655nfsrpc_readdir(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
2656    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
2657    int *eofp, void *stuff)
2658{
2659	int len, left;
2660	struct dirent *dp = NULL;
2661	u_int32_t *tl;
2662	nfsquad_t cookie, ncookie;
2663	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
2664	struct nfsnode *dnp = VTONFS(vp);
2665	struct nfsvattr nfsva;
2666	struct nfsrv_descript nfsd, *nd = &nfsd;
2667	int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
2668	int reqsize, tryformoredirs = 1, readsize, eof = 0, gotmnton = 0;
2669	long dotfileid, dotdotfileid = 0;
2670	u_int32_t fakefileno = 0xffffffff, rderr;
2671	char *cp;
2672	nfsattrbit_t attrbits, dattrbits;
2673	u_int32_t *tl2 = NULL;
2674	size_t tresid;
2675
2676	KASSERT(uiop->uio_iovcnt == 1 &&
2677	    (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
2678	    ("nfs readdirrpc bad uio"));
2679
2680	/*
2681	 * There is no point in reading a lot more than uio_resid, however
2682	 * adding one additional DIRBLKSIZ makes sense. Since uio_resid
2683	 * and nm_readdirsize are both exact multiples of DIRBLKSIZ, this
2684	 * will never make readsize > nm_readdirsize.
2685	 */
2686	readsize = nmp->nm_readdirsize;
2687	if (readsize > uio_uio_resid(uiop))
2688		readsize = uio_uio_resid(uiop) + DIRBLKSIZ;
2689
2690	*attrflagp = 0;
2691	if (eofp)
2692		*eofp = 0;
2693	tresid = uio_uio_resid(uiop);
2694	cookie.lval[0] = cookiep->nfsuquad[0];
2695	cookie.lval[1] = cookiep->nfsuquad[1];
2696	nd->nd_mrep = NULL;
2697
2698	/*
2699	 * For NFSv4, first create the "." and ".." entries.
2700	 */
2701	if (NFSHASNFSV4(nmp)) {
2702		reqsize = 6 * NFSX_UNSIGNED;
2703		NFSGETATTR_ATTRBIT(&dattrbits);
2704		NFSZERO_ATTRBIT(&attrbits);
2705		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
2706		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TYPE);
2707		if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
2708		    NFSATTRBIT_MOUNTEDONFILEID)) {
2709			NFSSETBIT_ATTRBIT(&attrbits,
2710			    NFSATTRBIT_MOUNTEDONFILEID);
2711			gotmnton = 1;
2712		} else {
2713			/*
2714			 * Must fake it. Use the fileno, except when the
2715			 * fsid is != to that of the directory. For that
2716			 * case, generate a fake fileno that is not the same.
2717			 */
2718			NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
2719			gotmnton = 0;
2720		}
2721
2722		/*
2723		 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
2724		 */
2725		if (uiop->uio_offset == 0) {
2726			NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
2727			NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2728			*tl++ = txdr_unsigned(NFSV4OP_GETFH);
2729			*tl = txdr_unsigned(NFSV4OP_GETATTR);
2730			(void) nfsrv_putattrbit(nd, &attrbits);
2731			error = nfscl_request(nd, vp, p, cred, stuff);
2732			if (error)
2733			    return (error);
2734			dotfileid = 0;	/* Fake out the compiler. */
2735			if ((nd->nd_flag & ND_NOMOREDATA) == 0) {
2736			    error = nfsm_loadattr(nd, &nfsva);
2737			    if (error != 0)
2738				goto nfsmout;
2739			    dotfileid = nfsva.na_fileid;
2740			}
2741			if (nd->nd_repstat == 0) {
2742			    NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
2743			    len = fxdr_unsigned(int, *(tl + 4));
2744			    if (len > 0 && len <= NFSX_V4FHMAX)
2745				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
2746			    else
2747				error = EPERM;
2748			    if (!error) {
2749				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2750				nfsva.na_mntonfileno = 0xffffffff;
2751				error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
2752				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
2753				    NULL, NULL, NULL, p, cred);
2754				if (error) {
2755				    dotdotfileid = dotfileid;
2756				} else if (gotmnton) {
2757				    if (nfsva.na_mntonfileno != 0xffffffff)
2758					dotdotfileid = nfsva.na_mntonfileno;
2759				    else
2760					dotdotfileid = nfsva.na_fileid;
2761				} else if (nfsva.na_filesid[0] ==
2762				    dnp->n_vattr.na_filesid[0] &&
2763				    nfsva.na_filesid[1] ==
2764				    dnp->n_vattr.na_filesid[1]) {
2765				    dotdotfileid = nfsva.na_fileid;
2766				} else {
2767				    do {
2768					fakefileno--;
2769				    } while (fakefileno ==
2770					nfsva.na_fileid);
2771				    dotdotfileid = fakefileno;
2772				}
2773			    }
2774			} else if (nd->nd_repstat == NFSERR_NOENT) {
2775			    /*
2776			     * Lookupp returns NFSERR_NOENT when we are
2777			     * at the root, so just use the current dir.
2778			     */
2779			    nd->nd_repstat = 0;
2780			    dotdotfileid = dotfileid;
2781			} else {
2782			    error = nd->nd_repstat;
2783			}
2784			mbuf_freem(nd->nd_mrep);
2785			if (error)
2786			    return (error);
2787			nd->nd_mrep = NULL;
2788			dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2789			dp->d_type = DT_DIR;
2790			dp->d_fileno = dotfileid;
2791			dp->d_namlen = 1;
2792			dp->d_name[0] = '.';
2793			dp->d_name[1] = '\0';
2794			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
2795			/*
2796			 * Just make these offset cookie 0.
2797			 */
2798			tl = (u_int32_t *)&dp->d_name[4];
2799			*tl++ = 0;
2800			*tl = 0;
2801			blksiz += dp->d_reclen;
2802			uio_uio_resid_add(uiop, -(dp->d_reclen));
2803			uiop->uio_offset += dp->d_reclen;
2804			uio_iov_base_add(uiop, dp->d_reclen);
2805			uio_iov_len_add(uiop, -(dp->d_reclen));
2806			dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2807			dp->d_type = DT_DIR;
2808			dp->d_fileno = dotdotfileid;
2809			dp->d_namlen = 2;
2810			dp->d_name[0] = '.';
2811			dp->d_name[1] = '.';
2812			dp->d_name[2] = '\0';
2813			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
2814			/*
2815			 * Just make these offset cookie 0.
2816			 */
2817			tl = (u_int32_t *)&dp->d_name[4];
2818			*tl++ = 0;
2819			*tl = 0;
2820			blksiz += dp->d_reclen;
2821			uio_uio_resid_add(uiop, -(dp->d_reclen));
2822			uiop->uio_offset += dp->d_reclen;
2823			uio_iov_base_add(uiop, dp->d_reclen);
2824			uio_iov_len_add(uiop, -(dp->d_reclen));
2825		}
2826		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_RDATTRERROR);
2827	} else {
2828		reqsize = 5 * NFSX_UNSIGNED;
2829	}
2830
2831
2832	/*
2833	 * Loop around doing readdir rpc's of size readsize.
2834	 * The stopping criteria is EOF or buffer full.
2835	 */
2836	while (more_dirs && bigenough) {
2837		*attrflagp = 0;
2838		NFSCL_REQSTART(nd, NFSPROC_READDIR, vp);
2839		if (nd->nd_flag & ND_NFSV2) {
2840			NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2841			*tl++ = cookie.lval[1];
2842			*tl = txdr_unsigned(readsize);
2843		} else {
2844			NFSM_BUILD(tl, u_int32_t *, reqsize);
2845			*tl++ = cookie.lval[0];
2846			*tl++ = cookie.lval[1];
2847			if (cookie.qval == 0) {
2848				*tl++ = 0;
2849				*tl++ = 0;
2850			} else {
2851				NFSLOCKNODE(dnp);
2852				*tl++ = dnp->n_cookieverf.nfsuquad[0];
2853				*tl++ = dnp->n_cookieverf.nfsuquad[1];
2854				NFSUNLOCKNODE(dnp);
2855			}
2856			if (nd->nd_flag & ND_NFSV4) {
2857				*tl++ = txdr_unsigned(readsize);
2858				*tl = txdr_unsigned(readsize);
2859				(void) nfsrv_putattrbit(nd, &attrbits);
2860				NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2861				*tl = txdr_unsigned(NFSV4OP_GETATTR);
2862				(void) nfsrv_putattrbit(nd, &dattrbits);
2863			} else {
2864				*tl = txdr_unsigned(readsize);
2865			}
2866		}
2867		error = nfscl_request(nd, vp, p, cred, stuff);
2868		if (error)
2869			return (error);
2870		if (!(nd->nd_flag & ND_NFSV2)) {
2871			if (nd->nd_flag & ND_NFSV3)
2872				error = nfscl_postop_attr(nd, nap, attrflagp,
2873				    stuff);
2874			if (!nd->nd_repstat && !error) {
2875				NFSM_DISSECT(tl, u_int32_t *, NFSX_HYPER);
2876				NFSLOCKNODE(dnp);
2877				dnp->n_cookieverf.nfsuquad[0] = *tl++;
2878				dnp->n_cookieverf.nfsuquad[1] = *tl;
2879				NFSUNLOCKNODE(dnp);
2880			}
2881		}
2882		if (nd->nd_repstat || error) {
2883			if (!error)
2884				error = nd->nd_repstat;
2885			goto nfsmout;
2886		}
2887		NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2888		more_dirs = fxdr_unsigned(int, *tl);
2889		if (!more_dirs)
2890			tryformoredirs = 0;
2891
2892		/* loop thru the dir entries, doctoring them to 4bsd form */
2893		while (more_dirs && bigenough) {
2894			if (nd->nd_flag & ND_NFSV4) {
2895				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2896				ncookie.lval[0] = *tl++;
2897				ncookie.lval[1] = *tl++;
2898				len = fxdr_unsigned(int, *tl);
2899			} else if (nd->nd_flag & ND_NFSV3) {
2900				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2901				nfsva.na_fileid = fxdr_hyper(tl);
2902				tl += 2;
2903				len = fxdr_unsigned(int, *tl);
2904			} else {
2905				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2906				nfsva.na_fileid =
2907				    fxdr_unsigned(long, *tl++);
2908				len = fxdr_unsigned(int, *tl);
2909			}
2910			if (len <= 0 || len > NFS_MAXNAMLEN) {
2911				error = EBADRPC;
2912				goto nfsmout;
2913			}
2914			tlen = NFSM_RNDUP(len);
2915			if (tlen == len)
2916				tlen += 4;  /* To ensure null termination */
2917			left = DIRBLKSIZ - blksiz;
2918			if ((int)(tlen + DIRHDSIZ + NFSX_HYPER) > left) {
2919				dp->d_reclen += left;
2920				uio_iov_base_add(uiop, left);
2921				uio_iov_len_add(uiop, -(left));
2922				uio_uio_resid_add(uiop, -(left));
2923				uiop->uio_offset += left;
2924				blksiz = 0;
2925			}
2926			if ((int)(tlen + DIRHDSIZ + NFSX_HYPER) > uio_uio_resid(uiop))
2927				bigenough = 0;
2928			if (bigenough) {
2929				dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2930				dp->d_namlen = len;
2931				dp->d_reclen = tlen + DIRHDSIZ + NFSX_HYPER;
2932				dp->d_type = DT_UNKNOWN;
2933				blksiz += dp->d_reclen;
2934				if (blksiz == DIRBLKSIZ)
2935					blksiz = 0;
2936				uio_uio_resid_add(uiop, -(DIRHDSIZ));
2937				uiop->uio_offset += DIRHDSIZ;
2938				uio_iov_base_add(uiop, DIRHDSIZ);
2939				uio_iov_len_add(uiop, -(DIRHDSIZ));
2940				error = nfsm_mbufuio(nd, uiop, len);
2941				if (error)
2942					goto nfsmout;
2943				cp = CAST_DOWN(caddr_t, uio_iov_base(uiop));
2944				tlen -= len;
2945				*cp = '\0';	/* null terminate */
2946				cp += tlen;	/* points to cookie storage */
2947				tl2 = (u_int32_t *)cp;
2948				uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
2949				uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
2950				uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
2951				uiop->uio_offset += (tlen + NFSX_HYPER);
2952			} else {
2953				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
2954				if (error)
2955					goto nfsmout;
2956			}
2957			if (nd->nd_flag & ND_NFSV4) {
2958				rderr = 0;
2959				nfsva.na_mntonfileno = 0xffffffff;
2960				error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
2961				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
2962				    NULL, NULL, &rderr, p, cred);
2963				if (error)
2964					goto nfsmout;
2965				NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2966			} else if (nd->nd_flag & ND_NFSV3) {
2967				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2968				ncookie.lval[0] = *tl++;
2969				ncookie.lval[1] = *tl++;
2970			} else {
2971				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2972				ncookie.lval[0] = 0;
2973				ncookie.lval[1] = *tl++;
2974			}
2975			if (bigenough) {
2976			    if (nd->nd_flag & ND_NFSV4) {
2977				if (rderr) {
2978				    dp->d_fileno = 0;
2979				} else {
2980				    if (gotmnton) {
2981					if (nfsva.na_mntonfileno != 0xffffffff)
2982					    dp->d_fileno = nfsva.na_mntonfileno;
2983					else
2984					    dp->d_fileno = nfsva.na_fileid;
2985				    } else if (nfsva.na_filesid[0] ==
2986					dnp->n_vattr.na_filesid[0] &&
2987					nfsva.na_filesid[1] ==
2988					dnp->n_vattr.na_filesid[1]) {
2989					dp->d_fileno = nfsva.na_fileid;
2990				    } else {
2991					do {
2992					    fakefileno--;
2993					} while (fakefileno ==
2994					    nfsva.na_fileid);
2995					dp->d_fileno = fakefileno;
2996				    }
2997				    dp->d_type = vtonfs_dtype(nfsva.na_type);
2998				}
2999			    } else {
3000				dp->d_fileno = nfsva.na_fileid;
3001			    }
3002			    *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
3003				ncookie.lval[0];
3004			    *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
3005				ncookie.lval[1];
3006			}
3007			more_dirs = fxdr_unsigned(int, *tl);
3008		}
3009		/*
3010		 * If at end of rpc data, get the eof boolean
3011		 */
3012		if (!more_dirs) {
3013			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3014			eof = fxdr_unsigned(int, *tl);
3015			if (tryformoredirs)
3016				more_dirs = !eof;
3017			if (nd->nd_flag & ND_NFSV4) {
3018				error = nfscl_postop_attr(nd, nap, attrflagp,
3019				    stuff);
3020				if (error)
3021					goto nfsmout;
3022			}
3023		}
3024		mbuf_freem(nd->nd_mrep);
3025		nd->nd_mrep = NULL;
3026	}
3027	/*
3028	 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3029	 * by increasing d_reclen for the last record.
3030	 */
3031	if (blksiz > 0) {
3032		left = DIRBLKSIZ - blksiz;
3033		dp->d_reclen += left;
3034		uio_iov_base_add(uiop, left);
3035		uio_iov_len_add(uiop, -(left));
3036		uio_uio_resid_add(uiop, -(left));
3037		uiop->uio_offset += left;
3038	}
3039
3040	/*
3041	 * If returning no data, assume end of file.
3042	 * If not bigenough, return not end of file, since you aren't
3043	 *    returning all the data
3044	 * Otherwise, return the eof flag from the server.
3045	 */
3046	if (eofp) {
3047		if (tresid == ((size_t)(uio_uio_resid(uiop))))
3048			*eofp = 1;
3049		else if (!bigenough)
3050			*eofp = 0;
3051		else
3052			*eofp = eof;
3053	}
3054
3055	/*
3056	 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3057	 */
3058	while (uio_uio_resid(uiop) > 0 && ((size_t)(uio_uio_resid(uiop))) != tresid) {
3059		dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
3060		dp->d_type = DT_UNKNOWN;
3061		dp->d_fileno = 0;
3062		dp->d_namlen = 0;
3063		dp->d_name[0] = '\0';
3064		tl = (u_int32_t *)&dp->d_name[4];
3065		*tl++ = cookie.lval[0];
3066		*tl = cookie.lval[1];
3067		dp->d_reclen = DIRBLKSIZ;
3068		uio_iov_base_add(uiop, DIRBLKSIZ);
3069		uio_iov_len_add(uiop, -(DIRBLKSIZ));
3070		uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3071		uiop->uio_offset += DIRBLKSIZ;
3072	}
3073
3074nfsmout:
3075	if (nd->nd_mrep != NULL)
3076		mbuf_freem(nd->nd_mrep);
3077	return (error);
3078}
3079
3080#ifndef APPLE
3081/*
3082 * NFS V3 readdir plus RPC. Used in place of nfsrpc_readdir().
3083 * (Also used for NFS V4 when mount flag set.)
3084 * (ditto above w.r.t. multiple of DIRBLKSIZ, etc.)
3085 */
3086APPLESTATIC int
3087nfsrpc_readdirplus(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
3088    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
3089    int *eofp, void *stuff)
3090{
3091	int len, left;
3092	struct dirent *dp = NULL;
3093	u_int32_t *tl;
3094	vnode_t newvp = NULLVP;
3095	struct nfsrv_descript nfsd, *nd = &nfsd;
3096	struct nameidata nami, *ndp = &nami;
3097	struct componentname *cnp = &ndp->ni_cnd;
3098	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3099	struct nfsnode *dnp = VTONFS(vp), *np;
3100	struct nfsvattr nfsva;
3101	struct nfsfh *nfhp;
3102	nfsquad_t cookie, ncookie;
3103	int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
3104	int attrflag, tryformoredirs = 1, eof = 0, gotmnton = 0;
3105	int isdotdot = 0, unlocknewvp = 0;
3106	long dotfileid, dotdotfileid = 0, fileno = 0;
3107	char *cp;
3108	nfsattrbit_t attrbits, dattrbits;
3109	size_t tresid;
3110	u_int32_t *tl2 = NULL, fakefileno = 0xffffffff, rderr;
3111	struct timespec dctime;
3112
3113	KASSERT(uiop->uio_iovcnt == 1 &&
3114	    (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
3115	    ("nfs readdirplusrpc bad uio"));
3116	timespecclear(&dctime);
3117	*attrflagp = 0;
3118	if (eofp != NULL)
3119		*eofp = 0;
3120	ndp->ni_dvp = vp;
3121	nd->nd_mrep = NULL;
3122	cookie.lval[0] = cookiep->nfsuquad[0];
3123	cookie.lval[1] = cookiep->nfsuquad[1];
3124	tresid = uio_uio_resid(uiop);
3125
3126	/*
3127	 * For NFSv4, first create the "." and ".." entries.
3128	 */
3129	if (NFSHASNFSV4(nmp)) {
3130		NFSGETATTR_ATTRBIT(&dattrbits);
3131		NFSZERO_ATTRBIT(&attrbits);
3132		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
3133		if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
3134		    NFSATTRBIT_MOUNTEDONFILEID)) {
3135			NFSSETBIT_ATTRBIT(&attrbits,
3136			    NFSATTRBIT_MOUNTEDONFILEID);
3137			gotmnton = 1;
3138		} else {
3139			/*
3140			 * Must fake it. Use the fileno, except when the
3141			 * fsid is != to that of the directory. For that
3142			 * case, generate a fake fileno that is not the same.
3143			 */
3144			NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
3145			gotmnton = 0;
3146		}
3147
3148		/*
3149		 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
3150		 */
3151		if (uiop->uio_offset == 0) {
3152			NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
3153			NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
3154			*tl++ = txdr_unsigned(NFSV4OP_GETFH);
3155			*tl = txdr_unsigned(NFSV4OP_GETATTR);
3156			(void) nfsrv_putattrbit(nd, &attrbits);
3157			error = nfscl_request(nd, vp, p, cred, stuff);
3158			if (error)
3159			    return (error);
3160			dotfileid = 0;	/* Fake out the compiler. */
3161			if ((nd->nd_flag & ND_NOMOREDATA) == 0) {
3162			    error = nfsm_loadattr(nd, &nfsva);
3163			    if (error != 0)
3164				goto nfsmout;
3165			    dctime = nfsva.na_ctime;
3166			    dotfileid = nfsva.na_fileid;
3167			}
3168			if (nd->nd_repstat == 0) {
3169			    NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
3170			    len = fxdr_unsigned(int, *(tl + 4));
3171			    if (len > 0 && len <= NFSX_V4FHMAX)
3172				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3173			    else
3174				error = EPERM;
3175			    if (!error) {
3176				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
3177				nfsva.na_mntonfileno = 0xffffffff;
3178				error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
3179				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3180				    NULL, NULL, NULL, p, cred);
3181				if (error) {
3182				    dotdotfileid = dotfileid;
3183				} else if (gotmnton) {
3184				    if (nfsva.na_mntonfileno != 0xffffffff)
3185					dotdotfileid = nfsva.na_mntonfileno;
3186				    else
3187					dotdotfileid = nfsva.na_fileid;
3188				} else if (nfsva.na_filesid[0] ==
3189				    dnp->n_vattr.na_filesid[0] &&
3190				    nfsva.na_filesid[1] ==
3191				    dnp->n_vattr.na_filesid[1]) {
3192				    dotdotfileid = nfsva.na_fileid;
3193				} else {
3194				    do {
3195					fakefileno--;
3196				    } while (fakefileno ==
3197					nfsva.na_fileid);
3198				    dotdotfileid = fakefileno;
3199				}
3200			    }
3201			} else if (nd->nd_repstat == NFSERR_NOENT) {
3202			    /*
3203			     * Lookupp returns NFSERR_NOENT when we are
3204			     * at the root, so just use the current dir.
3205			     */
3206			    nd->nd_repstat = 0;
3207			    dotdotfileid = dotfileid;
3208			} else {
3209			    error = nd->nd_repstat;
3210			}
3211			mbuf_freem(nd->nd_mrep);
3212			if (error)
3213			    return (error);
3214			nd->nd_mrep = NULL;
3215			dp = (struct dirent *)uio_iov_base(uiop);
3216			dp->d_type = DT_DIR;
3217			dp->d_fileno = dotfileid;
3218			dp->d_namlen = 1;
3219			dp->d_name[0] = '.';
3220			dp->d_name[1] = '\0';
3221			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
3222			/*
3223			 * Just make these offset cookie 0.
3224			 */
3225			tl = (u_int32_t *)&dp->d_name[4];
3226			*tl++ = 0;
3227			*tl = 0;
3228			blksiz += dp->d_reclen;
3229			uio_uio_resid_add(uiop, -(dp->d_reclen));
3230			uiop->uio_offset += dp->d_reclen;
3231			uio_iov_base_add(uiop, dp->d_reclen);
3232			uio_iov_len_add(uiop, -(dp->d_reclen));
3233			dp = (struct dirent *)uio_iov_base(uiop);
3234			dp->d_type = DT_DIR;
3235			dp->d_fileno = dotdotfileid;
3236			dp->d_namlen = 2;
3237			dp->d_name[0] = '.';
3238			dp->d_name[1] = '.';
3239			dp->d_name[2] = '\0';
3240			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
3241			/*
3242			 * Just make these offset cookie 0.
3243			 */
3244			tl = (u_int32_t *)&dp->d_name[4];
3245			*tl++ = 0;
3246			*tl = 0;
3247			blksiz += dp->d_reclen;
3248			uio_uio_resid_add(uiop, -(dp->d_reclen));
3249			uiop->uio_offset += dp->d_reclen;
3250			uio_iov_base_add(uiop, dp->d_reclen);
3251			uio_iov_len_add(uiop, -(dp->d_reclen));
3252		}
3253		NFSREADDIRPLUS_ATTRBIT(&attrbits);
3254		if (gotmnton)
3255			NFSSETBIT_ATTRBIT(&attrbits,
3256			    NFSATTRBIT_MOUNTEDONFILEID);
3257	}
3258
3259	/*
3260	 * Loop around doing readdir rpc's of size nm_readdirsize.
3261	 * The stopping criteria is EOF or buffer full.
3262	 */
3263	while (more_dirs && bigenough) {
3264		*attrflagp = 0;
3265		NFSCL_REQSTART(nd, NFSPROC_READDIRPLUS, vp);
3266 		NFSM_BUILD(tl, u_int32_t *, 6 * NFSX_UNSIGNED);
3267		*tl++ = cookie.lval[0];
3268		*tl++ = cookie.lval[1];
3269		if (cookie.qval == 0) {
3270			*tl++ = 0;
3271			*tl++ = 0;
3272		} else {
3273			NFSLOCKNODE(dnp);
3274			*tl++ = dnp->n_cookieverf.nfsuquad[0];
3275			*tl++ = dnp->n_cookieverf.nfsuquad[1];
3276			NFSUNLOCKNODE(dnp);
3277		}
3278		*tl++ = txdr_unsigned(nmp->nm_readdirsize);
3279		*tl = txdr_unsigned(nmp->nm_readdirsize);
3280		if (nd->nd_flag & ND_NFSV4) {
3281			(void) nfsrv_putattrbit(nd, &attrbits);
3282			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3283			*tl = txdr_unsigned(NFSV4OP_GETATTR);
3284			(void) nfsrv_putattrbit(nd, &dattrbits);
3285		}
3286		error = nfscl_request(nd, vp, p, cred, stuff);
3287		if (error)
3288			return (error);
3289		if (nd->nd_flag & ND_NFSV3)
3290			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3291		if (nd->nd_repstat || error) {
3292			if (!error)
3293				error = nd->nd_repstat;
3294			goto nfsmout;
3295		}
3296		if ((nd->nd_flag & ND_NFSV3) != 0 && *attrflagp != 0)
3297			dctime = nap->na_ctime;
3298		NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3299		NFSLOCKNODE(dnp);
3300		dnp->n_cookieverf.nfsuquad[0] = *tl++;
3301		dnp->n_cookieverf.nfsuquad[1] = *tl++;
3302		NFSUNLOCKNODE(dnp);
3303		more_dirs = fxdr_unsigned(int, *tl);
3304		if (!more_dirs)
3305			tryformoredirs = 0;
3306
3307		/* loop thru the dir entries, doctoring them to 4bsd form */
3308		while (more_dirs && bigenough) {
3309			NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3310			if (nd->nd_flag & ND_NFSV4) {
3311				ncookie.lval[0] = *tl++;
3312				ncookie.lval[1] = *tl++;
3313			} else {
3314				fileno = fxdr_unsigned(long, *++tl);
3315				tl++;
3316			}
3317			len = fxdr_unsigned(int, *tl);
3318			if (len <= 0 || len > NFS_MAXNAMLEN) {
3319				error = EBADRPC;
3320				goto nfsmout;
3321			}
3322			tlen = NFSM_RNDUP(len);
3323			if (tlen == len)
3324				tlen += 4;  /* To ensure null termination */
3325			left = DIRBLKSIZ - blksiz;
3326			if ((tlen + DIRHDSIZ + NFSX_HYPER) > left) {
3327				dp->d_reclen += left;
3328				uio_iov_base_add(uiop, left);
3329				uio_iov_len_add(uiop, -(left));
3330				uio_uio_resid_add(uiop, -(left));
3331				uiop->uio_offset += left;
3332				blksiz = 0;
3333			}
3334			if ((tlen + DIRHDSIZ + NFSX_HYPER) > uio_uio_resid(uiop))
3335				bigenough = 0;
3336			if (bigenough) {
3337				dp = (struct dirent *)uio_iov_base(uiop);
3338				dp->d_namlen = len;
3339				dp->d_reclen = tlen + DIRHDSIZ + NFSX_HYPER;
3340				dp->d_type = DT_UNKNOWN;
3341				blksiz += dp->d_reclen;
3342				if (blksiz == DIRBLKSIZ)
3343					blksiz = 0;
3344				uio_uio_resid_add(uiop, -(DIRHDSIZ));
3345				uiop->uio_offset += DIRHDSIZ;
3346				uio_iov_base_add(uiop, DIRHDSIZ);
3347				uio_iov_len_add(uiop, -(DIRHDSIZ));
3348				cnp->cn_nameptr = uio_iov_base(uiop);
3349				cnp->cn_namelen = len;
3350				NFSCNHASHZERO(cnp);
3351				error = nfsm_mbufuio(nd, uiop, len);
3352				if (error)
3353					goto nfsmout;
3354				cp = uio_iov_base(uiop);
3355				tlen -= len;
3356				*cp = '\0';
3357				cp += tlen;	/* points to cookie storage */
3358				tl2 = (u_int32_t *)cp;
3359				if (len == 2 && cnp->cn_nameptr[0] == '.' &&
3360				    cnp->cn_nameptr[1] == '.')
3361					isdotdot = 1;
3362				else
3363					isdotdot = 0;
3364				uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
3365				uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
3366				uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
3367				uiop->uio_offset += (tlen + NFSX_HYPER);
3368			} else {
3369				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3370				if (error)
3371					goto nfsmout;
3372			}
3373			nfhp = NULL;
3374			if (nd->nd_flag & ND_NFSV3) {
3375				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
3376				ncookie.lval[0] = *tl++;
3377				ncookie.lval[1] = *tl++;
3378				attrflag = fxdr_unsigned(int, *tl);
3379				if (attrflag) {
3380				  error = nfsm_loadattr(nd, &nfsva);
3381				  if (error)
3382					goto nfsmout;
3383				}
3384				NFSM_DISSECT(tl,u_int32_t *,NFSX_UNSIGNED);
3385				if (*tl) {
3386					error = nfsm_getfh(nd, &nfhp);
3387					if (error)
3388					    goto nfsmout;
3389				}
3390				if (!attrflag && nfhp != NULL) {
3391					FREE((caddr_t)nfhp, M_NFSFH);
3392					nfhp = NULL;
3393				}
3394			} else {
3395				rderr = 0;
3396				nfsva.na_mntonfileno = 0xffffffff;
3397				error = nfsv4_loadattr(nd, NULL, &nfsva, &nfhp,
3398				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3399				    NULL, NULL, &rderr, p, cred);
3400				if (error)
3401					goto nfsmout;
3402			}
3403
3404			if (bigenough) {
3405			    if (nd->nd_flag & ND_NFSV4) {
3406				if (rderr) {
3407				    dp->d_fileno = 0;
3408				} else if (gotmnton) {
3409				    if (nfsva.na_mntonfileno != 0xffffffff)
3410					dp->d_fileno = nfsva.na_mntonfileno;
3411				    else
3412					dp->d_fileno = nfsva.na_fileid;
3413				} else if (nfsva.na_filesid[0] ==
3414				    dnp->n_vattr.na_filesid[0] &&
3415				    nfsva.na_filesid[1] ==
3416				    dnp->n_vattr.na_filesid[1]) {
3417				    dp->d_fileno = nfsva.na_fileid;
3418				} else {
3419				    do {
3420					fakefileno--;
3421				    } while (fakefileno ==
3422					nfsva.na_fileid);
3423				    dp->d_fileno = fakefileno;
3424				}
3425			    } else {
3426				dp->d_fileno = fileno;
3427			    }
3428			    *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
3429				ncookie.lval[0];
3430			    *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
3431				ncookie.lval[1];
3432
3433			    if (nfhp != NULL) {
3434				if (NFSRV_CMPFH(nfhp->nfh_fh, nfhp->nfh_len,
3435				    dnp->n_fhp->nfh_fh, dnp->n_fhp->nfh_len)) {
3436				    VREF(vp);
3437				    newvp = vp;
3438				    unlocknewvp = 0;
3439				    FREE((caddr_t)nfhp, M_NFSFH);
3440				    np = dnp;
3441				} else if (isdotdot != 0) {
3442				    /*
3443				     * Skip doing a nfscl_nget() call for "..".
3444				     * There's a race between acquiring the nfs
3445				     * node here and lookups that look for the
3446				     * directory being read (in the parent).
3447				     * It would try to get a lock on ".." here,
3448				     * owning the lock on the directory being
3449				     * read. Lookup will hold the lock on ".."
3450				     * and try to acquire the lock on the
3451				     * directory being read.
3452				     * If the directory is unlocked/relocked,
3453				     * then there is a LOR with the buflock
3454				     * vp is relocked.
3455				     */
3456				    free(nfhp, M_NFSFH);
3457				} else {
3458				    error = nfscl_nget(vnode_mount(vp), vp,
3459				      nfhp, cnp, p, &np, NULL, LK_EXCLUSIVE);
3460				    if (!error) {
3461					newvp = NFSTOV(np);
3462					unlocknewvp = 1;
3463				    }
3464				}
3465				nfhp = NULL;
3466				if (newvp != NULLVP) {
3467				    error = nfscl_loadattrcache(&newvp,
3468					&nfsva, NULL, NULL, 0, 0);
3469				    if (error) {
3470					if (unlocknewvp)
3471					    vput(newvp);
3472					else
3473					    vrele(newvp);
3474					goto nfsmout;
3475				    }
3476				    dp->d_type =
3477					vtonfs_dtype(np->n_vattr.na_type);
3478				    ndp->ni_vp = newvp;
3479				    NFSCNHASH(cnp, HASHINIT);
3480				    if (cnp->cn_namelen <= NCHNAMLEN &&
3481					(newvp->v_type != VDIR ||
3482					 dctime.tv_sec != 0)) {
3483					cache_enter_time(ndp->ni_dvp,
3484					    ndp->ni_vp, cnp,
3485					    &nfsva.na_ctime,
3486					    newvp->v_type != VDIR ? NULL :
3487					    &dctime);
3488				    }
3489				    if (unlocknewvp)
3490					vput(newvp);
3491				    else
3492					vrele(newvp);
3493				    newvp = NULLVP;
3494				}
3495			    }
3496			} else if (nfhp != NULL) {
3497			    FREE((caddr_t)nfhp, M_NFSFH);
3498			}
3499			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3500			more_dirs = fxdr_unsigned(int, *tl);
3501		}
3502		/*
3503		 * If at end of rpc data, get the eof boolean
3504		 */
3505		if (!more_dirs) {
3506			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3507			eof = fxdr_unsigned(int, *tl);
3508			if (tryformoredirs)
3509				more_dirs = !eof;
3510			if (nd->nd_flag & ND_NFSV4) {
3511				error = nfscl_postop_attr(nd, nap, attrflagp,
3512				    stuff);
3513				if (error)
3514					goto nfsmout;
3515			}
3516		}
3517		mbuf_freem(nd->nd_mrep);
3518		nd->nd_mrep = NULL;
3519	}
3520	/*
3521	 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3522	 * by increasing d_reclen for the last record.
3523	 */
3524	if (blksiz > 0) {
3525		left = DIRBLKSIZ - blksiz;
3526		dp->d_reclen += left;
3527		uio_iov_base_add(uiop, left);
3528		uio_iov_len_add(uiop, -(left));
3529		uio_uio_resid_add(uiop, -(left));
3530		uiop->uio_offset += left;
3531	}
3532
3533	/*
3534	 * If returning no data, assume end of file.
3535	 * If not bigenough, return not end of file, since you aren't
3536	 *    returning all the data
3537	 * Otherwise, return the eof flag from the server.
3538	 */
3539	if (eofp != NULL) {
3540		if (tresid == uio_uio_resid(uiop))
3541			*eofp = 1;
3542		else if (!bigenough)
3543			*eofp = 0;
3544		else
3545			*eofp = eof;
3546	}
3547
3548	/*
3549	 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3550	 */
3551	while (uio_uio_resid(uiop) > 0 && uio_uio_resid(uiop) != tresid) {
3552		dp = (struct dirent *)uio_iov_base(uiop);
3553		dp->d_type = DT_UNKNOWN;
3554		dp->d_fileno = 0;
3555		dp->d_namlen = 0;
3556		dp->d_name[0] = '\0';
3557		tl = (u_int32_t *)&dp->d_name[4];
3558		*tl++ = cookie.lval[0];
3559		*tl = cookie.lval[1];
3560		dp->d_reclen = DIRBLKSIZ;
3561		uio_iov_base_add(uiop, DIRBLKSIZ);
3562		uio_iov_len_add(uiop, -(DIRBLKSIZ));
3563		uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3564		uiop->uio_offset += DIRBLKSIZ;
3565	}
3566
3567nfsmout:
3568	if (nd->nd_mrep != NULL)
3569		mbuf_freem(nd->nd_mrep);
3570	return (error);
3571}
3572#endif	/* !APPLE */
3573
3574/*
3575 * Nfs commit rpc
3576 */
3577APPLESTATIC int
3578nfsrpc_commit(vnode_t vp, u_quad_t offset, int cnt, struct ucred *cred,
3579    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
3580{
3581	u_int32_t *tl;
3582	struct nfsrv_descript nfsd, *nd = &nfsd;
3583	nfsattrbit_t attrbits;
3584	int error;
3585	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3586
3587	*attrflagp = 0;
3588	NFSCL_REQSTART(nd, NFSPROC_COMMIT, vp);
3589	NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3590	txdr_hyper(offset, tl);
3591	tl += 2;
3592	*tl = txdr_unsigned(cnt);
3593	if (nd->nd_flag & ND_NFSV4) {
3594		/*
3595		 * And do a Getattr op.
3596		 */
3597		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3598		*tl = txdr_unsigned(NFSV4OP_GETATTR);
3599		NFSGETATTR_ATTRBIT(&attrbits);
3600		(void) nfsrv_putattrbit(nd, &attrbits);
3601	}
3602	error = nfscl_request(nd, vp, p, cred, stuff);
3603	if (error)
3604		return (error);
3605	error = nfscl_wcc_data(nd, vp, nap, attrflagp, NULL, stuff);
3606	if (!error && !nd->nd_repstat) {
3607		NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
3608		NFSLOCKMNT(nmp);
3609		if (NFSBCMP(nmp->nm_verf, tl, NFSX_VERF)) {
3610			NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
3611			nd->nd_repstat = NFSERR_STALEWRITEVERF;
3612		}
3613		NFSUNLOCKMNT(nmp);
3614		if (nd->nd_flag & ND_NFSV4)
3615			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3616	}
3617nfsmout:
3618	if (!error && nd->nd_repstat)
3619		error = nd->nd_repstat;
3620	mbuf_freem(nd->nd_mrep);
3621	return (error);
3622}
3623
3624/*
3625 * NFS byte range lock rpc.
3626 * (Mostly just calls one of the three lower level RPC routines.)
3627 */
3628APPLESTATIC int
3629nfsrpc_advlock(vnode_t vp, off_t size, int op, struct flock *fl,
3630    int reclaim, struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3631{
3632	struct nfscllockowner *lp;
3633	struct nfsclclient *clp;
3634	struct nfsfh *nfhp;
3635	struct nfsrv_descript nfsd, *nd = &nfsd;
3636	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3637	u_int64_t off, len;
3638	off_t start, end;
3639	u_int32_t clidrev = 0;
3640	int error = 0, newone = 0, expireret = 0, retrycnt, donelocally;
3641	int callcnt, dorpc;
3642
3643	/*
3644	 * Convert the flock structure into a start and end and do POSIX
3645	 * bounds checking.
3646	 */
3647	switch (fl->l_whence) {
3648	case SEEK_SET:
3649	case SEEK_CUR:
3650		/*
3651		 * Caller is responsible for adding any necessary offset
3652		 * when SEEK_CUR is used.
3653		 */
3654		start = fl->l_start;
3655		off = fl->l_start;
3656		break;
3657	case SEEK_END:
3658		start = size + fl->l_start;
3659		off = size + fl->l_start;
3660		break;
3661	default:
3662		return (EINVAL);
3663	};
3664	if (start < 0)
3665		return (EINVAL);
3666	if (fl->l_len != 0) {
3667		end = start + fl->l_len - 1;
3668		if (end < start)
3669			return (EINVAL);
3670	}
3671
3672	len = fl->l_len;
3673	if (len == 0)
3674		len = NFS64BITSSET;
3675	retrycnt = 0;
3676	do {
3677	    nd->nd_repstat = 0;
3678	    if (op == F_GETLK) {
3679		error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3680		if (error)
3681			return (error);
3682		error = nfscl_lockt(vp, clp, off, len, fl, p, id, flags);
3683		if (!error) {
3684			clidrev = clp->nfsc_clientidrev;
3685			error = nfsrpc_lockt(nd, vp, clp, off, len, fl, cred,
3686			    p, id, flags);
3687		} else if (error == -1) {
3688			error = 0;
3689		}
3690		nfscl_clientrelease(clp);
3691	    } else if (op == F_UNLCK && fl->l_type == F_UNLCK) {
3692		/*
3693		 * We must loop around for all lockowner cases.
3694		 */
3695		callcnt = 0;
3696		error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3697		if (error)
3698			return (error);
3699		do {
3700		    error = nfscl_relbytelock(vp, off, len, cred, p, callcnt,
3701			clp, id, flags, &lp, &dorpc);
3702		    /*
3703		     * If it returns a NULL lp, we're done.
3704		     */
3705		    if (lp == NULL) {
3706			if (callcnt == 0)
3707			    nfscl_clientrelease(clp);
3708			else
3709			    nfscl_releasealllocks(clp, vp, p, id, flags);
3710			return (error);
3711		    }
3712		    if (nmp->nm_clp != NULL)
3713			clidrev = nmp->nm_clp->nfsc_clientidrev;
3714		    else
3715			clidrev = 0;
3716		    /*
3717		     * If the server doesn't support Posix lock semantics,
3718		     * only allow locks on the entire file, since it won't
3719		     * handle overlapping byte ranges.
3720		     * There might still be a problem when a lock
3721		     * upgrade/downgrade (read<->write) occurs, since the
3722		     * server "might" expect an unlock first?
3723		     */
3724		    if (dorpc && (lp->nfsl_open->nfso_posixlock ||
3725			(off == 0 && len == NFS64BITSSET))) {
3726			/*
3727			 * Since the lock records will go away, we must
3728			 * wait for grace and delay here.
3729			 */
3730			do {
3731			    error = nfsrpc_locku(nd, nmp, lp, off, len,
3732				NFSV4LOCKT_READ, cred, p, 0);
3733			    if ((nd->nd_repstat == NFSERR_GRACE ||
3734				 nd->nd_repstat == NFSERR_DELAY) &&
3735				error == 0)
3736				(void) nfs_catnap(PZERO, (int)nd->nd_repstat,
3737				    "nfs_advlock");
3738			} while ((nd->nd_repstat == NFSERR_GRACE ||
3739			    nd->nd_repstat == NFSERR_DELAY) && error == 0);
3740		    }
3741		    callcnt++;
3742		} while (error == 0 && nd->nd_repstat == 0);
3743		nfscl_releasealllocks(clp, vp, p, id, flags);
3744	    } else if (op == F_SETLK) {
3745		error = nfscl_getbytelock(vp, off, len, fl->l_type, cred, p,
3746		    NULL, 0, id, flags, NULL, NULL, &lp, &newone, &donelocally);
3747		if (error || donelocally) {
3748			return (error);
3749		}
3750		if (nmp->nm_clp != NULL)
3751			clidrev = nmp->nm_clp->nfsc_clientidrev;
3752		else
3753			clidrev = 0;
3754		nfhp = VTONFS(vp)->n_fhp;
3755		if (!lp->nfsl_open->nfso_posixlock &&
3756		    (off != 0 || len != NFS64BITSSET)) {
3757			error = EINVAL;
3758		} else {
3759			error = nfsrpc_lock(nd, nmp, vp, nfhp->nfh_fh,
3760			    nfhp->nfh_len, lp, newone, reclaim, off,
3761			    len, fl->l_type, cred, p, 0);
3762		}
3763		if (!error)
3764			error = nd->nd_repstat;
3765		nfscl_lockrelease(lp, error, newone);
3766	    } else {
3767		error = EINVAL;
3768	    }
3769	    if (!error)
3770	        error = nd->nd_repstat;
3771	    if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
3772		error == NFSERR_STALEDONTRECOVER ||
3773		error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3774		error == NFSERR_BADSESSION) {
3775		(void) nfs_catnap(PZERO, error, "nfs_advlock");
3776	    } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
3777		&& clidrev != 0) {
3778		expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
3779		retrycnt++;
3780	    }
3781	} while (error == NFSERR_GRACE ||
3782	    error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3783	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_STALESTATEID ||
3784	    error == NFSERR_BADSESSION ||
3785	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
3786	     expireret == 0 && clidrev != 0 && retrycnt < 4));
3787	if (error && retrycnt >= 4)
3788		error = EIO;
3789	return (error);
3790}
3791
3792/*
3793 * The lower level routine for the LockT case.
3794 */
3795APPLESTATIC int
3796nfsrpc_lockt(struct nfsrv_descript *nd, vnode_t vp,
3797    struct nfsclclient *clp, u_int64_t off, u_int64_t len, struct flock *fl,
3798    struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3799{
3800	u_int32_t *tl;
3801	int error, type, size;
3802	uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
3803	struct nfsnode *np;
3804	struct nfsmount *nmp;
3805
3806	nmp = VFSTONFS(vp->v_mount);
3807	NFSCL_REQSTART(nd, NFSPROC_LOCKT, vp);
3808	NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
3809	if (fl->l_type == F_RDLCK)
3810		*tl++ = txdr_unsigned(NFSV4LOCKT_READ);
3811	else
3812		*tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
3813	txdr_hyper(off, tl);
3814	tl += 2;
3815	txdr_hyper(len, tl);
3816	tl += 2;
3817	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
3818	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
3819	nfscl_filllockowner(id, own, flags);
3820	np = VTONFS(vp);
3821	NFSBCOPY(np->n_fhp->nfh_fh, &own[NFSV4CL_LOCKNAMELEN],
3822	    np->n_fhp->nfh_len);
3823	(void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + np->n_fhp->nfh_len);
3824	error = nfscl_request(nd, vp, p, cred, NULL);
3825	if (error)
3826		return (error);
3827	if (nd->nd_repstat == 0) {
3828		fl->l_type = F_UNLCK;
3829	} else if (nd->nd_repstat == NFSERR_DENIED) {
3830		nd->nd_repstat = 0;
3831		fl->l_whence = SEEK_SET;
3832		NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
3833		fl->l_start = fxdr_hyper(tl);
3834		tl += 2;
3835		len = fxdr_hyper(tl);
3836		tl += 2;
3837		if (len == NFS64BITSSET)
3838			fl->l_len = 0;
3839		else
3840			fl->l_len = len;
3841		type = fxdr_unsigned(int, *tl++);
3842		if (type == NFSV4LOCKT_WRITE)
3843			fl->l_type = F_WRLCK;
3844		else
3845			fl->l_type = F_RDLCK;
3846		/*
3847		 * XXX For now, I have no idea what to do with the
3848		 * conflicting lock_owner, so I'll just set the pid == 0
3849		 * and skip over the lock_owner.
3850		 */
3851		fl->l_pid = (pid_t)0;
3852		tl += 2;
3853		size = fxdr_unsigned(int, *tl);
3854		if (size < 0 || size > NFSV4_OPAQUELIMIT)
3855			error = EBADRPC;
3856		if (!error)
3857			error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
3858	} else if (nd->nd_repstat == NFSERR_STALECLIENTID ||
3859	    nd->nd_repstat == NFSERR_BADSESSION)
3860		nfscl_initiate_recovery(clp);
3861nfsmout:
3862	mbuf_freem(nd->nd_mrep);
3863	return (error);
3864}
3865
3866/*
3867 * Lower level function that performs the LockU RPC.
3868 */
3869static int
3870nfsrpc_locku(struct nfsrv_descript *nd, struct nfsmount *nmp,
3871    struct nfscllockowner *lp, u_int64_t off, u_int64_t len,
3872    u_int32_t type, struct ucred *cred, NFSPROC_T *p, int syscred)
3873{
3874	u_int32_t *tl;
3875	int error;
3876
3877	nfscl_reqstart(nd, NFSPROC_LOCKU, nmp, lp->nfsl_open->nfso_fh,
3878	    lp->nfsl_open->nfso_fhlen, NULL, NULL);
3879	NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 6 * NFSX_UNSIGNED);
3880	*tl++ = txdr_unsigned(type);
3881	*tl = txdr_unsigned(lp->nfsl_seqid);
3882	if (nfstest_outofseq &&
3883	    (arc4random() % nfstest_outofseq) == 0)
3884		*tl = txdr_unsigned(lp->nfsl_seqid + 1);
3885	tl++;
3886	if (NFSHASNFSV4N(nmp))
3887		*tl++ = 0;
3888	else
3889		*tl++ = lp->nfsl_stateid.seqid;
3890	*tl++ = lp->nfsl_stateid.other[0];
3891	*tl++ = lp->nfsl_stateid.other[1];
3892	*tl++ = lp->nfsl_stateid.other[2];
3893	txdr_hyper(off, tl);
3894	tl += 2;
3895	txdr_hyper(len, tl);
3896	if (syscred)
3897		nd->nd_flag |= ND_USEGSSNAME;
3898	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
3899	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
3900	NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
3901	if (error)
3902		return (error);
3903	if (nd->nd_repstat == 0) {
3904		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
3905		lp->nfsl_stateid.seqid = *tl++;
3906		lp->nfsl_stateid.other[0] = *tl++;
3907		lp->nfsl_stateid.other[1] = *tl++;
3908		lp->nfsl_stateid.other[2] = *tl;
3909	} else if (nd->nd_repstat == NFSERR_STALESTATEID ||
3910	    nd->nd_repstat == NFSERR_BADSESSION)
3911		nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
3912nfsmout:
3913	mbuf_freem(nd->nd_mrep);
3914	return (error);
3915}
3916
3917/*
3918 * The actual Lock RPC.
3919 */
3920APPLESTATIC int
3921nfsrpc_lock(struct nfsrv_descript *nd, struct nfsmount *nmp, vnode_t vp,
3922    u_int8_t *nfhp, int fhlen, struct nfscllockowner *lp, int newone,
3923    int reclaim, u_int64_t off, u_int64_t len, short type, struct ucred *cred,
3924    NFSPROC_T *p, int syscred)
3925{
3926	u_int32_t *tl;
3927	int error, size;
3928	uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
3929
3930	nfscl_reqstart(nd, NFSPROC_LOCK, nmp, nfhp, fhlen, NULL, NULL);
3931	NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
3932	if (type == F_RDLCK)
3933		*tl++ = txdr_unsigned(NFSV4LOCKT_READ);
3934	else
3935		*tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
3936	*tl++ = txdr_unsigned(reclaim);
3937	txdr_hyper(off, tl);
3938	tl += 2;
3939	txdr_hyper(len, tl);
3940	tl += 2;
3941	if (newone) {
3942	    *tl = newnfs_true;
3943	    NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
3944		2 * NFSX_UNSIGNED + NFSX_HYPER);
3945	    *tl++ = txdr_unsigned(lp->nfsl_open->nfso_own->nfsow_seqid);
3946	    if (NFSHASNFSV4N(nmp))
3947		*tl++ = 0;
3948	    else
3949		*tl++ = lp->nfsl_open->nfso_stateid.seqid;
3950	    *tl++ = lp->nfsl_open->nfso_stateid.other[0];
3951	    *tl++ = lp->nfsl_open->nfso_stateid.other[1];
3952	    *tl++ = lp->nfsl_open->nfso_stateid.other[2];
3953	    *tl++ = txdr_unsigned(lp->nfsl_seqid);
3954	    *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
3955	    *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
3956	    NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
3957	    NFSBCOPY(nfhp, &own[NFSV4CL_LOCKNAMELEN], fhlen);
3958	    (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
3959	} else {
3960	    *tl = newnfs_false;
3961	    NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + NFSX_UNSIGNED);
3962	    if (NFSHASNFSV4N(nmp))
3963		*tl++ = 0;
3964	    else
3965		*tl++ = lp->nfsl_stateid.seqid;
3966	    *tl++ = lp->nfsl_stateid.other[0];
3967	    *tl++ = lp->nfsl_stateid.other[1];
3968	    *tl++ = lp->nfsl_stateid.other[2];
3969	    *tl = txdr_unsigned(lp->nfsl_seqid);
3970	    if (nfstest_outofseq &&
3971		(arc4random() % nfstest_outofseq) == 0)
3972		    *tl = txdr_unsigned(lp->nfsl_seqid + 1);
3973	}
3974	if (syscred)
3975		nd->nd_flag |= ND_USEGSSNAME;
3976	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
3977	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
3978	if (error)
3979		return (error);
3980	if (newone)
3981	    NFSCL_INCRSEQID(lp->nfsl_open->nfso_own->nfsow_seqid, nd);
3982	NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
3983	if (nd->nd_repstat == 0) {
3984		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
3985		lp->nfsl_stateid.seqid = *tl++;
3986		lp->nfsl_stateid.other[0] = *tl++;
3987		lp->nfsl_stateid.other[1] = *tl++;
3988		lp->nfsl_stateid.other[2] = *tl;
3989	} else if (nd->nd_repstat == NFSERR_DENIED) {
3990		NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
3991		size = fxdr_unsigned(int, *(tl + 7));
3992		if (size < 0 || size > NFSV4_OPAQUELIMIT)
3993			error = EBADRPC;
3994		if (!error)
3995			error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
3996	} else if (nd->nd_repstat == NFSERR_STALESTATEID ||
3997	    nd->nd_repstat == NFSERR_BADSESSION)
3998		nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
3999nfsmout:
4000	mbuf_freem(nd->nd_mrep);
4001	return (error);
4002}
4003
4004/*
4005 * nfs statfs rpc
4006 * (always called with the vp for the mount point)
4007 */
4008APPLESTATIC int
4009nfsrpc_statfs(vnode_t vp, struct nfsstatfs *sbp, struct nfsfsinfo *fsp,
4010    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
4011    void *stuff)
4012{
4013	u_int32_t *tl = NULL;
4014	struct nfsrv_descript nfsd, *nd = &nfsd;
4015	struct nfsmount *nmp;
4016	nfsattrbit_t attrbits;
4017	int error;
4018
4019	*attrflagp = 0;
4020	nmp = VFSTONFS(vnode_mount(vp));
4021	if (NFSHASNFSV4(nmp)) {
4022		/*
4023		 * For V4, you actually do a getattr.
4024		 */
4025		NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4026		NFSSTATFS_GETATTRBIT(&attrbits);
4027		(void) nfsrv_putattrbit(nd, &attrbits);
4028		nd->nd_flag |= ND_USEGSSNAME;
4029		error = nfscl_request(nd, vp, p, cred, stuff);
4030		if (error)
4031			return (error);
4032		if (nd->nd_repstat == 0) {
4033			error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4034			    NULL, NULL, sbp, fsp, NULL, 0, NULL, NULL, NULL, p,
4035			    cred);
4036			if (!error) {
4037				nmp->nm_fsid[0] = nap->na_filesid[0];
4038				nmp->nm_fsid[1] = nap->na_filesid[1];
4039				NFSSETHASSETFSID(nmp);
4040				*attrflagp = 1;
4041			}
4042		} else {
4043			error = nd->nd_repstat;
4044		}
4045		if (error)
4046			goto nfsmout;
4047	} else {
4048		NFSCL_REQSTART(nd, NFSPROC_FSSTAT, vp);
4049		error = nfscl_request(nd, vp, p, cred, stuff);
4050		if (error)
4051			return (error);
4052		if (nd->nd_flag & ND_NFSV3) {
4053			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4054			if (error)
4055				goto nfsmout;
4056		}
4057		if (nd->nd_repstat) {
4058			error = nd->nd_repstat;
4059			goto nfsmout;
4060		}
4061		NFSM_DISSECT(tl, u_int32_t *,
4062		    NFSX_STATFS(nd->nd_flag & ND_NFSV3));
4063	}
4064	if (NFSHASNFSV3(nmp)) {
4065		sbp->sf_tbytes = fxdr_hyper(tl); tl += 2;
4066		sbp->sf_fbytes = fxdr_hyper(tl); tl += 2;
4067		sbp->sf_abytes = fxdr_hyper(tl); tl += 2;
4068		sbp->sf_tfiles = fxdr_hyper(tl); tl += 2;
4069		sbp->sf_ffiles = fxdr_hyper(tl); tl += 2;
4070		sbp->sf_afiles = fxdr_hyper(tl); tl += 2;
4071		sbp->sf_invarsec = fxdr_unsigned(u_int32_t, *tl);
4072	} else if (NFSHASNFSV4(nmp) == 0) {
4073		sbp->sf_tsize = fxdr_unsigned(u_int32_t, *tl++);
4074		sbp->sf_bsize = fxdr_unsigned(u_int32_t, *tl++);
4075		sbp->sf_blocks = fxdr_unsigned(u_int32_t, *tl++);
4076		sbp->sf_bfree = fxdr_unsigned(u_int32_t, *tl++);
4077		sbp->sf_bavail = fxdr_unsigned(u_int32_t, *tl);
4078	}
4079nfsmout:
4080	mbuf_freem(nd->nd_mrep);
4081	return (error);
4082}
4083
4084/*
4085 * nfs pathconf rpc
4086 */
4087APPLESTATIC int
4088nfsrpc_pathconf(vnode_t vp, struct nfsv3_pathconf *pc,
4089    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
4090    void *stuff)
4091{
4092	struct nfsrv_descript nfsd, *nd = &nfsd;
4093	struct nfsmount *nmp;
4094	u_int32_t *tl;
4095	nfsattrbit_t attrbits;
4096	int error;
4097
4098	*attrflagp = 0;
4099	nmp = VFSTONFS(vnode_mount(vp));
4100	if (NFSHASNFSV4(nmp)) {
4101		/*
4102		 * For V4, you actually do a getattr.
4103		 */
4104		NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4105		NFSPATHCONF_GETATTRBIT(&attrbits);
4106		(void) nfsrv_putattrbit(nd, &attrbits);
4107		nd->nd_flag |= ND_USEGSSNAME;
4108		error = nfscl_request(nd, vp, p, cred, stuff);
4109		if (error)
4110			return (error);
4111		if (nd->nd_repstat == 0) {
4112			error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4113			    pc, NULL, NULL, NULL, NULL, 0, NULL, NULL, NULL, p,
4114			    cred);
4115			if (!error)
4116				*attrflagp = 1;
4117		} else {
4118			error = nd->nd_repstat;
4119		}
4120	} else {
4121		NFSCL_REQSTART(nd, NFSPROC_PATHCONF, vp);
4122		error = nfscl_request(nd, vp, p, cred, stuff);
4123		if (error)
4124			return (error);
4125		error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4126		if (nd->nd_repstat && !error)
4127			error = nd->nd_repstat;
4128		if (!error) {
4129			NFSM_DISSECT(tl, u_int32_t *, NFSX_V3PATHCONF);
4130			pc->pc_linkmax = fxdr_unsigned(u_int32_t, *tl++);
4131			pc->pc_namemax = fxdr_unsigned(u_int32_t, *tl++);
4132			pc->pc_notrunc = fxdr_unsigned(u_int32_t, *tl++);
4133			pc->pc_chownrestricted =
4134			    fxdr_unsigned(u_int32_t, *tl++);
4135			pc->pc_caseinsensitive =
4136			    fxdr_unsigned(u_int32_t, *tl++);
4137			pc->pc_casepreserving = fxdr_unsigned(u_int32_t, *tl);
4138		}
4139	}
4140nfsmout:
4141	mbuf_freem(nd->nd_mrep);
4142	return (error);
4143}
4144
4145/*
4146 * nfs version 3 fsinfo rpc call
4147 */
4148APPLESTATIC int
4149nfsrpc_fsinfo(vnode_t vp, struct nfsfsinfo *fsp, struct ucred *cred,
4150    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
4151{
4152	u_int32_t *tl;
4153	struct nfsrv_descript nfsd, *nd = &nfsd;
4154	int error;
4155
4156	*attrflagp = 0;
4157	NFSCL_REQSTART(nd, NFSPROC_FSINFO, vp);
4158	error = nfscl_request(nd, vp, p, cred, stuff);
4159	if (error)
4160		return (error);
4161	error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4162	if (nd->nd_repstat && !error)
4163		error = nd->nd_repstat;
4164	if (!error) {
4165		NFSM_DISSECT(tl, u_int32_t *, NFSX_V3FSINFO);
4166		fsp->fs_rtmax = fxdr_unsigned(u_int32_t, *tl++);
4167		fsp->fs_rtpref = fxdr_unsigned(u_int32_t, *tl++);
4168		fsp->fs_rtmult = fxdr_unsigned(u_int32_t, *tl++);
4169		fsp->fs_wtmax = fxdr_unsigned(u_int32_t, *tl++);
4170		fsp->fs_wtpref = fxdr_unsigned(u_int32_t, *tl++);
4171		fsp->fs_wtmult = fxdr_unsigned(u_int32_t, *tl++);
4172		fsp->fs_dtpref = fxdr_unsigned(u_int32_t, *tl++);
4173		fsp->fs_maxfilesize = fxdr_hyper(tl);
4174		tl += 2;
4175		fxdr_nfsv3time(tl, &fsp->fs_timedelta);
4176		tl += 2;
4177		fsp->fs_properties = fxdr_unsigned(u_int32_t, *tl);
4178	}
4179nfsmout:
4180	mbuf_freem(nd->nd_mrep);
4181	return (error);
4182}
4183
4184/*
4185 * This function performs the Renew RPC.
4186 */
4187APPLESTATIC int
4188nfsrpc_renew(struct nfsclclient *clp, struct nfsclds *dsp, struct ucred *cred,
4189    NFSPROC_T *p)
4190{
4191	u_int32_t *tl;
4192	struct nfsrv_descript nfsd;
4193	struct nfsrv_descript *nd = &nfsd;
4194	struct nfsmount *nmp;
4195	int error;
4196	struct nfssockreq *nrp;
4197
4198	nmp = clp->nfsc_nmp;
4199	if (nmp == NULL)
4200		return (0);
4201	nfscl_reqstart(nd, NFSPROC_RENEW, nmp, NULL, 0, NULL,
4202	    &dsp->nfsclds_sess);
4203	if (!NFSHASNFSV4N(nmp)) {
4204		/* NFSv4.1 just uses a Sequence Op and not a Renew. */
4205		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4206		*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4207		*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4208	}
4209	nrp = dsp->nfsclds_sockp;
4210	if (nrp == NULL)
4211		/* If NULL, use the MDS socket. */
4212		nrp = &nmp->nm_sockreq;
4213	nd->nd_flag |= ND_USEGSSNAME;
4214	error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4215	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
4216	if (error)
4217		return (error);
4218	error = nd->nd_repstat;
4219	mbuf_freem(nd->nd_mrep);
4220	return (error);
4221}
4222
4223/*
4224 * This function performs the Releaselockowner RPC.
4225 */
4226APPLESTATIC int
4227nfsrpc_rellockown(struct nfsmount *nmp, struct nfscllockowner *lp,
4228    uint8_t *fh, int fhlen, struct ucred *cred, NFSPROC_T *p)
4229{
4230	struct nfsrv_descript nfsd, *nd = &nfsd;
4231	u_int32_t *tl;
4232	int error;
4233	uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
4234
4235	if (NFSHASNFSV4N(nmp)) {
4236		/* For NFSv4.1, do a FreeStateID. */
4237		nfscl_reqstart(nd, NFSPROC_FREESTATEID, nmp, NULL, 0, NULL,
4238		    NULL);
4239		nfsm_stateidtom(nd, &lp->nfsl_stateid, NFSSTATEID_PUTSTATEID);
4240	} else {
4241		nfscl_reqstart(nd, NFSPROC_RELEASELCKOWN, nmp, NULL, 0, NULL,
4242		    NULL);
4243		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4244		*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4245		*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4246		NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
4247		NFSBCOPY(fh, &own[NFSV4CL_LOCKNAMELEN], fhlen);
4248		(void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
4249	}
4250	nd->nd_flag |= ND_USEGSSNAME;
4251	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4252	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4253	if (error)
4254		return (error);
4255	error = nd->nd_repstat;
4256	mbuf_freem(nd->nd_mrep);
4257	return (error);
4258}
4259
4260/*
4261 * This function performs the Compound to get the mount pt FH.
4262 */
4263APPLESTATIC int
4264nfsrpc_getdirpath(struct nfsmount *nmp, u_char *dirpath, struct ucred *cred,
4265    NFSPROC_T *p)
4266{
4267	u_int32_t *tl;
4268	struct nfsrv_descript nfsd;
4269	struct nfsrv_descript *nd = &nfsd;
4270	u_char *cp, *cp2;
4271	int error, cnt, len, setnil;
4272	u_int32_t *opcntp;
4273
4274	nfscl_reqstart(nd, NFSPROC_PUTROOTFH, nmp, NULL, 0, &opcntp, NULL);
4275	cp = dirpath;
4276	cnt = 0;
4277	do {
4278		setnil = 0;
4279		while (*cp == '/')
4280			cp++;
4281		cp2 = cp;
4282		while (*cp2 != '\0' && *cp2 != '/')
4283			cp2++;
4284		if (*cp2 == '/') {
4285			setnil = 1;
4286			*cp2 = '\0';
4287		}
4288		if (cp2 != cp) {
4289			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4290			*tl = txdr_unsigned(NFSV4OP_LOOKUP);
4291			nfsm_strtom(nd, cp, strlen(cp));
4292			cnt++;
4293		}
4294		if (setnil)
4295			*cp2++ = '/';
4296		cp = cp2;
4297	} while (*cp != '\0');
4298	if (NFSHASNFSV4N(nmp))
4299		/* Has a Sequence Op done by nfscl_reqstart(). */
4300		*opcntp = txdr_unsigned(3 + cnt);
4301	else
4302		*opcntp = txdr_unsigned(2 + cnt);
4303	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4304	*tl = txdr_unsigned(NFSV4OP_GETFH);
4305	nd->nd_flag |= ND_USEGSSNAME;
4306	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4307		NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4308	if (error)
4309		return (error);
4310	if (nd->nd_repstat == 0) {
4311		NFSM_DISSECT(tl, u_int32_t *, (3 + 2 * cnt) * NFSX_UNSIGNED);
4312		tl += (2 + 2 * cnt);
4313		if ((len = fxdr_unsigned(int, *tl)) <= 0 ||
4314			len > NFSX_FHMAX) {
4315			nd->nd_repstat = NFSERR_BADXDR;
4316		} else {
4317			nd->nd_repstat = nfsrv_mtostr(nd, nmp->nm_fh, len);
4318			if (nd->nd_repstat == 0)
4319				nmp->nm_fhsize = len;
4320		}
4321	}
4322	error = nd->nd_repstat;
4323nfsmout:
4324	mbuf_freem(nd->nd_mrep);
4325	return (error);
4326}
4327
4328/*
4329 * This function performs the Delegreturn RPC.
4330 */
4331APPLESTATIC int
4332nfsrpc_delegreturn(struct nfscldeleg *dp, struct ucred *cred,
4333    struct nfsmount *nmp, NFSPROC_T *p, int syscred)
4334{
4335	u_int32_t *tl;
4336	struct nfsrv_descript nfsd;
4337	struct nfsrv_descript *nd = &nfsd;
4338	int error;
4339
4340	nfscl_reqstart(nd, NFSPROC_DELEGRETURN, nmp, dp->nfsdl_fh,
4341	    dp->nfsdl_fhlen, NULL, NULL);
4342	NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
4343	if (NFSHASNFSV4N(nmp))
4344		*tl++ = 0;
4345	else
4346		*tl++ = dp->nfsdl_stateid.seqid;
4347	*tl++ = dp->nfsdl_stateid.other[0];
4348	*tl++ = dp->nfsdl_stateid.other[1];
4349	*tl = dp->nfsdl_stateid.other[2];
4350	if (syscred)
4351		nd->nd_flag |= ND_USEGSSNAME;
4352	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4353	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4354	if (error)
4355		return (error);
4356	error = nd->nd_repstat;
4357	mbuf_freem(nd->nd_mrep);
4358	return (error);
4359}
4360
4361/*
4362 * nfs getacl call.
4363 */
4364APPLESTATIC int
4365nfsrpc_getacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4366    struct acl *aclp, void *stuff)
4367{
4368	struct nfsrv_descript nfsd, *nd = &nfsd;
4369	int error;
4370	nfsattrbit_t attrbits;
4371	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4372
4373	if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4374		return (EOPNOTSUPP);
4375	NFSCL_REQSTART(nd, NFSPROC_GETACL, vp);
4376	NFSZERO_ATTRBIT(&attrbits);
4377	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4378	(void) nfsrv_putattrbit(nd, &attrbits);
4379	error = nfscl_request(nd, vp, p, cred, stuff);
4380	if (error)
4381		return (error);
4382	if (!nd->nd_repstat)
4383		error = nfsv4_loadattr(nd, vp, NULL, NULL, NULL, 0, NULL,
4384		    NULL, NULL, NULL, aclp, 0, NULL, NULL, NULL, p, cred);
4385	else
4386		error = nd->nd_repstat;
4387	mbuf_freem(nd->nd_mrep);
4388	return (error);
4389}
4390
4391/*
4392 * nfs setacl call.
4393 */
4394APPLESTATIC int
4395nfsrpc_setacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4396    struct acl *aclp, void *stuff)
4397{
4398	int error;
4399	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4400
4401	if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4402		return (EOPNOTSUPP);
4403	error = nfsrpc_setattr(vp, NULL, aclp, cred, p, NULL, NULL, stuff);
4404	return (error);
4405}
4406
4407/*
4408 * nfs setacl call.
4409 */
4410static int
4411nfsrpc_setaclrpc(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4412    struct acl *aclp, nfsv4stateid_t *stateidp, void *stuff)
4413{
4414	struct nfsrv_descript nfsd, *nd = &nfsd;
4415	int error;
4416	nfsattrbit_t attrbits;
4417	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4418
4419	if (!NFSHASNFSV4(nmp))
4420		return (EOPNOTSUPP);
4421	NFSCL_REQSTART(nd, NFSPROC_SETACL, vp);
4422	nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
4423	NFSZERO_ATTRBIT(&attrbits);
4424	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4425	(void) nfsv4_fillattr(nd, vnode_mount(vp), vp, aclp, NULL, NULL, 0,
4426	    &attrbits, NULL, NULL, 0, 0, 0, 0, (uint64_t)0);
4427	error = nfscl_request(nd, vp, p, cred, stuff);
4428	if (error)
4429		return (error);
4430	/* Don't care about the pre/postop attributes */
4431	mbuf_freem(nd->nd_mrep);
4432	return (nd->nd_repstat);
4433}
4434
4435/*
4436 * Do the NFSv4.1 Exchange ID.
4437 */
4438int
4439nfsrpc_exchangeid(struct nfsmount *nmp, struct nfsclclient *clp,
4440    struct nfssockreq *nrp, uint32_t exchflags, struct nfsclds **dspp,
4441    struct ucred *cred, NFSPROC_T *p)
4442{
4443	uint32_t *tl, v41flags;
4444	struct nfsrv_descript nfsd;
4445	struct nfsrv_descript *nd = &nfsd;
4446	struct nfsclds *dsp;
4447	struct timespec verstime;
4448	int error, len;
4449
4450	*dspp = NULL;
4451	nfscl_reqstart(nd, NFSPROC_EXCHANGEID, nmp, NULL, 0, NULL, NULL);
4452	NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4453	*tl++ = txdr_unsigned(nfsboottime.tv_sec);	/* Client owner */
4454	*tl = txdr_unsigned(clp->nfsc_rev);
4455	(void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
4456
4457	NFSM_BUILD(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4458	*tl++ = txdr_unsigned(exchflags);
4459	*tl++ = txdr_unsigned(NFSV4EXCH_SP4NONE);
4460
4461	/* Set the implementation id4 */
4462	*tl = txdr_unsigned(1);
4463	(void) nfsm_strtom(nd, "freebsd.org", strlen("freebsd.org"));
4464	(void) nfsm_strtom(nd, version, strlen(version));
4465	NFSM_BUILD(tl, uint32_t *, NFSX_V4TIME);
4466	verstime.tv_sec = 1293840000;		/* Jan 1, 2011 */
4467	verstime.tv_nsec = 0;
4468	txdr_nfsv4time(&verstime, tl);
4469	nd->nd_flag |= ND_USEGSSNAME;
4470	error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4471	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4472	NFSCL_DEBUG(1, "exchangeid err=%d reps=%d\n", error,
4473	    (int)nd->nd_repstat);
4474	if (error != 0)
4475		return (error);
4476	if (nd->nd_repstat == 0) {
4477		NFSM_DISSECT(tl, uint32_t *, 6 * NFSX_UNSIGNED + NFSX_HYPER);
4478		len = fxdr_unsigned(int, *(tl + 7));
4479		if (len < 0 || len > NFSV4_OPAQUELIMIT) {
4480			error = NFSERR_BADXDR;
4481			goto nfsmout;
4482		}
4483		dsp = malloc(sizeof(struct nfsclds) + len, M_NFSCLDS,
4484		    M_WAITOK | M_ZERO);
4485		dsp->nfsclds_expire = NFSD_MONOSEC + clp->nfsc_renew;
4486		dsp->nfsclds_servownlen = len;
4487		dsp->nfsclds_sess.nfsess_clientid.lval[0] = *tl++;
4488		dsp->nfsclds_sess.nfsess_clientid.lval[1] = *tl++;
4489		dsp->nfsclds_sess.nfsess_sequenceid =
4490		    fxdr_unsigned(uint32_t, *tl++);
4491		v41flags = fxdr_unsigned(uint32_t, *tl);
4492		if ((v41flags & NFSV4EXCH_USEPNFSMDS) != 0 &&
4493		    NFSHASPNFSOPT(nmp)) {
4494			NFSCL_DEBUG(1, "set PNFS\n");
4495			NFSLOCKMNT(nmp);
4496			nmp->nm_state |= NFSSTA_PNFS;
4497			NFSUNLOCKMNT(nmp);
4498			dsp->nfsclds_flags |= NFSCLDS_MDS;
4499		}
4500		if ((v41flags & NFSV4EXCH_USEPNFSDS) != 0)
4501			dsp->nfsclds_flags |= NFSCLDS_DS;
4502		if (len > 0)
4503			nd->nd_repstat = nfsrv_mtostr(nd,
4504			    dsp->nfsclds_serverown, len);
4505		if (nd->nd_repstat == 0) {
4506			mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
4507			mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession",
4508			    NULL, MTX_DEF);
4509			nfscl_initsessionslots(&dsp->nfsclds_sess);
4510			*dspp = dsp;
4511		} else
4512			free(dsp, M_NFSCLDS);
4513	}
4514	error = nd->nd_repstat;
4515nfsmout:
4516	mbuf_freem(nd->nd_mrep);
4517	return (error);
4518}
4519
4520/*
4521 * Do the NFSv4.1 Create Session.
4522 */
4523int
4524nfsrpc_createsession(struct nfsmount *nmp, struct nfsclsession *sep,
4525    struct nfssockreq *nrp, uint32_t sequenceid, int mds, struct ucred *cred,
4526    NFSPROC_T *p)
4527{
4528	uint32_t crflags, *tl;
4529	struct nfsrv_descript nfsd;
4530	struct nfsrv_descript *nd = &nfsd;
4531	int error, irdcnt;
4532
4533	nfscl_reqstart(nd, NFSPROC_CREATESESSION, nmp, NULL, 0, NULL, NULL);
4534	NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
4535	*tl++ = sep->nfsess_clientid.lval[0];
4536	*tl++ = sep->nfsess_clientid.lval[1];
4537	*tl++ = txdr_unsigned(sequenceid);
4538	crflags = (NFSMNT_RDONLY(nmp->nm_mountp) ? 0 : NFSV4CRSESS_PERSIST);
4539	if (nfscl_enablecallb != 0 && nfs_numnfscbd > 0)
4540		crflags |= NFSV4CRSESS_CONNBACKCHAN;
4541	*tl = txdr_unsigned(crflags);
4542
4543	/* Fill in fore channel attributes. */
4544	NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4545	*tl++ = 0;				/* Header pad size */
4546	*tl++ = txdr_unsigned(100000);		/* Max request size */
4547	*tl++ = txdr_unsigned(100000);		/* Max response size */
4548	*tl++ = txdr_unsigned(4096);		/* Max response size cached */
4549	*tl++ = txdr_unsigned(20);		/* Max operations */
4550	*tl++ = txdr_unsigned(64);		/* Max slots */
4551	*tl = 0;				/* No rdma ird */
4552
4553	/* Fill in back channel attributes. */
4554	NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4555	*tl++ = 0;				/* Header pad size */
4556	*tl++ = txdr_unsigned(10000);		/* Max request size */
4557	*tl++ = txdr_unsigned(10000);		/* Max response size */
4558	*tl++ = txdr_unsigned(4096);		/* Max response size cached */
4559	*tl++ = txdr_unsigned(4);		/* Max operations */
4560	*tl++ = txdr_unsigned(NFSV4_CBSLOTS);	/* Max slots */
4561	*tl = 0;				/* No rdma ird */
4562
4563	NFSM_BUILD(tl, uint32_t *, 8 * NFSX_UNSIGNED);
4564	*tl++ = txdr_unsigned(NFS_CALLBCKPROG);	/* Call back prog # */
4565
4566	/* Allow AUTH_SYS callbacks as uid, gid == 0. */
4567	*tl++ = txdr_unsigned(1);		/* Auth_sys only */
4568	*tl++ = txdr_unsigned(AUTH_SYS);	/* AUTH_SYS type */
4569	*tl++ = txdr_unsigned(nfsboottime.tv_sec); /* time stamp */
4570	*tl++ = 0;				/* Null machine name */
4571	*tl++ = 0;				/* Uid == 0 */
4572	*tl++ = 0;				/* Gid == 0 */
4573	*tl = 0;				/* No additional gids */
4574	nd->nd_flag |= ND_USEGSSNAME;
4575	error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred, NFS_PROG,
4576	    NFS_VER4, NULL, 1, NULL, NULL);
4577	if (error != 0)
4578		return (error);
4579	if (nd->nd_repstat == 0) {
4580		NFSM_DISSECT(tl, uint32_t *, NFSX_V4SESSIONID +
4581		    2 * NFSX_UNSIGNED);
4582		bcopy(tl, sep->nfsess_sessionid, NFSX_V4SESSIONID);
4583		tl += NFSX_V4SESSIONID / NFSX_UNSIGNED;
4584		sep->nfsess_sequenceid = fxdr_unsigned(uint32_t, *tl++);
4585		crflags = fxdr_unsigned(uint32_t, *tl);
4586		if ((crflags & NFSV4CRSESS_PERSIST) != 0 && mds != 0) {
4587			NFSLOCKMNT(nmp);
4588			nmp->nm_state |= NFSSTA_SESSPERSIST;
4589			NFSUNLOCKMNT(nmp);
4590		}
4591
4592		/* Get the fore channel slot count. */
4593		NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4594		tl += 3;		/* Skip the other counts. */
4595		sep->nfsess_maxcache = fxdr_unsigned(int, *tl++);
4596		tl++;
4597		sep->nfsess_foreslots = fxdr_unsigned(uint16_t, *tl++);
4598		NFSCL_DEBUG(4, "fore slots=%d\n", (int)sep->nfsess_foreslots);
4599		irdcnt = fxdr_unsigned(int, *tl);
4600		if (irdcnt > 0)
4601			NFSM_DISSECT(tl, uint32_t *, irdcnt * NFSX_UNSIGNED);
4602
4603		/* and the back channel slot count. */
4604		NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4605		tl += 5;
4606		sep->nfsess_backslots = fxdr_unsigned(uint16_t, *tl);
4607		NFSCL_DEBUG(4, "back slots=%d\n", (int)sep->nfsess_backslots);
4608	}
4609	error = nd->nd_repstat;
4610nfsmout:
4611	mbuf_freem(nd->nd_mrep);
4612	return (error);
4613}
4614
4615/*
4616 * Do the NFSv4.1 Destroy Session.
4617 */
4618int
4619nfsrpc_destroysession(struct nfsmount *nmp, struct nfsclclient *clp,
4620    struct ucred *cred, NFSPROC_T *p)
4621{
4622	uint32_t *tl;
4623	struct nfsrv_descript nfsd;
4624	struct nfsrv_descript *nd = &nfsd;
4625	int error;
4626
4627	nfscl_reqstart(nd, NFSPROC_DESTROYSESSION, nmp, NULL, 0, NULL, NULL);
4628	NFSM_BUILD(tl, uint32_t *, NFSX_V4SESSIONID);
4629	bcopy(NFSMNT_MDSSESSION(nmp)->nfsess_sessionid, tl, NFSX_V4SESSIONID);
4630	nd->nd_flag |= ND_USEGSSNAME;
4631	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4632	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4633	if (error != 0)
4634		return (error);
4635	error = nd->nd_repstat;
4636	mbuf_freem(nd->nd_mrep);
4637	return (error);
4638}
4639
4640/*
4641 * Do the NFSv4.1 Destroy Client.
4642 */
4643int
4644nfsrpc_destroyclient(struct nfsmount *nmp, struct nfsclclient *clp,
4645    struct ucred *cred, NFSPROC_T *p)
4646{
4647	uint32_t *tl;
4648	struct nfsrv_descript nfsd;
4649	struct nfsrv_descript *nd = &nfsd;
4650	int error;
4651
4652	nfscl_reqstart(nd, NFSPROC_DESTROYCLIENT, nmp, NULL, 0, NULL, NULL);
4653	NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4654	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4655	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4656	nd->nd_flag |= ND_USEGSSNAME;
4657	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4658	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4659	if (error != 0)
4660		return (error);
4661	error = nd->nd_repstat;
4662	mbuf_freem(nd->nd_mrep);
4663	return (error);
4664}
4665
4666/*
4667 * Do the NFSv4.1 LayoutGet.
4668 */
4669int
4670nfsrpc_layoutget(struct nfsmount *nmp, uint8_t *fhp, int fhlen, int iomode,
4671    uint64_t offset, uint64_t len, uint64_t minlen, int layoutlen,
4672    nfsv4stateid_t *stateidp, int *retonclosep, struct nfsclflayouthead *flhp,
4673    struct ucred *cred, NFSPROC_T *p, void *stuff)
4674{
4675	uint32_t *tl;
4676	struct nfsrv_descript nfsd, *nd = &nfsd;
4677	struct nfsfh *nfhp;
4678	struct nfsclflayout *flp, *prevflp, *tflp;
4679	int cnt, error, gotiomode, fhcnt, nfhlen, i, j;
4680	uint8_t *cp;
4681	uint64_t retlen;
4682
4683	flp = NULL;
4684	gotiomode = -1;
4685	nfscl_reqstart(nd, NFSPROC_LAYOUTGET, nmp, fhp, fhlen, NULL, NULL);
4686	NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
4687	    NFSX_STATEID);
4688	*tl++ = newnfs_false;		/* Don't signal availability. */
4689	*tl++ = txdr_unsigned(NFSLAYOUT_NFSV4_1_FILES);
4690	*tl++ = txdr_unsigned(iomode);
4691	txdr_hyper(offset, tl);
4692	tl += 2;
4693	txdr_hyper(len, tl);
4694	tl += 2;
4695	txdr_hyper(minlen, tl);
4696	tl += 2;
4697	*tl++ = txdr_unsigned(stateidp->seqid);
4698	NFSCL_DEBUG(4, "layget seq=%d\n", (int)stateidp->seqid);
4699	*tl++ = stateidp->other[0];
4700	*tl++ = stateidp->other[1];
4701	*tl++ = stateidp->other[2];
4702	*tl = txdr_unsigned(layoutlen);
4703	nd->nd_flag |= ND_USEGSSNAME;
4704	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4705	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4706	if (error != 0)
4707		return (error);
4708	if (nd->nd_repstat == 0) {
4709		NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_STATEID);
4710		if (*tl++ != 0)
4711			*retonclosep = 1;
4712		else
4713			*retonclosep = 0;
4714		stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
4715		NFSCL_DEBUG(4, "retoncls=%d stseq=%d\n", *retonclosep,
4716		    (int)stateidp->seqid);
4717		stateidp->other[0] = *tl++;
4718		stateidp->other[1] = *tl++;
4719		stateidp->other[2] = *tl++;
4720		cnt = fxdr_unsigned(int, *tl);
4721		NFSCL_DEBUG(4, "layg cnt=%d\n", cnt);
4722		if (cnt <= 0 || cnt > 10000) {
4723			/* Don't accept more than 10000 layouts in reply. */
4724			error = NFSERR_BADXDR;
4725			goto nfsmout;
4726		}
4727		for (i = 0; i < cnt; i++) {
4728			/* Dissect all the way to the file handle cnt. */
4729			NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_HYPER +
4730			    6 * NFSX_UNSIGNED + NFSX_V4DEVICEID);
4731			fhcnt = fxdr_unsigned(int, *(tl + 11 +
4732			    NFSX_V4DEVICEID / NFSX_UNSIGNED));
4733			NFSCL_DEBUG(4, "fhcnt=%d\n", fhcnt);
4734			if (fhcnt < 0 || fhcnt > 100) {
4735				/* Don't accept more than 100 file handles. */
4736				error = NFSERR_BADXDR;
4737				goto nfsmout;
4738			}
4739			if (fhcnt > 1)
4740				flp = malloc(sizeof(*flp) + (fhcnt - 1) *
4741				    sizeof(struct nfsfh *),
4742				    M_NFSFLAYOUT, M_WAITOK);
4743			else
4744				flp = malloc(sizeof(*flp),
4745				    M_NFSFLAYOUT, M_WAITOK);
4746			flp->nfsfl_flags = 0;
4747			flp->nfsfl_fhcnt = 0;
4748			flp->nfsfl_devp = NULL;
4749			flp->nfsfl_off = fxdr_hyper(tl); tl += 2;
4750			retlen = fxdr_hyper(tl); tl += 2;
4751			if (flp->nfsfl_off + retlen < flp->nfsfl_off)
4752				flp->nfsfl_end = UINT64_MAX - flp->nfsfl_off;
4753			else
4754				flp->nfsfl_end = flp->nfsfl_off + retlen;
4755			flp->nfsfl_iomode = fxdr_unsigned(int, *tl++);
4756			if (gotiomode == -1)
4757				gotiomode = flp->nfsfl_iomode;
4758			NFSCL_DEBUG(4, "layg reqiom=%d retiom=%d\n", iomode,
4759			    (int)flp->nfsfl_iomode);
4760			if (fxdr_unsigned(int, *tl++) !=
4761			    NFSLAYOUT_NFSV4_1_FILES) {
4762				printf("NFSv4.1: got non-files layout\n");
4763				error = NFSERR_BADXDR;
4764				goto nfsmout;
4765			}
4766			NFSBCOPY(++tl, flp->nfsfl_dev, NFSX_V4DEVICEID);
4767			tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4768			flp->nfsfl_util = fxdr_unsigned(uint32_t, *tl++);
4769			NFSCL_DEBUG(4, "flutil=0x%x\n", flp->nfsfl_util);
4770			flp->nfsfl_stripe1 = fxdr_unsigned(uint32_t, *tl++);
4771			flp->nfsfl_patoff = fxdr_hyper(tl); tl += 2;
4772			if (fxdr_unsigned(int, *tl) != fhcnt) {
4773				printf("EEK! bad fhcnt\n");
4774				error = NFSERR_BADXDR;
4775				goto nfsmout;
4776			}
4777			for (j = 0; j < fhcnt; j++) {
4778				NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4779				nfhlen = fxdr_unsigned(int, *tl);
4780				if (nfhlen <= 0 || nfhlen > NFSX_V4FHMAX) {
4781					error = NFSERR_BADXDR;
4782					goto nfsmout;
4783				}
4784				nfhp = malloc(sizeof(*nfhp) + nfhlen - 1,
4785				    M_NFSFH, M_WAITOK);
4786				flp->nfsfl_fh[j] = nfhp;
4787				flp->nfsfl_fhcnt++;
4788				nfhp->nfh_len = nfhlen;
4789				NFSM_DISSECT(cp, uint8_t *, NFSM_RNDUP(nfhlen));
4790				NFSBCOPY(cp, nfhp->nfh_fh, nfhlen);
4791			}
4792			if (flp->nfsfl_iomode == gotiomode) {
4793				/* Keep the list in increasing offset order. */
4794				tflp = LIST_FIRST(flhp);
4795				prevflp = NULL;
4796				while (tflp != NULL &&
4797				    tflp->nfsfl_off < flp->nfsfl_off) {
4798					prevflp = tflp;
4799					tflp = LIST_NEXT(tflp, nfsfl_list);
4800				}
4801				if (prevflp == NULL)
4802					LIST_INSERT_HEAD(flhp, flp, nfsfl_list);
4803				else
4804					LIST_INSERT_AFTER(prevflp, flp,
4805					    nfsfl_list);
4806			} else {
4807				printf("nfscl_layoutget(): got wrong iomode\n");
4808				nfscl_freeflayout(flp);
4809			}
4810			flp = NULL;
4811		}
4812	}
4813	if (nd->nd_repstat != 0 && error == 0)
4814		error = nd->nd_repstat;
4815nfsmout:
4816	if (error != 0 && flp != NULL)
4817		nfscl_freeflayout(flp);
4818	mbuf_freem(nd->nd_mrep);
4819	return (error);
4820}
4821
4822/*
4823 * Do the NFSv4.1 Get Device Info.
4824 */
4825int
4826nfsrpc_getdeviceinfo(struct nfsmount *nmp, uint8_t *deviceid, int layouttype,
4827    uint32_t *notifybitsp, struct nfscldevinfo **ndip, struct ucred *cred,
4828    NFSPROC_T *p)
4829{
4830	uint32_t cnt, *tl;
4831	struct nfsrv_descript nfsd;
4832	struct nfsrv_descript *nd = &nfsd;
4833	struct sockaddr_storage ss;
4834	struct nfsclds *dsp = NULL, **dspp;
4835	struct nfscldevinfo *ndi;
4836	int addrcnt, bitcnt, error, i, isudp, j, pos, safilled, stripecnt;
4837	uint8_t stripeindex;
4838
4839	*ndip = NULL;
4840	ndi = NULL;
4841	nfscl_reqstart(nd, NFSPROC_GETDEVICEINFO, nmp, NULL, 0, NULL, NULL);
4842	NFSM_BUILD(tl, uint32_t *, NFSX_V4DEVICEID + 3 * NFSX_UNSIGNED);
4843	NFSBCOPY(deviceid, tl, NFSX_V4DEVICEID);
4844	tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4845	*tl++ = txdr_unsigned(layouttype);
4846	*tl++ = txdr_unsigned(100000);
4847	if (notifybitsp != NULL && *notifybitsp != 0) {
4848		*tl = txdr_unsigned(1);		/* One word of bits. */
4849		NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
4850		*tl = txdr_unsigned(*notifybitsp);
4851	} else
4852		*tl = txdr_unsigned(0);
4853	nd->nd_flag |= ND_USEGSSNAME;
4854	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4855	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4856	if (error != 0)
4857		return (error);
4858	if (nd->nd_repstat == 0) {
4859		NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4860		if (layouttype != fxdr_unsigned(int, *tl++))
4861			printf("EEK! devinfo layout type not same!\n");
4862		stripecnt = fxdr_unsigned(int, *++tl);
4863		NFSCL_DEBUG(4, "stripecnt=%d\n", stripecnt);
4864		if (stripecnt < 1 || stripecnt > 4096) {
4865			printf("NFS devinfo stripecnt %d: out of range\n",
4866			    stripecnt);
4867			error = NFSERR_BADXDR;
4868			goto nfsmout;
4869		}
4870		NFSM_DISSECT(tl, uint32_t *, (stripecnt + 1) * NFSX_UNSIGNED);
4871		addrcnt = fxdr_unsigned(int, *(tl + stripecnt));
4872		NFSCL_DEBUG(4, "addrcnt=%d\n", addrcnt);
4873		if (addrcnt < 1 || addrcnt > 128) {
4874			printf("NFS devinfo addrcnt %d: out of range\n",
4875			    addrcnt);
4876			error = NFSERR_BADXDR;
4877			goto nfsmout;
4878		}
4879
4880		/*
4881		 * Now we know how many stripe indices and addresses, so
4882		 * we can allocate the structure the correct size.
4883		 */
4884		i = (stripecnt * sizeof(uint8_t)) / sizeof(struct nfsclds *)
4885		    + 1;
4886		NFSCL_DEBUG(4, "stripeindices=%d\n", i);
4887		ndi = malloc(sizeof(*ndi) + (addrcnt + i) *
4888		    sizeof(struct nfsclds *), M_NFSDEVINFO, M_WAITOK | M_ZERO);
4889		NFSBCOPY(deviceid, ndi->nfsdi_deviceid, NFSX_V4DEVICEID);
4890		ndi->nfsdi_refcnt = 0;
4891		ndi->nfsdi_stripecnt = stripecnt;
4892		ndi->nfsdi_addrcnt = addrcnt;
4893		/* Fill in the stripe indices. */
4894		for (i = 0; i < stripecnt; i++) {
4895			stripeindex = fxdr_unsigned(uint8_t, *tl++);
4896			NFSCL_DEBUG(4, "stripeind=%d\n", stripeindex);
4897			if (stripeindex >= addrcnt) {
4898				printf("NFS devinfo stripeindex %d: too big\n",
4899				    (int)stripeindex);
4900				error = NFSERR_BADXDR;
4901				goto nfsmout;
4902			}
4903			nfsfldi_setstripeindex(ndi, i, stripeindex);
4904		}
4905
4906		/* Now, dissect the server address(es). */
4907		safilled = 0;
4908		for (i = 0; i < addrcnt; i++) {
4909			NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4910			cnt = fxdr_unsigned(uint32_t, *tl);
4911			if (cnt == 0) {
4912				printf("NFS devinfo 0 len addrlist\n");
4913				error = NFSERR_BADXDR;
4914				goto nfsmout;
4915			}
4916			dspp = nfsfldi_addr(ndi, i);
4917			pos = arc4random() % cnt;	/* Choose one. */
4918			safilled = 0;
4919			for (j = 0; j < cnt; j++) {
4920				error = nfsv4_getipaddr(nd, &ss, &isudp);
4921				if (error != 0 && error != EPERM) {
4922					error = NFSERR_BADXDR;
4923					goto nfsmout;
4924				}
4925				if (error == 0 && isudp == 0) {
4926					/*
4927					 * The algorithm is:
4928					 * - use "pos" entry if it is of the
4929					 *   same af_family or none of them
4930					 *   is of the same af_family
4931					 * else
4932					 * - use the first one of the same
4933					 *   af_family.
4934					 */
4935					if ((safilled == 0 && ss.ss_family ==
4936					     nmp->nm_nam->sa_family) ||
4937					    (j == pos &&
4938					     (safilled == 0 || ss.ss_family ==
4939					      nmp->nm_nam->sa_family)) ||
4940					    (safilled == 1 && ss.ss_family ==
4941					     nmp->nm_nam->sa_family)) {
4942						error = nfsrpc_fillsa(nmp, &ss,
4943						    &dsp, p);
4944						if (error == 0) {
4945							*dspp = dsp;
4946							if (ss.ss_family ==
4947							 nmp->nm_nam->sa_family)
4948								safilled = 2;
4949							else
4950								safilled = 1;
4951						}
4952					}
4953				}
4954			}
4955			if (safilled == 0)
4956				break;
4957		}
4958
4959		/* And the notify bits. */
4960		NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4961		if (safilled != 0) {
4962			bitcnt = fxdr_unsigned(int, *tl);
4963			if (bitcnt > 0) {
4964				NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4965				if (notifybitsp != NULL)
4966					*notifybitsp =
4967					    fxdr_unsigned(uint32_t, *tl);
4968			}
4969			*ndip = ndi;
4970		} else
4971			error = EPERM;
4972	}
4973	if (nd->nd_repstat != 0)
4974		error = nd->nd_repstat;
4975nfsmout:
4976	if (error != 0 && ndi != NULL)
4977		nfscl_freedevinfo(ndi);
4978	mbuf_freem(nd->nd_mrep);
4979	return (error);
4980}
4981
4982/*
4983 * Do the NFSv4.1 LayoutCommit.
4984 */
4985int
4986nfsrpc_layoutcommit(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
4987    uint64_t off, uint64_t len, uint64_t lastbyte, nfsv4stateid_t *stateidp,
4988    int layouttype, int layoutupdatecnt, uint8_t *layp, struct ucred *cred,
4989    NFSPROC_T *p, void *stuff)
4990{
4991	uint32_t *tl;
4992	struct nfsrv_descript nfsd, *nd = &nfsd;
4993	int error, outcnt, i;
4994	uint8_t *cp;
4995
4996	nfscl_reqstart(nd, NFSPROC_LAYOUTCOMMIT, nmp, fh, fhlen, NULL, NULL);
4997	NFSM_BUILD(tl, uint32_t *, 5 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
4998	    NFSX_STATEID);
4999	txdr_hyper(off, tl);
5000	tl += 2;
5001	txdr_hyper(len, tl);
5002	tl += 2;
5003	if (reclaim != 0)
5004		*tl++ = newnfs_true;
5005	else
5006		*tl++ = newnfs_false;
5007	*tl++ = txdr_unsigned(stateidp->seqid);
5008	*tl++ = stateidp->other[0];
5009	*tl++ = stateidp->other[1];
5010	*tl++ = stateidp->other[2];
5011	*tl++ = newnfs_true;
5012	if (lastbyte < off)
5013		lastbyte = off;
5014	else if (lastbyte >= (off + len))
5015		lastbyte = off + len - 1;
5016	txdr_hyper(lastbyte, tl);
5017	tl += 2;
5018	*tl++ = newnfs_false;
5019	*tl++ = txdr_unsigned(layouttype);
5020	*tl = txdr_unsigned(layoutupdatecnt);
5021	if (layoutupdatecnt > 0) {
5022		KASSERT(layouttype != NFSLAYOUT_NFSV4_1_FILES,
5023		    ("Must be nil for Files Layout"));
5024		outcnt = NFSM_RNDUP(layoutupdatecnt);
5025		NFSM_BUILD(cp, uint8_t *, outcnt);
5026		NFSBCOPY(layp, cp, layoutupdatecnt);
5027		cp += layoutupdatecnt;
5028		for (i = 0; i < (outcnt - layoutupdatecnt); i++)
5029			*cp++ = 0x0;
5030	}
5031	nd->nd_flag |= ND_USEGSSNAME;
5032	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5033	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5034	if (error != 0)
5035		return (error);
5036	error = nd->nd_repstat;
5037	mbuf_freem(nd->nd_mrep);
5038	return (error);
5039}
5040
5041/*
5042 * Do the NFSv4.1 LayoutReturn.
5043 */
5044int
5045nfsrpc_layoutreturn(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
5046    int layouttype, uint32_t iomode, int layoutreturn, uint64_t offset,
5047    uint64_t len, nfsv4stateid_t *stateidp, int layoutcnt, uint32_t *layp,
5048    struct ucred *cred, NFSPROC_T *p, void *stuff)
5049{
5050	uint32_t *tl;
5051	struct nfsrv_descript nfsd, *nd = &nfsd;
5052	int error, outcnt, i;
5053	uint8_t *cp;
5054
5055	nfscl_reqstart(nd, NFSPROC_LAYOUTRETURN, nmp, fh, fhlen, NULL, NULL);
5056	NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
5057	if (reclaim != 0)
5058		*tl++ = newnfs_true;
5059	else
5060		*tl++ = newnfs_false;
5061	*tl++ = txdr_unsigned(layouttype);
5062	*tl++ = txdr_unsigned(iomode);
5063	*tl = txdr_unsigned(layoutreturn);
5064	if (layoutreturn == NFSLAYOUTRETURN_FILE) {
5065		NFSM_BUILD(tl, uint32_t *, 2 * NFSX_HYPER + NFSX_STATEID +
5066		    NFSX_UNSIGNED);
5067		txdr_hyper(offset, tl);
5068		tl += 2;
5069		txdr_hyper(len, tl);
5070		tl += 2;
5071		NFSCL_DEBUG(4, "layoutret stseq=%d\n", (int)stateidp->seqid);
5072		*tl++ = txdr_unsigned(stateidp->seqid);
5073		*tl++ = stateidp->other[0];
5074		*tl++ = stateidp->other[1];
5075		*tl++ = stateidp->other[2];
5076		*tl = txdr_unsigned(layoutcnt);
5077		if (layoutcnt > 0) {
5078			outcnt = NFSM_RNDUP(layoutcnt);
5079			NFSM_BUILD(cp, uint8_t *, outcnt);
5080			NFSBCOPY(layp, cp, layoutcnt);
5081			cp += layoutcnt;
5082			for (i = 0; i < (outcnt - layoutcnt); i++)
5083				*cp++ = 0x0;
5084		}
5085	}
5086	nd->nd_flag |= ND_USEGSSNAME;
5087	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5088	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5089	if (error != 0)
5090		return (error);
5091	if (nd->nd_repstat == 0) {
5092		NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5093		if (*tl != 0) {
5094			NFSM_DISSECT(tl, uint32_t *, NFSX_STATEID);
5095			stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
5096			stateidp->other[0] = *tl++;
5097			stateidp->other[1] = *tl++;
5098			stateidp->other[2] = *tl;
5099		}
5100	} else
5101		error = nd->nd_repstat;
5102nfsmout:
5103	mbuf_freem(nd->nd_mrep);
5104	return (error);
5105}
5106
5107/*
5108 * Acquire a layout and devinfo, if possible. The caller must have acquired
5109 * a reference count on the nfsclclient structure before calling this.
5110 * Return the layout in lypp with a reference count on it, if successful.
5111 */
5112static int
5113nfsrpc_getlayout(struct nfsmount *nmp, vnode_t vp, struct nfsfh *nfhp,
5114    int iomode, uint32_t *notifybitsp, nfsv4stateid_t *stateidp, uint64_t off,
5115    struct nfscllayout **lypp, struct ucred *cred, NFSPROC_T *p)
5116{
5117	struct nfscllayout *lyp;
5118	struct nfsclflayout *flp, *tflp;
5119	struct nfscldevinfo *dip;
5120	struct nfsclflayouthead flh;
5121	int error = 0, islocked, layoutlen, recalled, retonclose;
5122	nfsv4stateid_t stateid;
5123
5124	*lypp = NULL;
5125	/*
5126	 * If lyp is returned non-NULL, there will be a refcnt (shared lock)
5127	 * on it, iff flp != NULL or a lock (exclusive lock) on it iff
5128	 * flp == NULL.
5129	 */
5130	lyp = nfscl_getlayout(nmp->nm_clp, nfhp->nfh_fh, nfhp->nfh_len,
5131	    off, &flp, &recalled);
5132	islocked = 0;
5133	if (lyp == NULL || flp == NULL) {
5134		if (recalled != 0)
5135			return (EIO);
5136		LIST_INIT(&flh);
5137		layoutlen = NFSMNT_MDSSESSION(nmp)->nfsess_maxcache -
5138		    (NFSX_STATEID + 3 * NFSX_UNSIGNED);
5139		if (lyp == NULL) {
5140			stateid.seqid = 0;
5141			stateid.other[0] = stateidp->other[0];
5142			stateid.other[1] = stateidp->other[1];
5143			stateid.other[2] = stateidp->other[2];
5144			error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5145			    nfhp->nfh_len, iomode, (uint64_t)0, INT64_MAX,
5146			    (uint64_t)0, layoutlen, &stateid, &retonclose,
5147			    &flh, cred, p, NULL);
5148		} else {
5149			islocked = 1;
5150			stateid.seqid = lyp->nfsly_stateid.seqid;
5151			stateid.other[0] = lyp->nfsly_stateid.other[0];
5152			stateid.other[1] = lyp->nfsly_stateid.other[1];
5153			stateid.other[2] = lyp->nfsly_stateid.other[2];
5154			error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5155			    nfhp->nfh_len, iomode, off, INT64_MAX,
5156			    (uint64_t)0, layoutlen, &stateid, &retonclose,
5157			    &flh, cred, p, NULL);
5158		}
5159		if (error == 0)
5160			LIST_FOREACH(tflp, &flh, nfsfl_list) {
5161				error = nfscl_adddevinfo(nmp, NULL, tflp);
5162				if (error != 0) {
5163					error = nfsrpc_getdeviceinfo(nmp,
5164					    tflp->nfsfl_dev,
5165					    NFSLAYOUT_NFSV4_1_FILES,
5166					    notifybitsp, &dip, cred, p);
5167					if (error != 0)
5168						break;
5169					error = nfscl_adddevinfo(nmp, dip,
5170					    tflp);
5171					if (error != 0)
5172						printf(
5173						    "getlayout: cannot add\n");
5174				}
5175			}
5176		if (error == 0) {
5177			/*
5178			 * nfscl_layout() always returns with the nfsly_lock
5179			 * set to a refcnt (shared lock).
5180			 */
5181			error = nfscl_layout(nmp, vp, nfhp->nfh_fh,
5182			    nfhp->nfh_len, &stateid, retonclose, &flh, &lyp,
5183			    cred, p);
5184			if (error == 0)
5185				*lypp = lyp;
5186		} else if (islocked != 0)
5187			nfsv4_unlock(&lyp->nfsly_lock, 0);
5188	} else
5189		*lypp = lyp;
5190	return (error);
5191}
5192
5193/*
5194 * Do a TCP connection plus exchange id and create session.
5195 * If successful, a "struct nfsclds" is linked into the list for the
5196 * mount point and a pointer to it is returned.
5197 */
5198static int
5199nfsrpc_fillsa(struct nfsmount *nmp, struct sockaddr_storage *ssp,
5200    struct nfsclds **dspp, NFSPROC_T *p)
5201{
5202	struct sockaddr_in *msad, *sad, *ssd;
5203	struct sockaddr_in6 *msad6, *sad6, *ssd6;
5204	struct nfsclclient *clp;
5205	struct nfssockreq *nrp;
5206	struct nfsclds *dsp, *tdsp;
5207	int error;
5208	enum nfsclds_state retv;
5209	uint32_t sequenceid;
5210
5211	KASSERT(nmp->nm_sockreq.nr_cred != NULL,
5212	    ("nfsrpc_fillsa: NULL nr_cred"));
5213	NFSLOCKCLSTATE();
5214	clp = nmp->nm_clp;
5215	NFSUNLOCKCLSTATE();
5216	if (clp == NULL)
5217		return (EPERM);
5218	if (ssp->ss_family == AF_INET) {
5219		ssd = (struct sockaddr_in *)ssp;
5220		NFSLOCKMNT(nmp);
5221
5222		/*
5223		 * Check to see if we already have a session for this
5224		 * address that is usable for a DS.
5225		 * Note that the MDS's address is in a different place
5226		 * than the sessions already acquired for DS's.
5227		 */
5228		msad = (struct sockaddr_in *)nmp->nm_sockreq.nr_nam;
5229		tdsp = TAILQ_FIRST(&nmp->nm_sess);
5230		while (tdsp != NULL) {
5231			if (msad != NULL && msad->sin_family == AF_INET &&
5232			    ssd->sin_addr.s_addr == msad->sin_addr.s_addr &&
5233			    ssd->sin_port == msad->sin_port &&
5234			    (tdsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5235				*dspp = tdsp;
5236				NFSUNLOCKMNT(nmp);
5237				NFSCL_DEBUG(4, "fnd same addr\n");
5238				return (0);
5239			}
5240			tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5241			if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5242				msad = (struct sockaddr_in *)
5243				    tdsp->nfsclds_sockp->nr_nam;
5244			else
5245				msad = NULL;
5246		}
5247		NFSUNLOCKMNT(nmp);
5248
5249		/* No IP address match, so look for new/trunked one. */
5250		sad = malloc(sizeof(*sad), M_SONAME, M_WAITOK | M_ZERO);
5251		sad->sin_len = sizeof(*sad);
5252		sad->sin_family = AF_INET;
5253		sad->sin_port = ssd->sin_port;
5254		sad->sin_addr.s_addr = ssd->sin_addr.s_addr;
5255		nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5256		nrp->nr_nam = (struct sockaddr *)sad;
5257	} else if (ssp->ss_family == AF_INET6) {
5258		ssd6 = (struct sockaddr_in6 *)ssp;
5259		NFSLOCKMNT(nmp);
5260
5261		/*
5262		 * Check to see if we already have a session for this
5263		 * address that is usable for a DS.
5264		 * Note that the MDS's address is in a different place
5265		 * than the sessions already acquired for DS's.
5266		 */
5267		msad6 = (struct sockaddr_in6 *)nmp->nm_sockreq.nr_nam;
5268		tdsp = TAILQ_FIRST(&nmp->nm_sess);
5269		while (tdsp != NULL) {
5270			if (msad6 != NULL && msad6->sin6_family == AF_INET6 &&
5271			    IN6_ARE_ADDR_EQUAL(&ssd6->sin6_addr,
5272			    &msad6->sin6_addr) &&
5273			    ssd6->sin6_port == msad6->sin6_port &&
5274			    (tdsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5275				*dspp = tdsp;
5276				NFSUNLOCKMNT(nmp);
5277				return (0);
5278			}
5279			tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5280			if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5281				msad6 = (struct sockaddr_in6 *)
5282				    tdsp->nfsclds_sockp->nr_nam;
5283			else
5284				msad6 = NULL;
5285		}
5286		NFSUNLOCKMNT(nmp);
5287
5288		/* No IP address match, so look for new/trunked one. */
5289		sad6 = malloc(sizeof(*sad6), M_SONAME, M_WAITOK | M_ZERO);
5290		sad6->sin6_len = sizeof(*sad6);
5291		sad6->sin6_family = AF_INET6;
5292		sad6->sin6_port = ssd6->sin6_port;
5293		NFSBCOPY(&ssd6->sin6_addr, &sad6->sin6_addr,
5294		    sizeof(struct in6_addr));
5295		nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5296		nrp->nr_nam = (struct sockaddr *)sad6;
5297	} else
5298		return (EPERM);
5299
5300	nrp->nr_sotype = SOCK_STREAM;
5301	mtx_init(&nrp->nr_mtx, "nfssock", NULL, MTX_DEF);
5302	nrp->nr_prog = NFS_PROG;
5303	nrp->nr_vers = NFS_VER4;
5304
5305	/*
5306	 * Use the credentials that were used for the mount, which are
5307	 * in nmp->nm_sockreq.nr_cred for newnfs_connect() etc.
5308	 * Ref. counting the credentials with crhold() is probably not
5309	 * necessary, since nm_sockreq.nr_cred won't be crfree()'d until
5310	 * unmount, but I did it anyhow.
5311	 */
5312	nrp->nr_cred = crhold(nmp->nm_sockreq.nr_cred);
5313	error = newnfs_connect(nmp, nrp, NULL, p, 0);
5314	NFSCL_DEBUG(3, "DS connect=%d\n", error);
5315
5316	/* Now, do the exchangeid and create session. */
5317	if (error == 0)
5318		error = nfsrpc_exchangeid(nmp, clp, nrp, NFSV4EXCH_USEPNFSDS,
5319		    &dsp, nrp->nr_cred, p);
5320	NFSCL_DEBUG(3, "DS exchangeid=%d\n", error);
5321	if (error == 0) {
5322		dsp->nfsclds_sockp = nrp;
5323		NFSLOCKMNT(nmp);
5324		retv = nfscl_getsameserver(nmp, dsp, &tdsp);
5325		NFSCL_DEBUG(3, "getsame ret=%d\n", retv);
5326		if (retv == NFSDSP_USETHISSESSION) {
5327			NFSUNLOCKMNT(nmp);
5328			/*
5329			 * If there is already a session for this server,
5330			 * use it.
5331			 */
5332			(void)newnfs_disconnect(nrp);
5333			nfscl_freenfsclds(dsp);
5334			*dspp = tdsp;
5335			return (0);
5336		}
5337		if (retv == NFSDSP_SEQTHISSESSION)
5338			sequenceid = tdsp->nfsclds_sess.nfsess_sequenceid;
5339		else
5340			sequenceid = dsp->nfsclds_sess.nfsess_sequenceid;
5341		NFSUNLOCKMNT(nmp);
5342		error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
5343		    nrp, sequenceid, 0, nrp->nr_cred, p);
5344		NFSCL_DEBUG(3, "DS createsess=%d\n", error);
5345	} else {
5346		NFSFREECRED(nrp->nr_cred);
5347		NFSFREEMUTEX(&nrp->nr_mtx);
5348		free(nrp->nr_nam, M_SONAME);
5349		free(nrp, M_NFSSOCKREQ);
5350	}
5351	if (error == 0) {
5352		NFSCL_DEBUG(3, "add DS session\n");
5353		/*
5354		 * Put it at the end of the list. That way the list
5355		 * is ordered by when the entry was added. This matters
5356		 * since the one done first is the one that should be
5357		 * used for sequencid'ing any subsequent create sessions.
5358		 */
5359		NFSLOCKMNT(nmp);
5360		TAILQ_INSERT_TAIL(&nmp->nm_sess, dsp, nfsclds_list);
5361		NFSUNLOCKMNT(nmp);
5362		*dspp = dsp;
5363	} else if (dsp != NULL)
5364		nfscl_freenfsclds(dsp);
5365	return (error);
5366}
5367
5368/*
5369 * Do the NFSv4.1 Reclaim Complete.
5370 */
5371int
5372nfsrpc_reclaimcomplete(struct nfsmount *nmp, struct ucred *cred, NFSPROC_T *p)
5373{
5374	uint32_t *tl;
5375	struct nfsrv_descript nfsd;
5376	struct nfsrv_descript *nd = &nfsd;
5377	int error;
5378
5379	nfscl_reqstart(nd, NFSPROC_RECLAIMCOMPL, nmp, NULL, 0, NULL, NULL);
5380	NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
5381	*tl = newnfs_false;
5382	nd->nd_flag |= ND_USEGSSNAME;
5383	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5384	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5385	if (error != 0)
5386		return (error);
5387	error = nd->nd_repstat;
5388	mbuf_freem(nd->nd_mrep);
5389	return (error);
5390}
5391
5392/*
5393 * Initialize the slot tables for a session.
5394 */
5395static void
5396nfscl_initsessionslots(struct nfsclsession *sep)
5397{
5398	int i;
5399
5400	for (i = 0; i < NFSV4_CBSLOTS; i++) {
5401		if (sep->nfsess_cbslots[i].nfssl_reply != NULL)
5402			m_freem(sep->nfsess_cbslots[i].nfssl_reply);
5403		NFSBZERO(&sep->nfsess_cbslots[i], sizeof(struct nfsslot));
5404	}
5405	for (i = 0; i < 64; i++)
5406		sep->nfsess_slotseq[i] = 0;
5407	sep->nfsess_slots = 0;
5408}
5409
5410/*
5411 * Called to try and do an I/O operation via an NFSv4.1 Data Server (DS).
5412 */
5413int
5414nfscl_doiods(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5415    uint32_t rwaccess, struct ucred *cred, NFSPROC_T *p)
5416{
5417	struct nfsnode *np = VTONFS(vp);
5418	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5419	struct nfscllayout *layp;
5420	struct nfscldevinfo *dip;
5421	struct nfsclflayout *rflp;
5422	nfsv4stateid_t stateid;
5423	struct ucred *newcred;
5424	uint64_t lastbyte, len, off, oresid, xfer;
5425	int eof, error, iolaymode, recalled;
5426	void *lckp;
5427
5428	if (!NFSHASPNFS(nmp) || nfscl_enablecallb == 0 || nfs_numnfscbd == 0 ||
5429	    (np->n_flag & NNOLAYOUT) != 0)
5430		return (EIO);
5431	/* Now, get a reference cnt on the clientid for this mount. */
5432	if (nfscl_getref(nmp) == 0)
5433		return (EIO);
5434
5435	/* Find an appropriate stateid. */
5436	newcred = NFSNEWCRED(cred);
5437	error = nfscl_getstateid(vp, np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
5438	    rwaccess, 1, newcred, p, &stateid, &lckp);
5439	if (error != 0) {
5440		NFSFREECRED(newcred);
5441		nfscl_relref(nmp);
5442		return (error);
5443	}
5444	/* Search for a layout for this file. */
5445	off = uiop->uio_offset;
5446	layp = nfscl_getlayout(nmp->nm_clp, np->n_fhp->nfh_fh,
5447	    np->n_fhp->nfh_len, off, &rflp, &recalled);
5448	if (layp == NULL || rflp == NULL) {
5449		if (recalled != 0) {
5450			NFSFREECRED(newcred);
5451			nfscl_relref(nmp);
5452			return (EIO);
5453		}
5454		if (layp != NULL) {
5455			nfscl_rellayout(layp, (rflp == NULL) ? 1 : 0);
5456			layp = NULL;
5457		}
5458		/* Try and get a Layout, if it is supported. */
5459		if (rwaccess == NFSV4OPEN_ACCESSWRITE ||
5460		    (np->n_flag & NWRITEOPENED) != 0)
5461			iolaymode = NFSLAYOUTIOMODE_RW;
5462		else
5463			iolaymode = NFSLAYOUTIOMODE_READ;
5464		error = nfsrpc_getlayout(nmp, vp, np->n_fhp, iolaymode,
5465		    NULL, &stateid, off, &layp, newcred, p);
5466		if (error != 0) {
5467			NFSLOCKNODE(np);
5468			np->n_flag |= NNOLAYOUT;
5469			NFSUNLOCKNODE(np);
5470			if (lckp != NULL)
5471				nfscl_lockderef(lckp);
5472			NFSFREECRED(newcred);
5473			if (layp != NULL)
5474				nfscl_rellayout(layp, 0);
5475			nfscl_relref(nmp);
5476			return (error);
5477		}
5478	}
5479
5480	/*
5481	 * Loop around finding a layout that works for the first part of
5482	 * this I/O operation, and then call the function that actually
5483	 * does the RPC.
5484	 */
5485	eof = 0;
5486	len = (uint64_t)uiop->uio_resid;
5487	while (len > 0 && error == 0 && eof == 0) {
5488		off = uiop->uio_offset;
5489		error = nfscl_findlayoutforio(layp, off, rwaccess, &rflp);
5490		if (error == 0) {
5491			oresid = xfer = (uint64_t)uiop->uio_resid;
5492			if (xfer > (rflp->nfsfl_end - rflp->nfsfl_off))
5493				xfer = rflp->nfsfl_end - rflp->nfsfl_off;
5494			dip = nfscl_getdevinfo(nmp->nm_clp, rflp->nfsfl_dev,
5495			    rflp->nfsfl_devp);
5496			if (dip != NULL) {
5497				error = nfscl_doflayoutio(vp, uiop, iomode,
5498				    must_commit, &eof, &stateid, rwaccess, dip,
5499				    layp, rflp, off, xfer, newcred, p);
5500				nfscl_reldevinfo(dip);
5501				lastbyte = off + xfer - 1;
5502				if (error == 0) {
5503					NFSLOCKCLSTATE();
5504					if (lastbyte > layp->nfsly_lastbyte)
5505						layp->nfsly_lastbyte = lastbyte;
5506					NFSUNLOCKCLSTATE();
5507				}
5508			} else
5509				error = EIO;
5510			if (error == 0)
5511				len -= (oresid - (uint64_t)uiop->uio_resid);
5512		}
5513	}
5514	if (lckp != NULL)
5515		nfscl_lockderef(lckp);
5516	NFSFREECRED(newcred);
5517	nfscl_rellayout(layp, 0);
5518	nfscl_relref(nmp);
5519	return (error);
5520}
5521
5522/*
5523 * Find a file layout that will handle the first bytes of the requested
5524 * range and return the information from it needed to to the I/O operation.
5525 */
5526int
5527nfscl_findlayoutforio(struct nfscllayout *lyp, uint64_t off, uint32_t rwaccess,
5528    struct nfsclflayout **retflpp)
5529{
5530	struct nfsclflayout *flp, *nflp, *rflp;
5531	uint32_t rw;
5532
5533	rflp = NULL;
5534	rw = rwaccess;
5535	/* For reading, do the Read list first and then the Write list. */
5536	do {
5537		if (rw == NFSV4OPEN_ACCESSREAD)
5538			flp = LIST_FIRST(&lyp->nfsly_flayread);
5539		else
5540			flp = LIST_FIRST(&lyp->nfsly_flayrw);
5541		while (flp != NULL) {
5542			nflp = LIST_NEXT(flp, nfsfl_list);
5543			if (flp->nfsfl_off > off)
5544				break;
5545			if (flp->nfsfl_end > off &&
5546			    (rflp == NULL || rflp->nfsfl_end < flp->nfsfl_end))
5547				rflp = flp;
5548			flp = nflp;
5549		}
5550		if (rw == NFSV4OPEN_ACCESSREAD)
5551			rw = NFSV4OPEN_ACCESSWRITE;
5552		else
5553			rw = 0;
5554	} while (rw != 0);
5555	if (rflp != NULL) {
5556		/* This one covers the most bytes starting at off. */
5557		*retflpp = rflp;
5558		return (0);
5559	}
5560	return (EIO);
5561}
5562
5563/*
5564 * Do I/O using an NFSv4.1 file layout.
5565 */
5566static int
5567nfscl_doflayoutio(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5568    int *eofp, nfsv4stateid_t *stateidp, int rwflag, struct nfscldevinfo *dp,
5569    struct nfscllayout *lyp, struct nfsclflayout *flp, uint64_t off,
5570    uint64_t len, struct ucred *cred, NFSPROC_T *p)
5571{
5572	uint64_t io_off, rel_off, stripe_unit_size, transfer, xfer;
5573	int commit_thru_mds, error = 0, stripe_index, stripe_pos;
5574	struct nfsnode *np;
5575	struct nfsfh *fhp;
5576	struct nfsclds **dspp;
5577
5578	np = VTONFS(vp);
5579	rel_off = off - flp->nfsfl_patoff;
5580	stripe_unit_size = (flp->nfsfl_util >> 6) & 0x3ffffff;
5581	stripe_pos = (rel_off / stripe_unit_size + flp->nfsfl_stripe1) %
5582	    dp->nfsdi_stripecnt;
5583	transfer = stripe_unit_size - (rel_off % stripe_unit_size);
5584
5585	/* Loop around, doing I/O for each stripe unit. */
5586	while (len > 0 && error == 0) {
5587		stripe_index = nfsfldi_stripeindex(dp, stripe_pos);
5588		dspp = nfsfldi_addr(dp, stripe_index);
5589		if (len > transfer)
5590			xfer = transfer;
5591		else
5592			xfer = len;
5593		if ((flp->nfsfl_util & NFSFLAYUTIL_DENSE) != 0) {
5594			/* Dense layout. */
5595			if (stripe_pos >= flp->nfsfl_fhcnt)
5596				return (EIO);
5597			fhp = flp->nfsfl_fh[stripe_pos];
5598			io_off = (rel_off / (stripe_unit_size *
5599			    dp->nfsdi_stripecnt)) * stripe_unit_size +
5600			    rel_off % stripe_unit_size;
5601		} else {
5602			/* Sparse layout. */
5603			if (flp->nfsfl_fhcnt > 1) {
5604				if (stripe_index >= flp->nfsfl_fhcnt)
5605					return (EIO);
5606				fhp = flp->nfsfl_fh[stripe_index];
5607			} else if (flp->nfsfl_fhcnt == 1)
5608				fhp = flp->nfsfl_fh[0];
5609			else
5610				fhp = np->n_fhp;
5611			io_off = off;
5612		}
5613		if ((flp->nfsfl_util & NFSFLAYUTIL_COMMIT_THRU_MDS) != 0)
5614			commit_thru_mds = 1;
5615		else
5616			commit_thru_mds = 0;
5617		if (rwflag == FREAD)
5618			error = nfsrpc_readds(vp, uiop, stateidp, eofp, *dspp,
5619			    io_off, xfer, fhp, cred, p);
5620		else {
5621			error = nfsrpc_writeds(vp, uiop, iomode, must_commit,
5622			    stateidp, *dspp, io_off, xfer, fhp, commit_thru_mds,
5623			    cred, p);
5624			if (error == 0) {
5625				NFSLOCKCLSTATE();
5626				lyp->nfsly_flags |= NFSLY_WRITTEN;
5627				NFSUNLOCKCLSTATE();
5628			}
5629		}
5630		if (error == 0) {
5631			transfer = stripe_unit_size;
5632			stripe_pos = (stripe_pos + 1) % dp->nfsdi_stripecnt;
5633			len -= xfer;
5634			off += xfer;
5635		}
5636	}
5637	return (error);
5638}
5639
5640/*
5641 * The actual read RPC done to a DS.
5642 */
5643static int
5644nfsrpc_readds(vnode_t vp, struct uio *uiop, nfsv4stateid_t *stateidp, int *eofp,
5645    struct nfsclds *dsp, uint64_t io_off, int len, struct nfsfh *fhp,
5646    struct ucred *cred, NFSPROC_T *p)
5647{
5648	uint32_t *tl;
5649	int error, retlen;
5650	struct nfsrv_descript nfsd;
5651	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5652	struct nfsrv_descript *nd = &nfsd;
5653	struct nfssockreq *nrp;
5654
5655	nd->nd_mrep = NULL;
5656	nfscl_reqstart(nd, NFSPROC_READDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5657	    NULL, &dsp->nfsclds_sess);
5658	nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
5659	NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED * 3);
5660	txdr_hyper(io_off, tl);
5661	*(tl + 2) = txdr_unsigned(len);
5662	nrp = dsp->nfsclds_sockp;
5663	if (nrp == NULL)
5664		/* If NULL, use the MDS socket. */
5665		nrp = &nmp->nm_sockreq;
5666	error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5667	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5668	if (error != 0)
5669		return (error);
5670	if (nd->nd_repstat != 0) {
5671		error = nd->nd_repstat;
5672		goto nfsmout;
5673	}
5674	NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5675	*eofp = fxdr_unsigned(int, *tl);
5676	NFSM_STRSIZ(retlen, len);
5677	error = nfsm_mbufuio(nd, uiop, retlen);
5678nfsmout:
5679	if (nd->nd_mrep != NULL)
5680		mbuf_freem(nd->nd_mrep);
5681	return (error);
5682}
5683
5684/*
5685 * The actual write RPC done to a DS.
5686 */
5687static int
5688nfsrpc_writeds(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5689    nfsv4stateid_t *stateidp, struct nfsclds *dsp, uint64_t io_off, int len,
5690    struct nfsfh *fhp, int commit_thru_mds, struct ucred *cred, NFSPROC_T *p)
5691{
5692	uint32_t *tl;
5693	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5694	int error, rlen, commit, committed = NFSWRITE_FILESYNC;
5695	int32_t backup;
5696	struct nfsrv_descript nfsd;
5697	struct nfsrv_descript *nd = &nfsd;
5698	struct nfssockreq *nrp;
5699
5700	KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
5701	nd->nd_mrep = NULL;
5702	nfscl_reqstart(nd, NFSPROC_WRITEDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5703	    NULL, &dsp->nfsclds_sess);
5704	nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
5705	NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + 2 * NFSX_UNSIGNED);
5706	txdr_hyper(io_off, tl);
5707	tl += 2;
5708	*tl++ = txdr_unsigned(*iomode);
5709	*tl = txdr_unsigned(len);
5710	nfsm_uiombuf(nd, uiop, len);
5711	nrp = dsp->nfsclds_sockp;
5712	if (nrp == NULL)
5713		/* If NULL, use the MDS socket. */
5714		nrp = &nmp->nm_sockreq;
5715	error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5716	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5717	if (error != 0)
5718		return (error);
5719	if (nd->nd_repstat != 0) {
5720		/*
5721		 * In case the rpc gets retried, roll
5722		 * the uio fileds changed by nfsm_uiombuf()
5723		 * back.
5724		 */
5725		uiop->uio_offset -= len;
5726		uio_uio_resid_add(uiop, len);
5727		uio_iov_base_add(uiop, -len);
5728		uio_iov_len_add(uiop, len);
5729		error = nd->nd_repstat;
5730	} else {
5731		NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_VERF);
5732		rlen = fxdr_unsigned(int, *tl++);
5733		if (rlen == 0) {
5734			error = NFSERR_IO;
5735			goto nfsmout;
5736		} else if (rlen < len) {
5737			backup = len - rlen;
5738			uio_iov_base_add(uiop, -(backup));
5739			uio_iov_len_add(uiop, backup);
5740			uiop->uio_offset -= backup;
5741			uio_uio_resid_add(uiop, backup);
5742			len = rlen;
5743		}
5744		commit = fxdr_unsigned(int, *tl++);
5745
5746		/*
5747		 * Return the lowest committment level
5748		 * obtained by any of the RPCs.
5749		 */
5750		if (committed == NFSWRITE_FILESYNC)
5751			committed = commit;
5752		else if (committed == NFSWRITE_DATASYNC &&
5753		    commit == NFSWRITE_UNSTABLE)
5754			committed = commit;
5755		if (commit_thru_mds != 0) {
5756			NFSLOCKMNT(nmp);
5757			if (!NFSHASWRITEVERF(nmp)) {
5758				NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5759				NFSSETWRITEVERF(nmp);
5760	    		} else if (NFSBCMP(tl, nmp->nm_verf, NFSX_VERF)) {
5761				*must_commit = 1;
5762				NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5763			}
5764			NFSUNLOCKMNT(nmp);
5765		} else {
5766			NFSLOCKDS(dsp);
5767			if ((dsp->nfsclds_flags & NFSCLDS_HASWRITEVERF) == 0) {
5768				NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5769				dsp->nfsclds_flags |= NFSCLDS_HASWRITEVERF;
5770			} else if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
5771				*must_commit = 1;
5772				NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5773			}
5774			NFSUNLOCKDS(dsp);
5775		}
5776	}
5777nfsmout:
5778	if (nd->nd_mrep != NULL)
5779		mbuf_freem(nd->nd_mrep);
5780	*iomode = committed;
5781	if (nd->nd_repstat != 0 && error == 0)
5782		error = nd->nd_repstat;
5783	return (error);
5784}
5785
5786/*
5787 * Free up the nfsclds structure.
5788 */
5789void
5790nfscl_freenfsclds(struct nfsclds *dsp)
5791{
5792	int i;
5793
5794	if (dsp == NULL)
5795		return;
5796	if (dsp->nfsclds_sockp != NULL) {
5797		NFSFREECRED(dsp->nfsclds_sockp->nr_cred);
5798		NFSFREEMUTEX(&dsp->nfsclds_sockp->nr_mtx);
5799		free(dsp->nfsclds_sockp->nr_nam, M_SONAME);
5800		free(dsp->nfsclds_sockp, M_NFSSOCKREQ);
5801	}
5802	NFSFREEMUTEX(&dsp->nfsclds_mtx);
5803	NFSFREEMUTEX(&dsp->nfsclds_sess.nfsess_mtx);
5804	for (i = 0; i < NFSV4_CBSLOTS; i++) {
5805		if (dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply != NULL)
5806			m_freem(
5807			    dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply);
5808	}
5809	free(dsp, M_NFSCLDS);
5810}
5811
5812static enum nfsclds_state
5813nfscl_getsameserver(struct nfsmount *nmp, struct nfsclds *newdsp,
5814    struct nfsclds **retdspp)
5815{
5816	struct nfsclds *dsp, *cur_dsp;
5817
5818	/*
5819	 * Search the list of nfsclds structures for one with the same
5820	 * server.
5821	 */
5822	cur_dsp = NULL;
5823	TAILQ_FOREACH(dsp, &nmp->nm_sess, nfsclds_list) {
5824		if (dsp->nfsclds_servownlen == newdsp->nfsclds_servownlen &&
5825		    dsp->nfsclds_servownlen != 0 &&
5826		    !NFSBCMP(dsp->nfsclds_serverown, newdsp->nfsclds_serverown,
5827		    dsp->nfsclds_servownlen)) {
5828			NFSCL_DEBUG(4, "fnd same fdsp=%p dsp=%p flg=0x%x\n",
5829			    TAILQ_FIRST(&nmp->nm_sess), dsp,
5830			    dsp->nfsclds_flags);
5831			/* Server major id matches. */
5832			if ((dsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5833				*retdspp = dsp;
5834				return (NFSDSP_USETHISSESSION);
5835			}
5836
5837			/*
5838			 * Note the first match, so it can be used for
5839			 * sequence'ing new sessions.
5840			 */
5841			if (cur_dsp == NULL)
5842				cur_dsp = dsp;
5843		}
5844	}
5845	if (cur_dsp != NULL) {
5846		*retdspp = cur_dsp;
5847		return (NFSDSP_SEQTHISSESSION);
5848	}
5849	return (NFSDSP_NOTFOUND);
5850}
5851
5852#ifdef notyet
5853/*
5854 * NFS commit rpc to a DS.
5855 */
5856static int
5857nfsrpc_commitds(vnode_t vp, uint64_t offset, int cnt, struct nfsclds *dsp,
5858    struct nfsfh *fhp, struct ucred *cred, NFSPROC_T *p, void *stuff)
5859{
5860	uint32_t *tl;
5861	struct nfsrv_descript nfsd, *nd = &nfsd;
5862	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5863	struct nfssockreq *nrp;
5864	int error;
5865
5866	nfscl_reqstart(nd, NFSPROC_COMMITDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5867	    NULL, &dsp->nfsclds_sess);
5868	NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + NFSX_UNSIGNED);
5869	txdr_hyper(offset, tl);
5870	tl += 2;
5871	*tl = txdr_unsigned(cnt);
5872	nrp = dsp->nfsclds_sockp;
5873	if (nrp == NULL)
5874		/* If NULL, use the MDS socket. */
5875		nrp = &nmp->nm_sockreq;
5876	error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5877	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5878	if (error)
5879		return (error);
5880	if (nd->nd_repstat == 0) {
5881		NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
5882		NFSLOCKDS(dsp);
5883		if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
5884			NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5885			error = NFSERR_STALEWRITEVERF;
5886		}
5887		NFSUNLOCKDS(dsp);
5888	}
5889nfsmout:
5890	if (error == 0 && nd->nd_repstat != 0)
5891		error = nd->nd_repstat;
5892	mbuf_freem(nd->nd_mrep);
5893	return (error);
5894}
5895#endif
5896
5897