1/*-
2 * Copyright (c) 1989, 1993
3 *	The Regents of the University of California.  All rights reserved.
4 *
5 * This code is derived from software contributed to Berkeley by
6 * Rick Macklem at The University of Guelph.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 *    notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 *    notice, this list of conditions and the following disclaimer in the
15 *    documentation and/or other materials provided with the distribution.
16 * 4. Neither the name of the University nor the names of its contributors
17 *    may be used to endorse or promote products derived from this software
18 *    without specific prior written permission.
19 *
20 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30 * SUCH DAMAGE.
31 *
32 */
33
34#include <sys/cdefs.h>
35__FBSDID("$FreeBSD$");
36
37/*
38 * Rpc op calls, generally called from the vnode op calls or through the
39 * buffer cache, for NFS v2, 3 and 4.
40 * These do not normally make any changes to vnode arguments or use
41 * structures that might change between the VFS variants. The returned
42 * arguments are all at the end, after the NFSPROC_T *p one.
43 */
44
45#ifndef APPLEKEXT
46#include "opt_inet6.h"
47
48#include <fs/nfs/nfsport.h>
49
50/*
51 * Global variables
52 */
53extern int nfs_numnfscbd;
54extern struct timeval nfsboottime;
55extern u_int32_t newnfs_false, newnfs_true;
56extern nfstype nfsv34_type[9];
57extern int nfsrv_useacl;
58extern char nfsv4_callbackaddr[INET6_ADDRSTRLEN];
59extern int nfscl_debuglevel;
60NFSCLSTATEMUTEX;
61int nfstest_outofseq = 0;
62int nfscl_assumeposixlocks = 1;
63int nfscl_enablecallb = 0;
64short nfsv4_cbport = NFSV4_CBPORT;
65int nfstest_openallsetattr = 0;
66#endif	/* !APPLEKEXT */
67
68#define	DIRHDSIZ	(sizeof (struct dirent) - (MAXNAMLEN + 1))
69
70/*
71 * nfscl_getsameserver() can return one of three values:
72 * NFSDSP_USETHISSESSION - Use this session for the DS.
73 * NFSDSP_SEQTHISSESSION - Use the nfsclds_sequence field of this dsp for new
74 *     session.
75 * NFSDSP_NOTFOUND - No matching server was found.
76 */
77enum nfsclds_state {
78	NFSDSP_USETHISSESSION = 0,
79	NFSDSP_SEQTHISSESSION = 1,
80	NFSDSP_NOTFOUND = 2,
81};
82
83static int nfsrpc_setattrrpc(vnode_t , struct vattr *, nfsv4stateid_t *,
84    struct ucred *, NFSPROC_T *, struct nfsvattr *, int *, void *);
85static int nfsrpc_readrpc(vnode_t , struct uio *, struct ucred *,
86    nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *, void *);
87static int nfsrpc_writerpc(vnode_t , struct uio *, int *, int *,
88    struct ucred *, nfsv4stateid_t *, NFSPROC_T *, struct nfsvattr *, int *,
89    void *);
90static int nfsrpc_createv23(vnode_t , char *, int, struct vattr *,
91    nfsquad_t, int, struct ucred *, NFSPROC_T *, struct nfsvattr *,
92    struct nfsvattr *, struct nfsfh **, int *, int *, void *);
93static int nfsrpc_createv4(vnode_t , char *, int, struct vattr *,
94    nfsquad_t, int, struct nfsclowner *, struct nfscldeleg **, struct ucred *,
95    NFSPROC_T *, struct nfsvattr *, struct nfsvattr *, struct nfsfh **, int *,
96    int *, void *, int *);
97static int nfsrpc_locku(struct nfsrv_descript *, struct nfsmount *,
98    struct nfscllockowner *, u_int64_t, u_int64_t,
99    u_int32_t, struct ucred *, NFSPROC_T *, int);
100static int nfsrpc_setaclrpc(vnode_t, struct ucred *, NFSPROC_T *,
101    struct acl *, nfsv4stateid_t *, void *);
102static int nfsrpc_getlayout(struct nfsmount *, vnode_t, struct nfsfh *, int,
103    uint32_t *, nfsv4stateid_t *, uint64_t, struct nfscllayout **,
104    struct ucred *, NFSPROC_T *);
105static int nfsrpc_fillsa(struct nfsmount *, struct sockaddr_storage *,
106    struct nfsclds **, NFSPROC_T *);
107static void nfscl_initsessionslots(struct nfsclsession *);
108static int nfscl_doflayoutio(vnode_t, struct uio *, int *, int *, int *,
109    nfsv4stateid_t *, int, struct nfscldevinfo *, struct nfscllayout *,
110    struct nfsclflayout *, uint64_t, uint64_t, struct ucred *, NFSPROC_T *);
111static int nfsrpc_readds(vnode_t, struct uio *, nfsv4stateid_t *, int *,
112    struct nfsclds *, uint64_t, int, struct nfsfh *, struct ucred *,
113    NFSPROC_T *);
114static int nfsrpc_writeds(vnode_t, struct uio *, int *, int *,
115    nfsv4stateid_t *, struct nfsclds *, uint64_t, int,
116    struct nfsfh *, int, struct ucred *, NFSPROC_T *);
117static enum nfsclds_state nfscl_getsameserver(struct nfsmount *,
118    struct nfsclds *, struct nfsclds **);
119#ifdef notyet
120static int nfsrpc_commitds(vnode_t, uint64_t, int, struct nfsclds *,
121    struct nfsfh *, struct ucred *, NFSPROC_T *, void *);
122#endif
123
124/*
125 * nfs null call from vfs.
126 */
127APPLESTATIC int
128nfsrpc_null(vnode_t vp, struct ucred *cred, NFSPROC_T *p)
129{
130	int error;
131	struct nfsrv_descript nfsd, *nd = &nfsd;
132
133	NFSCL_REQSTART(nd, NFSPROC_NULL, vp);
134	error = nfscl_request(nd, vp, p, cred, NULL);
135	if (nd->nd_repstat && !error)
136		error = nd->nd_repstat;
137	mbuf_freem(nd->nd_mrep);
138	return (error);
139}
140
141/*
142 * nfs access rpc op.
143 * For nfs version 3 and 4, use the access rpc to check accessibility. If file
144 * modes are changed on the server, accesses might still fail later.
145 */
146APPLESTATIC int
147nfsrpc_access(vnode_t vp, int acmode, struct ucred *cred,
148    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp)
149{
150	int error;
151	u_int32_t mode, rmode;
152
153	if (acmode & VREAD)
154		mode = NFSACCESS_READ;
155	else
156		mode = 0;
157	if (vnode_vtype(vp) == VDIR) {
158		if (acmode & VWRITE)
159			mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND |
160				 NFSACCESS_DELETE);
161		if (acmode & VEXEC)
162			mode |= NFSACCESS_LOOKUP;
163	} else {
164		if (acmode & VWRITE)
165			mode |= (NFSACCESS_MODIFY | NFSACCESS_EXTEND);
166		if (acmode & VEXEC)
167			mode |= NFSACCESS_EXECUTE;
168	}
169
170	/*
171	 * Now, just call nfsrpc_accessrpc() to do the actual RPC.
172	 */
173	error = nfsrpc_accessrpc(vp, mode, cred, p, nap, attrflagp, &rmode,
174	    NULL);
175
176	/*
177	 * The NFS V3 spec does not clarify whether or not
178	 * the returned access bits can be a superset of
179	 * the ones requested, so...
180	 */
181	if (!error && (rmode & mode) != mode)
182		error = EACCES;
183	return (error);
184}
185
186/*
187 * The actual rpc, separated out for Darwin.
188 */
189APPLESTATIC int
190nfsrpc_accessrpc(vnode_t vp, u_int32_t mode, struct ucred *cred,
191    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, u_int32_t *rmodep,
192    void *stuff)
193{
194	u_int32_t *tl;
195	u_int32_t supported, rmode;
196	int error;
197	struct nfsrv_descript nfsd, *nd = &nfsd;
198	nfsattrbit_t attrbits;
199
200	*attrflagp = 0;
201	supported = mode;
202	NFSCL_REQSTART(nd, NFSPROC_ACCESS, vp);
203	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
204	*tl = txdr_unsigned(mode);
205	if (nd->nd_flag & ND_NFSV4) {
206		/*
207		 * And do a Getattr op.
208		 */
209		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
210		*tl = txdr_unsigned(NFSV4OP_GETATTR);
211		NFSGETATTR_ATTRBIT(&attrbits);
212		(void) nfsrv_putattrbit(nd, &attrbits);
213	}
214	error = nfscl_request(nd, vp, p, cred, stuff);
215	if (error)
216		return (error);
217	if (nd->nd_flag & ND_NFSV3) {
218		error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
219		if (error)
220			goto nfsmout;
221	}
222	if (!nd->nd_repstat) {
223		if (nd->nd_flag & ND_NFSV4) {
224			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
225			supported = fxdr_unsigned(u_int32_t, *tl++);
226		} else {
227			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
228		}
229		rmode = fxdr_unsigned(u_int32_t, *tl);
230		if (nd->nd_flag & ND_NFSV4)
231			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
232
233		/*
234		 * It's not obvious what should be done about
235		 * unsupported access modes. For now, be paranoid
236		 * and clear the unsupported ones.
237		 */
238		rmode &= supported;
239		*rmodep = rmode;
240	} else
241		error = nd->nd_repstat;
242nfsmout:
243	mbuf_freem(nd->nd_mrep);
244	return (error);
245}
246
247/*
248 * nfs open rpc
249 */
250APPLESTATIC int
251nfsrpc_open(vnode_t vp, int amode, struct ucred *cred, NFSPROC_T *p)
252{
253	struct nfsclopen *op;
254	struct nfscldeleg *dp;
255	struct nfsfh *nfhp;
256	struct nfsnode *np = VTONFS(vp);
257	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
258	u_int32_t mode, clidrev;
259	int ret, newone, error, expireret = 0, retrycnt;
260
261	/*
262	 * For NFSv4, Open Ops are only done on Regular Files.
263	 */
264	if (vnode_vtype(vp) != VREG)
265		return (0);
266	mode = 0;
267	if (amode & FREAD)
268		mode |= NFSV4OPEN_ACCESSREAD;
269	if (amode & FWRITE)
270		mode |= NFSV4OPEN_ACCESSWRITE;
271	nfhp = np->n_fhp;
272
273	retrycnt = 0;
274#ifdef notdef
275{ char name[100]; int namel;
276namel = (np->n_v4->n4_namelen < 100) ? np->n_v4->n4_namelen : 99;
277bcopy(NFS4NODENAME(np->n_v4), name, namel);
278name[namel] = '\0';
279printf("rpcopen p=0x%x name=%s",p->p_pid,name);
280if (nfhp->nfh_len > 0) printf(" fh=0x%x\n",nfhp->nfh_fh[12]);
281else printf(" fhl=0\n");
282}
283#endif
284	do {
285	    dp = NULL;
286	    error = nfscl_open(vp, nfhp->nfh_fh, nfhp->nfh_len, mode, 1,
287		cred, p, NULL, &op, &newone, &ret, 1);
288	    if (error) {
289		return (error);
290	    }
291	    if (nmp->nm_clp != NULL)
292		clidrev = nmp->nm_clp->nfsc_clientidrev;
293	    else
294		clidrev = 0;
295	    if (ret == NFSCLOPEN_DOOPEN) {
296		if (np->n_v4 != NULL) {
297			error = nfsrpc_openrpc(nmp, vp, np->n_v4->n4_data,
298			   np->n_v4->n4_fhlen, np->n_fhp->nfh_fh,
299			   np->n_fhp->nfh_len, mode, op,
300			   NFS4NODENAME(np->n_v4), np->n_v4->n4_namelen, &dp,
301			   0, 0x0, cred, p, 0, 0);
302			if (dp != NULL) {
303#ifdef APPLE
304				OSBitAndAtomic((int32_t)~NDELEGMOD, (UInt32 *)&np->n_flag);
305#else
306				NFSLOCKNODE(np);
307				np->n_flag &= ~NDELEGMOD;
308				/*
309				 * Invalidate the attribute cache, so that
310				 * attributes that pre-date the issue of a
311				 * delegation are not cached, since the
312				 * cached attributes will remain valid while
313				 * the delegation is held.
314				 */
315				NFSINVALATTRCACHE(np);
316				NFSUNLOCKNODE(np);
317#endif
318				(void) nfscl_deleg(nmp->nm_mountp,
319				    op->nfso_own->nfsow_clp,
320				    nfhp->nfh_fh, nfhp->nfh_len, cred, p, &dp);
321			}
322		} else {
323			error = EIO;
324		}
325		newnfs_copyincred(cred, &op->nfso_cred);
326	    } else if (ret == NFSCLOPEN_SETCRED)
327		/*
328		 * This is a new local open on a delegation. It needs
329		 * to have credentials so that an open can be done
330		 * against the server during recovery.
331		 */
332		newnfs_copyincred(cred, &op->nfso_cred);
333
334	    /*
335	     * nfso_opencnt is the count of how many VOP_OPEN()s have
336	     * been done on this Open successfully and a VOP_CLOSE()
337	     * is expected for each of these.
338	     * If error is non-zero, don't increment it, since the Open
339	     * hasn't succeeded yet.
340	     */
341	    if (!error)
342		op->nfso_opencnt++;
343	    nfscl_openrelease(op, error, newone);
344	    if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
345		error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
346		error == NFSERR_BADSESSION) {
347		(void) nfs_catnap(PZERO, error, "nfs_open");
348	    } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
349		&& clidrev != 0) {
350		expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
351		retrycnt++;
352	    }
353	} while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
354	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
355	    error == NFSERR_BADSESSION ||
356	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
357	     expireret == 0 && clidrev != 0 && retrycnt < 4));
358	if (error && retrycnt >= 4)
359		error = EIO;
360	return (error);
361}
362
363/*
364 * the actual open rpc
365 */
366APPLESTATIC int
367nfsrpc_openrpc(struct nfsmount *nmp, vnode_t vp, u_int8_t *nfhp, int fhlen,
368    u_int8_t *newfhp, int newfhlen, u_int32_t mode, struct nfsclopen *op,
369    u_int8_t *name, int namelen, struct nfscldeleg **dpp,
370    int reclaim, u_int32_t delegtype, struct ucred *cred, NFSPROC_T *p,
371    int syscred, int recursed)
372{
373	u_int32_t *tl;
374	struct nfsrv_descript nfsd, *nd = &nfsd;
375	struct nfscldeleg *dp, *ndp = NULL;
376	struct nfsvattr nfsva;
377	u_int32_t rflags, deleg;
378	nfsattrbit_t attrbits;
379	int error, ret, acesize, limitby;
380
381	dp = *dpp;
382	*dpp = NULL;
383	nfscl_reqstart(nd, NFSPROC_OPEN, nmp, nfhp, fhlen, NULL, NULL);
384	NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
385	*tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
386	*tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
387	*tl++ = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
388	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
389	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
390	(void) nfsm_strtom(nd, op->nfso_own->nfsow_owner, NFSV4CL_LOCKNAMELEN);
391	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
392	*tl++ = txdr_unsigned(NFSV4OPEN_NOCREATE);
393	if (reclaim) {
394		*tl = txdr_unsigned(NFSV4OPEN_CLAIMPREVIOUS);
395		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
396		*tl = txdr_unsigned(delegtype);
397	} else {
398		if (dp != NULL) {
399			*tl = txdr_unsigned(NFSV4OPEN_CLAIMDELEGATECUR);
400			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
401			if (NFSHASNFSV4N(nmp))
402				*tl++ = 0;
403			else
404				*tl++ = dp->nfsdl_stateid.seqid;
405			*tl++ = dp->nfsdl_stateid.other[0];
406			*tl++ = dp->nfsdl_stateid.other[1];
407			*tl = dp->nfsdl_stateid.other[2];
408		} else {
409			*tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
410		}
411		(void) nfsm_strtom(nd, name, namelen);
412	}
413	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
414	*tl = txdr_unsigned(NFSV4OP_GETATTR);
415	NFSZERO_ATTRBIT(&attrbits);
416	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_CHANGE);
417	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TIMEMODIFY);
418	(void) nfsrv_putattrbit(nd, &attrbits);
419	if (syscred)
420		nd->nd_flag |= ND_USEGSSNAME;
421	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
422	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
423	if (error)
424		return (error);
425	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
426	if (!nd->nd_repstat) {
427		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
428		    6 * NFSX_UNSIGNED);
429		op->nfso_stateid.seqid = *tl++;
430		op->nfso_stateid.other[0] = *tl++;
431		op->nfso_stateid.other[1] = *tl++;
432		op->nfso_stateid.other[2] = *tl;
433		rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
434		error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
435		if (error)
436			goto nfsmout;
437		NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
438		deleg = fxdr_unsigned(u_int32_t, *tl);
439		if (deleg == NFSV4OPEN_DELEGATEREAD ||
440		    deleg == NFSV4OPEN_DELEGATEWRITE) {
441			if (!(op->nfso_own->nfsow_clp->nfsc_flags &
442			      NFSCLFLAGS_FIRSTDELEG))
443				op->nfso_own->nfsow_clp->nfsc_flags |=
444				  (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
445			MALLOC(ndp, struct nfscldeleg *,
446			    sizeof (struct nfscldeleg) + newfhlen,
447			    M_NFSCLDELEG, M_WAITOK);
448			LIST_INIT(&ndp->nfsdl_owner);
449			LIST_INIT(&ndp->nfsdl_lock);
450			ndp->nfsdl_clp = op->nfso_own->nfsow_clp;
451			ndp->nfsdl_fhlen = newfhlen;
452			NFSBCOPY(newfhp, ndp->nfsdl_fh, newfhlen);
453			newnfs_copyincred(cred, &ndp->nfsdl_cred);
454			nfscl_lockinit(&ndp->nfsdl_rwlock);
455			NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
456			    NFSX_UNSIGNED);
457			ndp->nfsdl_stateid.seqid = *tl++;
458			ndp->nfsdl_stateid.other[0] = *tl++;
459			ndp->nfsdl_stateid.other[1] = *tl++;
460			ndp->nfsdl_stateid.other[2] = *tl++;
461			ret = fxdr_unsigned(int, *tl);
462			if (deleg == NFSV4OPEN_DELEGATEWRITE) {
463				ndp->nfsdl_flags = NFSCLDL_WRITE;
464				/*
465				 * Indicates how much the file can grow.
466				 */
467				NFSM_DISSECT(tl, u_int32_t *,
468				    3 * NFSX_UNSIGNED);
469				limitby = fxdr_unsigned(int, *tl++);
470				switch (limitby) {
471				case NFSV4OPEN_LIMITSIZE:
472					ndp->nfsdl_sizelimit = fxdr_hyper(tl);
473					break;
474				case NFSV4OPEN_LIMITBLOCKS:
475					ndp->nfsdl_sizelimit =
476					    fxdr_unsigned(u_int64_t, *tl++);
477					ndp->nfsdl_sizelimit *=
478					    fxdr_unsigned(u_int64_t, *tl);
479					break;
480				default:
481					error = NFSERR_BADXDR;
482					goto nfsmout;
483				};
484			} else {
485				ndp->nfsdl_flags = NFSCLDL_READ;
486			}
487			if (ret)
488				ndp->nfsdl_flags |= NFSCLDL_RECALL;
489			error = nfsrv_dissectace(nd, &ndp->nfsdl_ace, &ret,
490			    &acesize, p);
491			if (error)
492				goto nfsmout;
493		} else if (deleg != NFSV4OPEN_DELEGATENONE) {
494			error = NFSERR_BADXDR;
495			goto nfsmout;
496		}
497		NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
498		error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
499		    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
500		    NULL, NULL, NULL, p, cred);
501		if (error)
502			goto nfsmout;
503		if (ndp != NULL) {
504			ndp->nfsdl_change = nfsva.na_filerev;
505			ndp->nfsdl_modtime = nfsva.na_mtime;
506			ndp->nfsdl_flags |= NFSCLDL_MODTIMESET;
507		}
508		if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM)) {
509		    do {
510			ret = nfsrpc_openconfirm(vp, newfhp, newfhlen, op,
511			    cred, p);
512			if (ret == NFSERR_DELAY)
513			    (void) nfs_catnap(PZERO, ret, "nfs_open");
514		    } while (ret == NFSERR_DELAY);
515		    error = ret;
516		}
517		if ((rflags & NFSV4OPEN_LOCKTYPEPOSIX) ||
518		    nfscl_assumeposixlocks)
519		    op->nfso_posixlock = 1;
520		else
521		    op->nfso_posixlock = 0;
522
523		/*
524		 * If the server is handing out delegations, but we didn't
525		 * get one because an OpenConfirm was required, try the
526		 * Open again, to get a delegation. This is a harmless no-op,
527		 * from a server's point of view.
528		 */
529		if (!reclaim && (rflags & NFSV4OPEN_RESULTCONFIRM) &&
530		    (op->nfso_own->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG)
531		    && !error && dp == NULL && ndp == NULL && !recursed) {
532		    do {
533			ret = nfsrpc_openrpc(nmp, vp, nfhp, fhlen, newfhp,
534			    newfhlen, mode, op, name, namelen, &ndp, 0, 0x0,
535			    cred, p, syscred, 1);
536			if (ret == NFSERR_DELAY)
537			    (void) nfs_catnap(PZERO, ret, "nfs_open2");
538		    } while (ret == NFSERR_DELAY);
539		    if (ret) {
540			if (ndp != NULL)
541				FREE((caddr_t)ndp, M_NFSCLDELEG);
542			if (ret == NFSERR_STALECLIENTID ||
543			    ret == NFSERR_STALEDONTRECOVER ||
544			    ret == NFSERR_BADSESSION)
545				error = ret;
546		    }
547		}
548	}
549	if (nd->nd_repstat != 0 && error == 0)
550		error = nd->nd_repstat;
551	if (error == NFSERR_STALECLIENTID || error == NFSERR_BADSESSION)
552		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
553nfsmout:
554	if (!error)
555		*dpp = ndp;
556	else if (ndp != NULL)
557		FREE((caddr_t)ndp, M_NFSCLDELEG);
558	mbuf_freem(nd->nd_mrep);
559	return (error);
560}
561
562/*
563 * open downgrade rpc
564 */
565APPLESTATIC int
566nfsrpc_opendowngrade(vnode_t vp, u_int32_t mode, struct nfsclopen *op,
567    struct ucred *cred, NFSPROC_T *p)
568{
569	u_int32_t *tl;
570	struct nfsrv_descript nfsd, *nd = &nfsd;
571	int error;
572
573	NFSCL_REQSTART(nd, NFSPROC_OPENDOWNGRADE, vp);
574	NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 3 * NFSX_UNSIGNED);
575	if (NFSHASNFSV4N(VFSTONFS(vnode_mount(vp))))
576		*tl++ = 0;
577	else
578		*tl++ = op->nfso_stateid.seqid;
579	*tl++ = op->nfso_stateid.other[0];
580	*tl++ = op->nfso_stateid.other[1];
581	*tl++ = op->nfso_stateid.other[2];
582	*tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
583	*tl++ = txdr_unsigned(mode & NFSV4OPEN_ACCESSBOTH);
584	*tl = txdr_unsigned((mode >> NFSLCK_SHIFT) & NFSV4OPEN_DENYBOTH);
585	error = nfscl_request(nd, vp, p, cred, NULL);
586	if (error)
587		return (error);
588	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
589	if (!nd->nd_repstat) {
590		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
591		op->nfso_stateid.seqid = *tl++;
592		op->nfso_stateid.other[0] = *tl++;
593		op->nfso_stateid.other[1] = *tl++;
594		op->nfso_stateid.other[2] = *tl;
595	}
596	if (nd->nd_repstat && error == 0)
597		error = nd->nd_repstat;
598	if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
599		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
600nfsmout:
601	mbuf_freem(nd->nd_mrep);
602	return (error);
603}
604
605/*
606 * V4 Close operation.
607 */
608APPLESTATIC int
609nfsrpc_close(vnode_t vp, int doclose, NFSPROC_T *p)
610{
611	struct nfsclclient *clp;
612	int error;
613
614	if (vnode_vtype(vp) != VREG)
615		return (0);
616	if (doclose)
617		error = nfscl_doclose(vp, &clp, p);
618	else
619		error = nfscl_getclose(vp, &clp);
620	if (error)
621		return (error);
622
623	nfscl_clientrelease(clp);
624	return (0);
625}
626
627/*
628 * Close the open.
629 */
630APPLESTATIC void
631nfsrpc_doclose(struct nfsmount *nmp, struct nfsclopen *op, NFSPROC_T *p)
632{
633	struct nfsrv_descript nfsd, *nd = &nfsd;
634	struct nfscllockowner *lp, *nlp;
635	struct nfscllock *lop, *nlop;
636	struct ucred *tcred;
637	u_int64_t off = 0, len = 0;
638	u_int32_t type = NFSV4LOCKT_READ;
639	int error, do_unlock, trycnt;
640
641	tcred = newnfs_getcred();
642	newnfs_copycred(&op->nfso_cred, tcred);
643	/*
644	 * (Theoretically this could be done in the same
645	 *  compound as the close, but having multiple
646	 *  sequenced Ops in the same compound might be
647	 *  too scary for some servers.)
648	 */
649	if (op->nfso_posixlock) {
650		off = 0;
651		len = NFS64BITSSET;
652		type = NFSV4LOCKT_READ;
653	}
654
655	/*
656	 * Since this function is only called from VOP_INACTIVE(), no
657	 * other thread will be manipulating this Open. As such, the
658	 * lock lists are not being changed by other threads, so it should
659	 * be safe to do this without locking.
660	 */
661	LIST_FOREACH(lp, &op->nfso_lock, nfsl_list) {
662		do_unlock = 1;
663		LIST_FOREACH_SAFE(lop, &lp->nfsl_lock, nfslo_list, nlop) {
664			if (op->nfso_posixlock == 0) {
665				off = lop->nfslo_first;
666				len = lop->nfslo_end - lop->nfslo_first;
667				if (lop->nfslo_type == F_WRLCK)
668					type = NFSV4LOCKT_WRITE;
669				else
670					type = NFSV4LOCKT_READ;
671			}
672			if (do_unlock) {
673				trycnt = 0;
674				do {
675					error = nfsrpc_locku(nd, nmp, lp, off,
676					    len, type, tcred, p, 0);
677					if ((nd->nd_repstat == NFSERR_GRACE ||
678					    nd->nd_repstat == NFSERR_DELAY) &&
679					    error == 0)
680						(void) nfs_catnap(PZERO,
681						    (int)nd->nd_repstat,
682						    "nfs_close");
683				} while ((nd->nd_repstat == NFSERR_GRACE ||
684				    nd->nd_repstat == NFSERR_DELAY) &&
685				    error == 0 && trycnt++ < 5);
686				if (op->nfso_posixlock)
687					do_unlock = 0;
688			}
689			nfscl_freelock(lop, 0);
690		}
691		/*
692		 * Do a ReleaseLockOwner.
693		 * The lock owner name nfsl_owner may be used by other opens for
694		 * other files but the lock_owner4 name that nfsrpc_rellockown()
695		 * puts on the wire has the file handle for this file appended
696		 * to it, so it can be done now.
697		 */
698		(void)nfsrpc_rellockown(nmp, lp, lp->nfsl_open->nfso_fh,
699		    lp->nfsl_open->nfso_fhlen, tcred, p);
700	}
701
702	/*
703	 * There could be other Opens for different files on the same
704	 * OpenOwner, so locking is required.
705	 */
706	NFSLOCKCLSTATE();
707	nfscl_lockexcl(&op->nfso_own->nfsow_rwlock, NFSCLSTATEMUTEXPTR);
708	NFSUNLOCKCLSTATE();
709	do {
710		error = nfscl_tryclose(op, tcred, nmp, p);
711		if (error == NFSERR_GRACE)
712			(void) nfs_catnap(PZERO, error, "nfs_close");
713	} while (error == NFSERR_GRACE);
714	NFSLOCKCLSTATE();
715	nfscl_lockunlock(&op->nfso_own->nfsow_rwlock);
716
717	LIST_FOREACH_SAFE(lp, &op->nfso_lock, nfsl_list, nlp)
718		nfscl_freelockowner(lp, 0);
719	nfscl_freeopen(op, 0);
720	NFSUNLOCKCLSTATE();
721	NFSFREECRED(tcred);
722}
723
724/*
725 * The actual Close RPC.
726 */
727APPLESTATIC int
728nfsrpc_closerpc(struct nfsrv_descript *nd, struct nfsmount *nmp,
729    struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p,
730    int syscred)
731{
732	u_int32_t *tl;
733	int error;
734
735	nfscl_reqstart(nd, NFSPROC_CLOSE, nmp, op->nfso_fh,
736	    op->nfso_fhlen, NULL, NULL);
737	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
738	*tl++ = txdr_unsigned(op->nfso_own->nfsow_seqid);
739	if (NFSHASNFSV4N(nmp))
740		*tl++ = 0;
741	else
742		*tl++ = op->nfso_stateid.seqid;
743	*tl++ = op->nfso_stateid.other[0];
744	*tl++ = op->nfso_stateid.other[1];
745	*tl = op->nfso_stateid.other[2];
746	if (syscred)
747		nd->nd_flag |= ND_USEGSSNAME;
748	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
749	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
750	if (error)
751		return (error);
752	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
753	if (nd->nd_repstat == 0)
754		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
755	error = nd->nd_repstat;
756	if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
757		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
758nfsmout:
759	mbuf_freem(nd->nd_mrep);
760	return (error);
761}
762
763/*
764 * V4 Open Confirm RPC.
765 */
766APPLESTATIC int
767nfsrpc_openconfirm(vnode_t vp, u_int8_t *nfhp, int fhlen,
768    struct nfsclopen *op, struct ucred *cred, NFSPROC_T *p)
769{
770	u_int32_t *tl;
771	struct nfsrv_descript nfsd, *nd = &nfsd;
772	struct nfsmount *nmp;
773	int error;
774
775	nmp = VFSTONFS(vnode_mount(vp));
776	if (NFSHASNFSV4N(nmp))
777		return (0);		/* No confirmation for NFSv4.1. */
778	nfscl_reqstart(nd, NFSPROC_OPENCONFIRM, nmp, nfhp, fhlen, NULL, NULL);
779	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED + NFSX_STATEID);
780	*tl++ = op->nfso_stateid.seqid;
781	*tl++ = op->nfso_stateid.other[0];
782	*tl++ = op->nfso_stateid.other[1];
783	*tl++ = op->nfso_stateid.other[2];
784	*tl = txdr_unsigned(op->nfso_own->nfsow_seqid);
785	error = nfscl_request(nd, vp, p, cred, NULL);
786	if (error)
787		return (error);
788	NFSCL_INCRSEQID(op->nfso_own->nfsow_seqid, nd);
789	if (!nd->nd_repstat) {
790		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
791		op->nfso_stateid.seqid = *tl++;
792		op->nfso_stateid.other[0] = *tl++;
793		op->nfso_stateid.other[1] = *tl++;
794		op->nfso_stateid.other[2] = *tl;
795	}
796	error = nd->nd_repstat;
797	if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
798		nfscl_initiate_recovery(op->nfso_own->nfsow_clp);
799nfsmout:
800	mbuf_freem(nd->nd_mrep);
801	return (error);
802}
803
804/*
805 * Do the setclientid and setclientid confirm RPCs. Called from nfs_statfs()
806 * when a mount has just occurred and when the server replies NFSERR_EXPIRED.
807 */
808APPLESTATIC int
809nfsrpc_setclient(struct nfsmount *nmp, struct nfsclclient *clp, int reclaim,
810    struct ucred *cred, NFSPROC_T *p)
811{
812	u_int32_t *tl;
813	struct nfsrv_descript nfsd;
814	struct nfsrv_descript *nd = &nfsd;
815	nfsattrbit_t attrbits;
816	u_int8_t *cp = NULL, *cp2, addr[INET6_ADDRSTRLEN + 9];
817	u_short port;
818	int error, isinet6 = 0, callblen;
819	nfsquad_t confirm;
820	u_int32_t lease;
821	static u_int32_t rev = 0;
822	struct nfsclds *dsp, *ndsp, *tdsp;
823
824	if (nfsboottime.tv_sec == 0)
825		NFSSETBOOTTIME(nfsboottime);
826	clp->nfsc_rev = rev++;
827	if (NFSHASNFSV4N(nmp)) {
828		error = nfsrpc_exchangeid(nmp, clp, &nmp->nm_sockreq,
829		    NFSV4EXCH_USEPNFSMDS | NFSV4EXCH_USENONPNFS, &dsp, cred, p);
830		NFSCL_DEBUG(1, "aft exch=%d\n", error);
831		if (error == 0) {
832			error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
833			    &nmp->nm_sockreq,
834			    dsp->nfsclds_sess.nfsess_sequenceid, 1, cred, p);
835			if (error == 0) {
836				NFSLOCKMNT(nmp);
837				TAILQ_FOREACH_SAFE(tdsp, &nmp->nm_sess,
838				    nfsclds_list, ndsp)
839					nfscl_freenfsclds(tdsp);
840				TAILQ_INIT(&nmp->nm_sess);
841				TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp,
842				    nfsclds_list);
843				NFSUNLOCKMNT(nmp);
844			} else
845				nfscl_freenfsclds(dsp);
846			NFSCL_DEBUG(1, "aft createsess=%d\n", error);
847		}
848		if (error == 0 && reclaim == 0) {
849			error = nfsrpc_reclaimcomplete(nmp, cred, p);
850			NFSCL_DEBUG(1, "aft reclaimcomp=%d\n", error);
851			if (error == NFSERR_COMPLETEALREADY ||
852			    error == NFSERR_NOTSUPP)
853				/* Ignore this error. */
854				error = 0;
855		}
856		return (error);
857	}
858
859	/*
860	 * Allocate a single session structure for NFSv4.0, because some of
861	 * the fields are used by NFSv4.0 although it doesn't do a session.
862	 */
863	dsp = malloc(sizeof(struct nfsclds), M_NFSCLDS, M_WAITOK | M_ZERO);
864	mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
865	mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession", NULL, MTX_DEF);
866	NFSLOCKMNT(nmp);
867	TAILQ_INSERT_HEAD(&nmp->nm_sess, dsp, nfsclds_list);
868	NFSUNLOCKMNT(nmp);
869
870	nfscl_reqstart(nd, NFSPROC_SETCLIENTID, nmp, NULL, 0, NULL, NULL);
871	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
872	*tl++ = txdr_unsigned(nfsboottime.tv_sec);
873	*tl = txdr_unsigned(clp->nfsc_rev);
874	(void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
875
876	/*
877	 * set up the callback address
878	 */
879	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
880	*tl = txdr_unsigned(NFS_CALLBCKPROG);
881	callblen = strlen(nfsv4_callbackaddr);
882	if (callblen == 0)
883		cp = nfscl_getmyip(nmp, &isinet6);
884	if (nfscl_enablecallb && nfs_numnfscbd > 0 &&
885	    (callblen > 0 || cp != NULL)) {
886		port = htons(nfsv4_cbport);
887		cp2 = (u_int8_t *)&port;
888#ifdef INET6
889		if ((callblen > 0 &&
890		     strchr(nfsv4_callbackaddr, ':')) || isinet6) {
891			char ip6buf[INET6_ADDRSTRLEN], *ip6add;
892
893			(void) nfsm_strtom(nd, "tcp6", 4);
894			if (callblen == 0) {
895				ip6_sprintf(ip6buf, (struct in6_addr *)cp);
896				ip6add = ip6buf;
897			} else {
898				ip6add = nfsv4_callbackaddr;
899			}
900			snprintf(addr, INET6_ADDRSTRLEN + 9, "%s.%d.%d",
901			    ip6add, cp2[0], cp2[1]);
902		} else
903#endif
904		{
905			(void) nfsm_strtom(nd, "tcp", 3);
906			if (callblen == 0)
907				snprintf(addr, INET6_ADDRSTRLEN + 9,
908				    "%d.%d.%d.%d.%d.%d", cp[0], cp[1],
909				    cp[2], cp[3], cp2[0], cp2[1]);
910			else
911				snprintf(addr, INET6_ADDRSTRLEN + 9,
912				    "%s.%d.%d", nfsv4_callbackaddr,
913				    cp2[0], cp2[1]);
914		}
915		(void) nfsm_strtom(nd, addr, strlen(addr));
916	} else {
917		(void) nfsm_strtom(nd, "tcp", 3);
918		(void) nfsm_strtom(nd, "0.0.0.0.0.0", 11);
919	}
920	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
921	*tl = txdr_unsigned(clp->nfsc_cbident);
922	nd->nd_flag |= ND_USEGSSNAME;
923	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
924		NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
925	if (error)
926		return (error);
927	if (nd->nd_repstat == 0) {
928	    NFSM_DISSECT(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
929	    NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0] = *tl++;
930	    NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1] = *tl++;
931	    confirm.lval[0] = *tl++;
932	    confirm.lval[1] = *tl;
933	    mbuf_freem(nd->nd_mrep);
934	    nd->nd_mrep = NULL;
935
936	    /*
937	     * and confirm it.
938	     */
939	    nfscl_reqstart(nd, NFSPROC_SETCLIENTIDCFRM, nmp, NULL, 0, NULL,
940		NULL);
941	    NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
942	    *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
943	    *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
944	    *tl++ = confirm.lval[0];
945	    *tl = confirm.lval[1];
946	    nd->nd_flag |= ND_USEGSSNAME;
947	    error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
948		cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
949	    if (error)
950		return (error);
951	    mbuf_freem(nd->nd_mrep);
952	    nd->nd_mrep = NULL;
953	    if (nd->nd_repstat == 0) {
954		nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, nmp->nm_fh,
955		    nmp->nm_fhsize, NULL, NULL);
956		NFSZERO_ATTRBIT(&attrbits);
957		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
958		(void) nfsrv_putattrbit(nd, &attrbits);
959		nd->nd_flag |= ND_USEGSSNAME;
960		error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p,
961		    cred, NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
962		if (error)
963		    return (error);
964		if (nd->nd_repstat == 0) {
965		    error = nfsv4_loadattr(nd, NULL, NULL, NULL, NULL, 0, NULL,
966			NULL, NULL, NULL, NULL, 0, NULL, &lease, NULL, p, cred);
967		    if (error)
968			goto nfsmout;
969		    clp->nfsc_renew = NFSCL_RENEW(lease);
970		    clp->nfsc_expire = NFSD_MONOSEC + clp->nfsc_renew;
971		    clp->nfsc_clientidrev++;
972		    if (clp->nfsc_clientidrev == 0)
973			clp->nfsc_clientidrev++;
974		}
975	    }
976	}
977	error = nd->nd_repstat;
978nfsmout:
979	mbuf_freem(nd->nd_mrep);
980	return (error);
981}
982
983/*
984 * nfs getattr call.
985 */
986APPLESTATIC int
987nfsrpc_getattr(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
988    struct nfsvattr *nap, void *stuff)
989{
990	struct nfsrv_descript nfsd, *nd = &nfsd;
991	int error;
992	nfsattrbit_t attrbits;
993
994	NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
995	if (nd->nd_flag & ND_NFSV4) {
996		NFSGETATTR_ATTRBIT(&attrbits);
997		(void) nfsrv_putattrbit(nd, &attrbits);
998	}
999	error = nfscl_request(nd, vp, p, cred, stuff);
1000	if (error)
1001		return (error);
1002	if (!nd->nd_repstat)
1003		error = nfsm_loadattr(nd, nap);
1004	else
1005		error = nd->nd_repstat;
1006	mbuf_freem(nd->nd_mrep);
1007	return (error);
1008}
1009
1010/*
1011 * nfs getattr call with non-vnode arguemnts.
1012 */
1013APPLESTATIC int
1014nfsrpc_getattrnovp(struct nfsmount *nmp, u_int8_t *fhp, int fhlen, int syscred,
1015    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, u_int64_t *xidp,
1016    uint32_t *leasep)
1017{
1018	struct nfsrv_descript nfsd, *nd = &nfsd;
1019	int error, vers = NFS_VER2;
1020	nfsattrbit_t attrbits;
1021
1022	nfscl_reqstart(nd, NFSPROC_GETATTR, nmp, fhp, fhlen, NULL, NULL);
1023	if (nd->nd_flag & ND_NFSV4) {
1024		vers = NFS_VER4;
1025		NFSGETATTR_ATTRBIT(&attrbits);
1026		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_LEASETIME);
1027		(void) nfsrv_putattrbit(nd, &attrbits);
1028	} else if (nd->nd_flag & ND_NFSV3) {
1029		vers = NFS_VER3;
1030	}
1031	if (syscred)
1032		nd->nd_flag |= ND_USEGSSNAME;
1033	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
1034	    NFS_PROG, vers, NULL, 1, xidp, NULL);
1035	if (error)
1036		return (error);
1037	if (nd->nd_repstat == 0) {
1038		if ((nd->nd_flag & ND_NFSV4) != 0)
1039			error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
1040			    NULL, NULL, NULL, NULL, NULL, 0, NULL, leasep, NULL,
1041			    NULL, NULL);
1042		else
1043			error = nfsm_loadattr(nd, nap);
1044	} else
1045		error = nd->nd_repstat;
1046	mbuf_freem(nd->nd_mrep);
1047	return (error);
1048}
1049
1050/*
1051 * Do an nfs setattr operation.
1052 */
1053APPLESTATIC int
1054nfsrpc_setattr(vnode_t vp, struct vattr *vap, NFSACL_T *aclp,
1055    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *rnap, int *attrflagp,
1056    void *stuff)
1057{
1058	int error, expireret = 0, openerr, retrycnt;
1059	u_int32_t clidrev = 0, mode;
1060	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1061	struct nfsfh *nfhp;
1062	nfsv4stateid_t stateid;
1063	void *lckp;
1064
1065	if (nmp->nm_clp != NULL)
1066		clidrev = nmp->nm_clp->nfsc_clientidrev;
1067	if (vap != NULL && NFSATTRISSET(u_quad_t, vap, va_size))
1068		mode = NFSV4OPEN_ACCESSWRITE;
1069	else
1070		mode = NFSV4OPEN_ACCESSREAD;
1071	retrycnt = 0;
1072	do {
1073		lckp = NULL;
1074		openerr = 1;
1075		if (NFSHASNFSV4(nmp)) {
1076			nfhp = VTONFS(vp)->n_fhp;
1077			error = nfscl_getstateid(vp, nfhp->nfh_fh,
1078			    nfhp->nfh_len, mode, 0, cred, p, &stateid, &lckp);
1079			if (error && vnode_vtype(vp) == VREG &&
1080			    (mode == NFSV4OPEN_ACCESSWRITE ||
1081			     nfstest_openallsetattr)) {
1082				/*
1083				 * No Open stateid, so try and open the file
1084				 * now.
1085				 */
1086				if (mode == NFSV4OPEN_ACCESSWRITE)
1087					openerr = nfsrpc_open(vp, FWRITE, cred,
1088					    p);
1089				else
1090					openerr = nfsrpc_open(vp, FREAD, cred,
1091					    p);
1092				if (!openerr)
1093					(void) nfscl_getstateid(vp,
1094					    nfhp->nfh_fh, nfhp->nfh_len,
1095					    mode, 0, cred, p, &stateid, &lckp);
1096			}
1097		}
1098		if (vap != NULL)
1099			error = nfsrpc_setattrrpc(vp, vap, &stateid, cred, p,
1100			    rnap, attrflagp, stuff);
1101		else
1102			error = nfsrpc_setaclrpc(vp, cred, p, aclp, &stateid,
1103			    stuff);
1104		if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1105			nfscl_initiate_recovery(nmp->nm_clp);
1106		if (lckp != NULL)
1107			nfscl_lockderef(lckp);
1108		if (!openerr)
1109			(void) nfsrpc_close(vp, 0, p);
1110		if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1111		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1112		    error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1113			(void) nfs_catnap(PZERO, error, "nfs_setattr");
1114		} else if ((error == NFSERR_EXPIRED ||
1115		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1116			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1117		}
1118		retrycnt++;
1119	} while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1120	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1121	    error == NFSERR_BADSESSION ||
1122	    (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1123	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1124	     expireret == 0 && clidrev != 0 && retrycnt < 4));
1125	if (error && retrycnt >= 4)
1126		error = EIO;
1127	return (error);
1128}
1129
1130static int
1131nfsrpc_setattrrpc(vnode_t vp, struct vattr *vap,
1132    nfsv4stateid_t *stateidp, struct ucred *cred, NFSPROC_T *p,
1133    struct nfsvattr *rnap, int *attrflagp, void *stuff)
1134{
1135	u_int32_t *tl;
1136	struct nfsrv_descript nfsd, *nd = &nfsd;
1137	int error;
1138	nfsattrbit_t attrbits;
1139
1140	*attrflagp = 0;
1141	NFSCL_REQSTART(nd, NFSPROC_SETATTR, vp);
1142	if (nd->nd_flag & ND_NFSV4)
1143		nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1144	vap->va_type = vnode_vtype(vp);
1145	nfscl_fillsattr(nd, vap, vp, NFSSATTR_FULL, 0);
1146	if (nd->nd_flag & ND_NFSV3) {
1147		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1148		*tl = newnfs_false;
1149	} else if (nd->nd_flag & ND_NFSV4) {
1150		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1151		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1152		NFSGETATTR_ATTRBIT(&attrbits);
1153		(void) nfsrv_putattrbit(nd, &attrbits);
1154	}
1155	error = nfscl_request(nd, vp, p, cred, stuff);
1156	if (error)
1157		return (error);
1158	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1159		error = nfscl_wcc_data(nd, vp, rnap, attrflagp, NULL, stuff);
1160	if ((nd->nd_flag & ND_NFSV4) && !error)
1161		error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
1162	if (!(nd->nd_flag & ND_NFSV3) && !nd->nd_repstat && !error)
1163		error = nfscl_postop_attr(nd, rnap, attrflagp, stuff);
1164	mbuf_freem(nd->nd_mrep);
1165	if (nd->nd_repstat && !error)
1166		error = nd->nd_repstat;
1167	return (error);
1168}
1169
1170/*
1171 * nfs lookup rpc
1172 */
1173APPLESTATIC int
1174nfsrpc_lookup(vnode_t dvp, char *name, int len, struct ucred *cred,
1175    NFSPROC_T *p, struct nfsvattr *dnap, struct nfsvattr *nap,
1176    struct nfsfh **nfhpp, int *attrflagp, int *dattrflagp, void *stuff)
1177{
1178	u_int32_t *tl;
1179	struct nfsrv_descript nfsd, *nd = &nfsd;
1180	struct nfsmount *nmp;
1181	struct nfsnode *np;
1182	struct nfsfh *nfhp;
1183	nfsattrbit_t attrbits;
1184	int error = 0, lookupp = 0;
1185
1186	*attrflagp = 0;
1187	*dattrflagp = 0;
1188	if (vnode_vtype(dvp) != VDIR)
1189		return (ENOTDIR);
1190	nmp = VFSTONFS(vnode_mount(dvp));
1191	if (len > NFS_MAXNAMLEN)
1192		return (ENAMETOOLONG);
1193	if (NFSHASNFSV4(nmp) && len == 1 &&
1194		name[0] == '.') {
1195		/*
1196		 * Just return the current dir's fh.
1197		 */
1198		np = VTONFS(dvp);
1199		MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1200			np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1201		nfhp->nfh_len = np->n_fhp->nfh_len;
1202		NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1203		*nfhpp = nfhp;
1204		return (0);
1205	}
1206	if (NFSHASNFSV4(nmp) && len == 2 &&
1207		name[0] == '.' && name[1] == '.') {
1208		lookupp = 1;
1209		NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, dvp);
1210	} else {
1211		NFSCL_REQSTART(nd, NFSPROC_LOOKUP, dvp);
1212		(void) nfsm_strtom(nd, name, len);
1213	}
1214	if (nd->nd_flag & ND_NFSV4) {
1215		NFSGETATTR_ATTRBIT(&attrbits);
1216		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1217		*tl++ = txdr_unsigned(NFSV4OP_GETFH);
1218		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1219		(void) nfsrv_putattrbit(nd, &attrbits);
1220	}
1221	error = nfscl_request(nd, dvp, p, cred, stuff);
1222	if (error)
1223		return (error);
1224	if (nd->nd_repstat) {
1225		/*
1226		 * When an NFSv4 Lookupp returns ENOENT, it means that
1227		 * the lookup is at the root of an fs, so return this dir.
1228		 */
1229		if (nd->nd_repstat == NFSERR_NOENT && lookupp) {
1230		    np = VTONFS(dvp);
1231		    MALLOC(nfhp, struct nfsfh *, sizeof (struct nfsfh) +
1232			np->n_fhp->nfh_len, M_NFSFH, M_WAITOK);
1233		    nfhp->nfh_len = np->n_fhp->nfh_len;
1234		    NFSBCOPY(np->n_fhp->nfh_fh, nfhp->nfh_fh, nfhp->nfh_len);
1235		    *nfhpp = nfhp;
1236		    mbuf_freem(nd->nd_mrep);
1237		    return (0);
1238		}
1239		if (nd->nd_flag & ND_NFSV3)
1240		    error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1241		goto nfsmout;
1242	}
1243	if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
1244		NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1245		if (*(tl + 1)) {
1246			nd->nd_flag |= ND_NOMOREDATA;
1247			goto nfsmout;
1248		}
1249	}
1250	error = nfsm_getfh(nd, nfhpp);
1251	if (error)
1252		goto nfsmout;
1253
1254	error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1255	if ((nd->nd_flag & ND_NFSV3) && !error)
1256		error = nfscl_postop_attr(nd, dnap, dattrflagp, stuff);
1257nfsmout:
1258	mbuf_freem(nd->nd_mrep);
1259	if (!error && nd->nd_repstat)
1260		error = nd->nd_repstat;
1261	return (error);
1262}
1263
1264/*
1265 * Do a readlink rpc.
1266 */
1267APPLESTATIC int
1268nfsrpc_readlink(vnode_t vp, struct uio *uiop, struct ucred *cred,
1269    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1270{
1271	u_int32_t *tl;
1272	struct nfsrv_descript nfsd, *nd = &nfsd;
1273	struct nfsnode *np = VTONFS(vp);
1274	nfsattrbit_t attrbits;
1275	int error, len, cangetattr = 1;
1276
1277	*attrflagp = 0;
1278	NFSCL_REQSTART(nd, NFSPROC_READLINK, vp);
1279	if (nd->nd_flag & ND_NFSV4) {
1280		/*
1281		 * And do a Getattr op.
1282		 */
1283		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1284		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1285		NFSGETATTR_ATTRBIT(&attrbits);
1286		(void) nfsrv_putattrbit(nd, &attrbits);
1287	}
1288	error = nfscl_request(nd, vp, p, cred, stuff);
1289	if (error)
1290		return (error);
1291	if (nd->nd_flag & ND_NFSV3)
1292		error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1293	if (!nd->nd_repstat && !error) {
1294		NFSM_STRSIZ(len, NFS_MAXPATHLEN);
1295		/*
1296		 * This seems weird to me, but must have been added to
1297		 * FreeBSD for some reason. The only thing I can think of
1298		 * is that there was/is some server that replies with
1299		 * more link data than it should?
1300		 */
1301		if (len == NFS_MAXPATHLEN) {
1302			NFSLOCKNODE(np);
1303			if (np->n_size > 0 && np->n_size < NFS_MAXPATHLEN) {
1304				len = np->n_size;
1305				cangetattr = 0;
1306			}
1307			NFSUNLOCKNODE(np);
1308		}
1309		error = nfsm_mbufuio(nd, uiop, len);
1310		if ((nd->nd_flag & ND_NFSV4) && !error && cangetattr)
1311			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1312	}
1313	if (nd->nd_repstat && !error)
1314		error = nd->nd_repstat;
1315nfsmout:
1316	mbuf_freem(nd->nd_mrep);
1317	return (error);
1318}
1319
1320/*
1321 * Read operation.
1322 */
1323APPLESTATIC int
1324nfsrpc_read(vnode_t vp, struct uio *uiop, struct ucred *cred,
1325    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1326{
1327	int error, expireret = 0, retrycnt;
1328	u_int32_t clidrev = 0;
1329	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1330	struct nfsnode *np = VTONFS(vp);
1331	struct ucred *newcred;
1332	struct nfsfh *nfhp = NULL;
1333	nfsv4stateid_t stateid;
1334	void *lckp;
1335
1336	if (nmp->nm_clp != NULL)
1337		clidrev = nmp->nm_clp->nfsc_clientidrev;
1338	newcred = cred;
1339	if (NFSHASNFSV4(nmp)) {
1340		nfhp = np->n_fhp;
1341		newcred = NFSNEWCRED(cred);
1342	}
1343	retrycnt = 0;
1344	do {
1345		lckp = NULL;
1346		if (NFSHASNFSV4(nmp))
1347			(void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1348			    NFSV4OPEN_ACCESSREAD, 0, newcred, p, &stateid,
1349			    &lckp);
1350		error = nfsrpc_readrpc(vp, uiop, newcred, &stateid, p, nap,
1351		    attrflagp, stuff);
1352		if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1353			nfscl_initiate_recovery(nmp->nm_clp);
1354		if (lckp != NULL)
1355			nfscl_lockderef(lckp);
1356		if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1357		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1358		    error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1359			(void) nfs_catnap(PZERO, error, "nfs_read");
1360		} else if ((error == NFSERR_EXPIRED ||
1361		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1362			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1363		}
1364		retrycnt++;
1365	} while (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1366	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1367	    error == NFSERR_BADSESSION ||
1368	    (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1369	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1370	     expireret == 0 && clidrev != 0 && retrycnt < 4));
1371	if (error && retrycnt >= 4)
1372		error = EIO;
1373	if (NFSHASNFSV4(nmp))
1374		NFSFREECRED(newcred);
1375	return (error);
1376}
1377
1378/*
1379 * The actual read RPC.
1380 */
1381static int
1382nfsrpc_readrpc(vnode_t vp, struct uio *uiop, struct ucred *cred,
1383    nfsv4stateid_t *stateidp, NFSPROC_T *p, struct nfsvattr *nap,
1384    int *attrflagp, void *stuff)
1385{
1386	u_int32_t *tl;
1387	int error = 0, len, retlen, tsiz, eof = 0;
1388	struct nfsrv_descript nfsd;
1389	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1390	struct nfsrv_descript *nd = &nfsd;
1391	int rsize;
1392	off_t tmp_off;
1393
1394	*attrflagp = 0;
1395	tsiz = uio_uio_resid(uiop);
1396	tmp_off = uiop->uio_offset + tsiz;
1397	NFSLOCKMNT(nmp);
1398	if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1399		NFSUNLOCKMNT(nmp);
1400		return (EFBIG);
1401	}
1402	rsize = nmp->nm_rsize;
1403	NFSUNLOCKMNT(nmp);
1404	nd->nd_mrep = NULL;
1405	while (tsiz > 0) {
1406		*attrflagp = 0;
1407		len = (tsiz > rsize) ? rsize : tsiz;
1408		NFSCL_REQSTART(nd, NFSPROC_READ, vp);
1409		if (nd->nd_flag & ND_NFSV4)
1410			nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1411		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED * 3);
1412		if (nd->nd_flag & ND_NFSV2) {
1413			*tl++ = txdr_unsigned(uiop->uio_offset);
1414			*tl++ = txdr_unsigned(len);
1415			*tl = 0;
1416		} else {
1417			txdr_hyper(uiop->uio_offset, tl);
1418			*(tl + 2) = txdr_unsigned(len);
1419		}
1420		/*
1421		 * Since I can't do a Getattr for NFSv4 for Write, there
1422		 * doesn't seem any point in doing one here, either.
1423		 * (See the comment in nfsrpc_writerpc() for more info.)
1424		 */
1425		error = nfscl_request(nd, vp, p, cred, stuff);
1426		if (error)
1427			return (error);
1428		if (nd->nd_flag & ND_NFSV3) {
1429			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
1430		} else if (!nd->nd_repstat && (nd->nd_flag & ND_NFSV2)) {
1431			error = nfsm_loadattr(nd, nap);
1432			if (!error)
1433				*attrflagp = 1;
1434		}
1435		if (nd->nd_repstat || error) {
1436			if (!error)
1437				error = nd->nd_repstat;
1438			goto nfsmout;
1439		}
1440		if (nd->nd_flag & ND_NFSV3) {
1441			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1442			eof = fxdr_unsigned(int, *(tl + 1));
1443		} else if (nd->nd_flag & ND_NFSV4) {
1444			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
1445			eof = fxdr_unsigned(int, *tl);
1446		}
1447		NFSM_STRSIZ(retlen, len);
1448		error = nfsm_mbufuio(nd, uiop, retlen);
1449		if (error)
1450			goto nfsmout;
1451		mbuf_freem(nd->nd_mrep);
1452		nd->nd_mrep = NULL;
1453		tsiz -= retlen;
1454		if (!(nd->nd_flag & ND_NFSV2)) {
1455			if (eof || retlen == 0)
1456				tsiz = 0;
1457		} else if (retlen < len)
1458			tsiz = 0;
1459	}
1460	return (0);
1461nfsmout:
1462	if (nd->nd_mrep != NULL)
1463		mbuf_freem(nd->nd_mrep);
1464	return (error);
1465}
1466
1467/*
1468 * nfs write operation
1469 * When called_from_strategy != 0, it should return EIO for an error that
1470 * indicates recovery is in progress, so that the buffer will be left
1471 * dirty and be written back to the server later. If it loops around,
1472 * the recovery thread could get stuck waiting for the buffer and recovery
1473 * will then deadlock.
1474 */
1475APPLESTATIC int
1476nfsrpc_write(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
1477    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
1478    void *stuff, int called_from_strategy)
1479{
1480	int error, expireret = 0, retrycnt, nostateid;
1481	u_int32_t clidrev = 0;
1482	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1483	struct nfsnode *np = VTONFS(vp);
1484	struct ucred *newcred;
1485	struct nfsfh *nfhp = NULL;
1486	nfsv4stateid_t stateid;
1487	void *lckp;
1488
1489	*must_commit = 0;
1490	if (nmp->nm_clp != NULL)
1491		clidrev = nmp->nm_clp->nfsc_clientidrev;
1492	newcred = cred;
1493	if (NFSHASNFSV4(nmp)) {
1494		newcred = NFSNEWCRED(cred);
1495		nfhp = np->n_fhp;
1496	}
1497	retrycnt = 0;
1498	do {
1499		lckp = NULL;
1500		nostateid = 0;
1501		if (NFSHASNFSV4(nmp)) {
1502			(void)nfscl_getstateid(vp, nfhp->nfh_fh, nfhp->nfh_len,
1503			    NFSV4OPEN_ACCESSWRITE, 0, newcred, p, &stateid,
1504			    &lckp);
1505			if (stateid.other[0] == 0 && stateid.other[1] == 0 &&
1506			    stateid.other[2] == 0) {
1507				nostateid = 1;
1508				NFSCL_DEBUG(1, "stateid0 in write\n");
1509			}
1510		}
1511
1512		/*
1513		 * If there is no stateid for NFSv4, it means this is an
1514		 * extraneous write after close. Basically a poorly
1515		 * implemented buffer cache. Just don't do the write.
1516		 */
1517		if (nostateid)
1518			error = 0;
1519		else
1520			error = nfsrpc_writerpc(vp, uiop, iomode, must_commit,
1521			    newcred, &stateid, p, nap, attrflagp, stuff);
1522		if (error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION)
1523			nfscl_initiate_recovery(nmp->nm_clp);
1524		if (lckp != NULL)
1525			nfscl_lockderef(lckp);
1526		if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
1527		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1528		    error == NFSERR_OLDSTATEID || error == NFSERR_BADSESSION) {
1529			(void) nfs_catnap(PZERO, error, "nfs_write");
1530		} else if ((error == NFSERR_EXPIRED ||
1531		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1532			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1533		}
1534		retrycnt++;
1535	} while (error == NFSERR_GRACE || error == NFSERR_DELAY ||
1536	    ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1537	      error == NFSERR_STALEDONTRECOVER) && called_from_strategy == 0) ||
1538	    (error == NFSERR_OLDSTATEID && retrycnt < 20) ||
1539	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1540	     expireret == 0 && clidrev != 0 && retrycnt < 4));
1541	if (error != 0 && (retrycnt >= 4 ||
1542	    ((error == NFSERR_STALESTATEID || error == NFSERR_BADSESSION ||
1543	      error == NFSERR_STALEDONTRECOVER) && called_from_strategy != 0)))
1544		error = EIO;
1545	if (NFSHASNFSV4(nmp))
1546		NFSFREECRED(newcred);
1547	return (error);
1548}
1549
1550/*
1551 * The actual write RPC.
1552 */
1553static int
1554nfsrpc_writerpc(vnode_t vp, struct uio *uiop, int *iomode,
1555    int *must_commit, struct ucred *cred, nfsv4stateid_t *stateidp,
1556    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
1557{
1558	u_int32_t *tl;
1559	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
1560	struct nfsnode *np = VTONFS(vp);
1561	int error = 0, len, tsiz, rlen, commit, committed = NFSWRITE_FILESYNC;
1562	int wccflag = 0, wsize;
1563	int32_t backup;
1564	struct nfsrv_descript nfsd;
1565	struct nfsrv_descript *nd = &nfsd;
1566	nfsattrbit_t attrbits;
1567	off_t tmp_off;
1568
1569	KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
1570	*attrflagp = 0;
1571	tsiz = uio_uio_resid(uiop);
1572	tmp_off = uiop->uio_offset + tsiz;
1573	NFSLOCKMNT(nmp);
1574	if (tmp_off > nmp->nm_maxfilesize || tmp_off < uiop->uio_offset) {
1575		NFSUNLOCKMNT(nmp);
1576		return (EFBIG);
1577	}
1578	wsize = nmp->nm_wsize;
1579	NFSUNLOCKMNT(nmp);
1580	nd->nd_mrep = NULL;	/* NFSv2 sometimes does a write with */
1581	nd->nd_repstat = 0;	/* uio_resid == 0, so the while is not done */
1582	while (tsiz > 0) {
1583		*attrflagp = 0;
1584		len = (tsiz > wsize) ? wsize : tsiz;
1585		NFSCL_REQSTART(nd, NFSPROC_WRITE, vp);
1586		if (nd->nd_flag & ND_NFSV4) {
1587			nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
1588			NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+2*NFSX_UNSIGNED);
1589			txdr_hyper(uiop->uio_offset, tl);
1590			tl += 2;
1591			*tl++ = txdr_unsigned(*iomode);
1592			*tl = txdr_unsigned(len);
1593		} else if (nd->nd_flag & ND_NFSV3) {
1594			NFSM_BUILD(tl, u_int32_t *, NFSX_HYPER+3*NFSX_UNSIGNED);
1595			txdr_hyper(uiop->uio_offset, tl);
1596			tl += 2;
1597			*tl++ = txdr_unsigned(len);
1598			*tl++ = txdr_unsigned(*iomode);
1599			*tl = txdr_unsigned(len);
1600		} else {
1601			u_int32_t x;
1602
1603			NFSM_BUILD(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
1604			/*
1605			 * Not sure why someone changed this, since the
1606			 * RFC clearly states that "beginoffset" and
1607			 * "totalcount" are ignored, but it wouldn't
1608			 * surprise me if there's a busted server out there.
1609			 */
1610			/* Set both "begin" and "current" to non-garbage. */
1611			x = txdr_unsigned((u_int32_t)uiop->uio_offset);
1612			*tl++ = x;      /* "begin offset" */
1613			*tl++ = x;      /* "current offset" */
1614			x = txdr_unsigned(len);
1615			*tl++ = x;      /* total to this offset */
1616			*tl = x;        /* size of this write */
1617
1618		}
1619		nfsm_uiombuf(nd, uiop, len);
1620		/*
1621		 * Although it is tempting to do a normal Getattr Op in the
1622		 * NFSv4 compound, the result can be a nearly hung client
1623		 * system if the Getattr asks for Owner and/or OwnerGroup.
1624		 * It occurs when the client can't map either the Owner or
1625		 * Owner_group name in the Getattr reply to a uid/gid. When
1626		 * there is a cache miss, the kernel does an upcall to the
1627		 * nfsuserd. Then, it can try and read the local /etc/passwd
1628		 * or /etc/group file. It can then block in getnewbuf(),
1629		 * waiting for dirty writes to be pushed to the NFS server.
1630		 * The only reason this doesn't result in a complete
1631		 * deadlock, is that the upcall times out and allows
1632		 * the write to complete. However, progress is so slow
1633		 * that it might just as well be deadlocked.
1634		 * As such, we get the rest of the attributes, but not
1635		 * Owner or Owner_group.
1636		 * nb: nfscl_loadattrcache() needs to be told that these
1637		 *     partial attributes from a write rpc are being
1638		 *     passed in, via a argument flag.
1639		 */
1640		if (nd->nd_flag & ND_NFSV4) {
1641			NFSWRITEGETATTR_ATTRBIT(&attrbits);
1642			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1643			*tl = txdr_unsigned(NFSV4OP_GETATTR);
1644			(void) nfsrv_putattrbit(nd, &attrbits);
1645		}
1646		error = nfscl_request(nd, vp, p, cred, stuff);
1647		if (error)
1648			return (error);
1649		if (nd->nd_repstat) {
1650			/*
1651			 * In case the rpc gets retried, roll
1652			 * the uio fileds changed by nfsm_uiombuf()
1653			 * back.
1654			 */
1655			uiop->uio_offset -= len;
1656			uio_uio_resid_add(uiop, len);
1657			uio_iov_base_add(uiop, -len);
1658			uio_iov_len_add(uiop, len);
1659		}
1660		if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1661			error = nfscl_wcc_data(nd, vp, nap, attrflagp,
1662			    &wccflag, stuff);
1663			if (error)
1664				goto nfsmout;
1665		}
1666		if (!nd->nd_repstat) {
1667			if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
1668				NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED
1669					+ NFSX_VERF);
1670				rlen = fxdr_unsigned(int, *tl++);
1671				if (rlen == 0) {
1672					error = NFSERR_IO;
1673					goto nfsmout;
1674				} else if (rlen < len) {
1675					backup = len - rlen;
1676					uio_iov_base_add(uiop, -(backup));
1677					uio_iov_len_add(uiop, backup);
1678					uiop->uio_offset -= backup;
1679					uio_uio_resid_add(uiop, backup);
1680					len = rlen;
1681				}
1682				commit = fxdr_unsigned(int, *tl++);
1683
1684				/*
1685				 * Return the lowest committment level
1686				 * obtained by any of the RPCs.
1687				 */
1688				if (committed == NFSWRITE_FILESYNC)
1689					committed = commit;
1690				else if (committed == NFSWRITE_DATASYNC &&
1691					commit == NFSWRITE_UNSTABLE)
1692					committed = commit;
1693				NFSLOCKMNT(nmp);
1694				if (!NFSHASWRITEVERF(nmp)) {
1695					NFSBCOPY((caddr_t)tl,
1696					    (caddr_t)&nmp->nm_verf[0],
1697					    NFSX_VERF);
1698					NFSSETWRITEVERF(nmp);
1699	    			} else if (NFSBCMP(tl, nmp->nm_verf,
1700				    NFSX_VERF)) {
1701					*must_commit = 1;
1702					NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
1703				}
1704				NFSUNLOCKMNT(nmp);
1705			}
1706			if (nd->nd_flag & ND_NFSV4)
1707				NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1708			if (nd->nd_flag & (ND_NFSV2 | ND_NFSV4)) {
1709				error = nfsm_loadattr(nd, nap);
1710				if (!error)
1711					*attrflagp = NFS_LATTR_NOSHRINK;
1712			}
1713		} else {
1714			error = nd->nd_repstat;
1715		}
1716		if (error)
1717			goto nfsmout;
1718		NFSWRITERPC_SETTIME(wccflag, np, (nd->nd_flag & ND_NFSV4));
1719		mbuf_freem(nd->nd_mrep);
1720		nd->nd_mrep = NULL;
1721		tsiz -= len;
1722	}
1723nfsmout:
1724	if (nd->nd_mrep != NULL)
1725		mbuf_freem(nd->nd_mrep);
1726	*iomode = committed;
1727	if (nd->nd_repstat && !error)
1728		error = nd->nd_repstat;
1729	return (error);
1730}
1731
1732/*
1733 * nfs mknod rpc
1734 * For NFS v2 this is a kludge. Use a create rpc but with the IFMT bits of the
1735 * mode set to specify the file type and the size field for rdev.
1736 */
1737APPLESTATIC int
1738nfsrpc_mknod(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1739    u_int32_t rdev, enum vtype vtyp, struct ucred *cred, NFSPROC_T *p,
1740    struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1741    int *attrflagp, int *dattrflagp, void *dstuff)
1742{
1743	u_int32_t *tl;
1744	int error = 0;
1745	struct nfsrv_descript nfsd, *nd = &nfsd;
1746	nfsattrbit_t attrbits;
1747
1748	*nfhpp = NULL;
1749	*attrflagp = 0;
1750	*dattrflagp = 0;
1751	if (namelen > NFS_MAXNAMLEN)
1752		return (ENAMETOOLONG);
1753	NFSCL_REQSTART(nd, NFSPROC_MKNOD, dvp);
1754	if (nd->nd_flag & ND_NFSV4) {
1755		if (vtyp == VBLK || vtyp == VCHR) {
1756			NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
1757			*tl++ = vtonfsv34_type(vtyp);
1758			*tl++ = txdr_unsigned(NFSMAJOR(rdev));
1759			*tl = txdr_unsigned(NFSMINOR(rdev));
1760		} else {
1761			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1762			*tl = vtonfsv34_type(vtyp);
1763		}
1764	}
1765	(void) nfsm_strtom(nd, name, namelen);
1766	if (nd->nd_flag & ND_NFSV3) {
1767		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1768		*tl = vtonfsv34_type(vtyp);
1769	}
1770	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
1771		nfscl_fillsattr(nd, vap, dvp, 0, 0);
1772	if ((nd->nd_flag & ND_NFSV3) &&
1773	    (vtyp == VCHR || vtyp == VBLK)) {
1774		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1775		*tl++ = txdr_unsigned(NFSMAJOR(rdev));
1776		*tl = txdr_unsigned(NFSMINOR(rdev));
1777	}
1778	if (nd->nd_flag & ND_NFSV4) {
1779		NFSGETATTR_ATTRBIT(&attrbits);
1780		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1781		*tl++ = txdr_unsigned(NFSV4OP_GETFH);
1782		*tl = txdr_unsigned(NFSV4OP_GETATTR);
1783		(void) nfsrv_putattrbit(nd, &attrbits);
1784	}
1785	if (nd->nd_flag & ND_NFSV2)
1786		nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZERDEV, rdev);
1787	error = nfscl_request(nd, dvp, p, cred, dstuff);
1788	if (error)
1789		return (error);
1790	if (nd->nd_flag & ND_NFSV4)
1791		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1792	if (!nd->nd_repstat) {
1793		if (nd->nd_flag & ND_NFSV4) {
1794			NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
1795			error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
1796			if (error)
1797				goto nfsmout;
1798		}
1799		error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1800		if (error)
1801			goto nfsmout;
1802	}
1803	if (nd->nd_flag & ND_NFSV3)
1804		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1805	if (!error && nd->nd_repstat)
1806		error = nd->nd_repstat;
1807nfsmout:
1808	mbuf_freem(nd->nd_mrep);
1809	return (error);
1810}
1811
1812/*
1813 * nfs file create call
1814 * Mostly just call the approriate routine. (I separated out v4, so that
1815 * error recovery wouldn't be as difficult.)
1816 */
1817APPLESTATIC int
1818nfsrpc_create(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1819    nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1820    struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1821    int *attrflagp, int *dattrflagp, void *dstuff)
1822{
1823	int error = 0, newone, expireret = 0, retrycnt, unlocked;
1824	struct nfsclowner *owp;
1825	struct nfscldeleg *dp;
1826	struct nfsmount *nmp = VFSTONFS(vnode_mount(dvp));
1827	u_int32_t clidrev;
1828
1829	if (NFSHASNFSV4(nmp)) {
1830	    retrycnt = 0;
1831	    do {
1832		dp = NULL;
1833		error = nfscl_open(dvp, NULL, 0, (NFSV4OPEN_ACCESSWRITE |
1834		    NFSV4OPEN_ACCESSREAD), 0, cred, p, &owp, NULL, &newone,
1835		    NULL, 1);
1836		if (error)
1837			return (error);
1838		if (nmp->nm_clp != NULL)
1839			clidrev = nmp->nm_clp->nfsc_clientidrev;
1840		else
1841			clidrev = 0;
1842		error = nfsrpc_createv4(dvp, name, namelen, vap, cverf, fmode,
1843		  owp, &dp, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1844		  dstuff, &unlocked);
1845		/*
1846		 * There is no need to invalidate cached attributes here,
1847		 * since new post-delegation issue attributes are always
1848		 * returned by nfsrpc_createv4() and these will update the
1849		 * attribute cache.
1850		 */
1851		if (dp != NULL)
1852			(void) nfscl_deleg(nmp->nm_mountp, owp->nfsow_clp,
1853			    (*nfhpp)->nfh_fh, (*nfhpp)->nfh_len, cred, p, &dp);
1854		nfscl_ownerrelease(owp, error, newone, unlocked);
1855		if (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1856		    error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1857		    error == NFSERR_BADSESSION) {
1858			(void) nfs_catnap(PZERO, error, "nfs_open");
1859		} else if ((error == NFSERR_EXPIRED ||
1860		    error == NFSERR_BADSTATEID) && clidrev != 0) {
1861			expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
1862			retrycnt++;
1863		}
1864	    } while (error == NFSERR_GRACE || error == NFSERR_STALECLIENTID ||
1865		error == NFSERR_STALEDONTRECOVER || error == NFSERR_DELAY ||
1866		error == NFSERR_BADSESSION ||
1867		((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
1868		 expireret == 0 && clidrev != 0 && retrycnt < 4));
1869	    if (error && retrycnt >= 4)
1870		    error = EIO;
1871	} else {
1872		error = nfsrpc_createv23(dvp, name, namelen, vap, cverf,
1873		    fmode, cred, p, dnap, nnap, nfhpp, attrflagp, dattrflagp,
1874		    dstuff);
1875	}
1876	return (error);
1877}
1878
1879/*
1880 * The create rpc for v2 and 3.
1881 */
1882static int
1883nfsrpc_createv23(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1884    nfsquad_t cverf, int fmode, struct ucred *cred, NFSPROC_T *p,
1885    struct nfsvattr *dnap, struct nfsvattr *nnap, struct nfsfh **nfhpp,
1886    int *attrflagp, int *dattrflagp, void *dstuff)
1887{
1888	u_int32_t *tl;
1889	int error = 0;
1890	struct nfsrv_descript nfsd, *nd = &nfsd;
1891
1892	*nfhpp = NULL;
1893	*attrflagp = 0;
1894	*dattrflagp = 0;
1895	if (namelen > NFS_MAXNAMLEN)
1896		return (ENAMETOOLONG);
1897	NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
1898	(void) nfsm_strtom(nd, name, namelen);
1899	if (nd->nd_flag & ND_NFSV3) {
1900		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1901		if (fmode & O_EXCL) {
1902			*tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
1903			NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1904			*tl++ = cverf.lval[0];
1905			*tl = cverf.lval[1];
1906		} else {
1907			*tl = txdr_unsigned(NFSCREATE_UNCHECKED);
1908			nfscl_fillsattr(nd, vap, dvp, 0, 0);
1909		}
1910	} else {
1911		nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZE0, 0);
1912	}
1913	error = nfscl_request(nd, dvp, p, cred, dstuff);
1914	if (error)
1915		return (error);
1916	if (nd->nd_repstat == 0) {
1917		error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
1918		if (error)
1919			goto nfsmout;
1920	}
1921	if (nd->nd_flag & ND_NFSV3)
1922		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
1923	if (nd->nd_repstat != 0 && error == 0)
1924		error = nd->nd_repstat;
1925nfsmout:
1926	mbuf_freem(nd->nd_mrep);
1927	return (error);
1928}
1929
1930static int
1931nfsrpc_createv4(vnode_t dvp, char *name, int namelen, struct vattr *vap,
1932    nfsquad_t cverf, int fmode, struct nfsclowner *owp, struct nfscldeleg **dpp,
1933    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
1934    struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
1935    int *dattrflagp, void *dstuff, int *unlockedp)
1936{
1937	u_int32_t *tl;
1938	int error = 0, deleg, newone, ret, acesize, limitby;
1939	struct nfsrv_descript nfsd, *nd = &nfsd;
1940	struct nfsclopen *op;
1941	struct nfscldeleg *dp = NULL;
1942	struct nfsnode *np;
1943	struct nfsfh *nfhp;
1944	nfsattrbit_t attrbits;
1945	nfsv4stateid_t stateid;
1946	u_int32_t rflags;
1947	struct nfsmount *nmp;
1948
1949	nmp = VFSTONFS(dvp->v_mount);
1950	*unlockedp = 0;
1951	*nfhpp = NULL;
1952	*dpp = NULL;
1953	*attrflagp = 0;
1954	*dattrflagp = 0;
1955	if (namelen > NFS_MAXNAMLEN)
1956		return (ENAMETOOLONG);
1957	NFSCL_REQSTART(nd, NFSPROC_CREATE, dvp);
1958	/*
1959	 * For V4, this is actually an Open op.
1960	 */
1961	NFSM_BUILD(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
1962	*tl++ = txdr_unsigned(owp->nfsow_seqid);
1963	*tl++ = txdr_unsigned(NFSV4OPEN_ACCESSWRITE |
1964	    NFSV4OPEN_ACCESSREAD);
1965	*tl++ = txdr_unsigned(NFSV4OPEN_DENYNONE);
1966	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
1967	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
1968	(void) nfsm_strtom(nd, owp->nfsow_owner, NFSV4CL_LOCKNAMELEN);
1969	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
1970	*tl++ = txdr_unsigned(NFSV4OPEN_CREATE);
1971	if (fmode & O_EXCL) {
1972		if (NFSHASNFSV4N(nmp)) {
1973			if (NFSHASSESSPERSIST(nmp)) {
1974				/* Use GUARDED for persistent sessions. */
1975				*tl = txdr_unsigned(NFSCREATE_GUARDED);
1976				nfscl_fillsattr(nd, vap, dvp, 0, 0);
1977			} else {
1978				/* Otherwise, use EXCLUSIVE4_1. */
1979				*tl = txdr_unsigned(NFSCREATE_EXCLUSIVE41);
1980				NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1981				*tl++ = cverf.lval[0];
1982				*tl = cverf.lval[1];
1983				nfscl_fillsattr(nd, vap, dvp, 0, 0);
1984			}
1985		} else {
1986			/* NFSv4.0 */
1987			*tl = txdr_unsigned(NFSCREATE_EXCLUSIVE);
1988			NFSM_BUILD(tl, u_int32_t *, NFSX_VERF);
1989			*tl++ = cverf.lval[0];
1990			*tl = cverf.lval[1];
1991		}
1992	} else {
1993		*tl = txdr_unsigned(NFSCREATE_UNCHECKED);
1994		nfscl_fillsattr(nd, vap, dvp, 0, 0);
1995	}
1996	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
1997	*tl = txdr_unsigned(NFSV4OPEN_CLAIMNULL);
1998	(void) nfsm_strtom(nd, name, namelen);
1999	NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2000	*tl++ = txdr_unsigned(NFSV4OP_GETFH);
2001	*tl = txdr_unsigned(NFSV4OP_GETATTR);
2002	NFSGETATTR_ATTRBIT(&attrbits);
2003	(void) nfsrv_putattrbit(nd, &attrbits);
2004	error = nfscl_request(nd, dvp, p, cred, dstuff);
2005	if (error)
2006		return (error);
2007	error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2008	if (error)
2009		goto nfsmout;
2010	NFSCL_INCRSEQID(owp->nfsow_seqid, nd);
2011	if (nd->nd_repstat == 0) {
2012		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
2013		    6 * NFSX_UNSIGNED);
2014		stateid.seqid = *tl++;
2015		stateid.other[0] = *tl++;
2016		stateid.other[1] = *tl++;
2017		stateid.other[2] = *tl;
2018		rflags = fxdr_unsigned(u_int32_t, *(tl + 6));
2019		(void) nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2020		NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2021		deleg = fxdr_unsigned(int, *tl);
2022		if (deleg == NFSV4OPEN_DELEGATEREAD ||
2023		    deleg == NFSV4OPEN_DELEGATEWRITE) {
2024			if (!(owp->nfsow_clp->nfsc_flags &
2025			      NFSCLFLAGS_FIRSTDELEG))
2026				owp->nfsow_clp->nfsc_flags |=
2027				  (NFSCLFLAGS_FIRSTDELEG | NFSCLFLAGS_GOTDELEG);
2028			MALLOC(dp, struct nfscldeleg *,
2029			    sizeof (struct nfscldeleg) + NFSX_V4FHMAX,
2030			    M_NFSCLDELEG, M_WAITOK);
2031			LIST_INIT(&dp->nfsdl_owner);
2032			LIST_INIT(&dp->nfsdl_lock);
2033			dp->nfsdl_clp = owp->nfsow_clp;
2034			newnfs_copyincred(cred, &dp->nfsdl_cred);
2035			nfscl_lockinit(&dp->nfsdl_rwlock);
2036			NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID +
2037			    NFSX_UNSIGNED);
2038			dp->nfsdl_stateid.seqid = *tl++;
2039			dp->nfsdl_stateid.other[0] = *tl++;
2040			dp->nfsdl_stateid.other[1] = *tl++;
2041			dp->nfsdl_stateid.other[2] = *tl++;
2042			ret = fxdr_unsigned(int, *tl);
2043			if (deleg == NFSV4OPEN_DELEGATEWRITE) {
2044				dp->nfsdl_flags = NFSCLDL_WRITE;
2045				/*
2046				 * Indicates how much the file can grow.
2047				 */
2048				NFSM_DISSECT(tl, u_int32_t *,
2049				    3 * NFSX_UNSIGNED);
2050				limitby = fxdr_unsigned(int, *tl++);
2051				switch (limitby) {
2052				case NFSV4OPEN_LIMITSIZE:
2053					dp->nfsdl_sizelimit = fxdr_hyper(tl);
2054					break;
2055				case NFSV4OPEN_LIMITBLOCKS:
2056					dp->nfsdl_sizelimit =
2057					    fxdr_unsigned(u_int64_t, *tl++);
2058					dp->nfsdl_sizelimit *=
2059					    fxdr_unsigned(u_int64_t, *tl);
2060					break;
2061				default:
2062					error = NFSERR_BADXDR;
2063					goto nfsmout;
2064				};
2065			} else {
2066				dp->nfsdl_flags = NFSCLDL_READ;
2067			}
2068			if (ret)
2069				dp->nfsdl_flags |= NFSCLDL_RECALL;
2070			error = nfsrv_dissectace(nd, &dp->nfsdl_ace, &ret,
2071			    &acesize, p);
2072			if (error)
2073				goto nfsmout;
2074		} else if (deleg != NFSV4OPEN_DELEGATENONE) {
2075			error = NFSERR_BADXDR;
2076			goto nfsmout;
2077		}
2078		error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2079		if (error)
2080			goto nfsmout;
2081		if (dp != NULL && *attrflagp) {
2082			dp->nfsdl_change = nnap->na_filerev;
2083			dp->nfsdl_modtime = nnap->na_mtime;
2084			dp->nfsdl_flags |= NFSCLDL_MODTIMESET;
2085		}
2086		/*
2087		 * We can now complete the Open state.
2088		 */
2089		nfhp = *nfhpp;
2090		if (dp != NULL) {
2091			dp->nfsdl_fhlen = nfhp->nfh_len;
2092			NFSBCOPY(nfhp->nfh_fh, dp->nfsdl_fh, nfhp->nfh_len);
2093		}
2094		/*
2095		 * Get an Open structure that will be
2096		 * attached to the OpenOwner, acquired already.
2097		 */
2098		error = nfscl_open(dvp, nfhp->nfh_fh, nfhp->nfh_len,
2099		    (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), 0,
2100		    cred, p, NULL, &op, &newone, NULL, 0);
2101		if (error)
2102			goto nfsmout;
2103		op->nfso_stateid = stateid;
2104		newnfs_copyincred(cred, &op->nfso_cred);
2105		if ((rflags & NFSV4OPEN_RESULTCONFIRM)) {
2106		    do {
2107			ret = nfsrpc_openconfirm(dvp, nfhp->nfh_fh,
2108			    nfhp->nfh_len, op, cred, p);
2109			if (ret == NFSERR_DELAY)
2110			    (void) nfs_catnap(PZERO, ret, "nfs_create");
2111		    } while (ret == NFSERR_DELAY);
2112		    error = ret;
2113		}
2114
2115		/*
2116		 * If the server is handing out delegations, but we didn't
2117		 * get one because an OpenConfirm was required, try the
2118		 * Open again, to get a delegation. This is a harmless no-op,
2119		 * from a server's point of view.
2120		 */
2121		if ((rflags & NFSV4OPEN_RESULTCONFIRM) &&
2122		    (owp->nfsow_clp->nfsc_flags & NFSCLFLAGS_GOTDELEG) &&
2123		    !error && dp == NULL) {
2124		    np = VTONFS(dvp);
2125		    do {
2126			ret = nfsrpc_openrpc(VFSTONFS(vnode_mount(dvp)), dvp,
2127			    np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
2128			    nfhp->nfh_fh, nfhp->nfh_len,
2129			    (NFSV4OPEN_ACCESSWRITE | NFSV4OPEN_ACCESSREAD), op,
2130			    name, namelen, &dp, 0, 0x0, cred, p, 0, 1);
2131			if (ret == NFSERR_DELAY)
2132			    (void) nfs_catnap(PZERO, ret, "nfs_crt2");
2133		    } while (ret == NFSERR_DELAY);
2134		    if (ret) {
2135			if (dp != NULL)
2136				FREE((caddr_t)dp, M_NFSCLDELEG);
2137			if (ret == NFSERR_STALECLIENTID ||
2138			    ret == NFSERR_STALEDONTRECOVER ||
2139			    ret == NFSERR_BADSESSION)
2140				error = ret;
2141		    }
2142		}
2143		nfscl_openrelease(op, error, newone);
2144		*unlockedp = 1;
2145	}
2146	if (nd->nd_repstat != 0 && error == 0)
2147		error = nd->nd_repstat;
2148	if (error == NFSERR_STALECLIENTID || error == NFSERR_BADSESSION)
2149		nfscl_initiate_recovery(owp->nfsow_clp);
2150nfsmout:
2151	if (!error)
2152		*dpp = dp;
2153	else if (dp != NULL)
2154		FREE((caddr_t)dp, M_NFSCLDELEG);
2155	mbuf_freem(nd->nd_mrep);
2156	return (error);
2157}
2158
2159/*
2160 * Nfs remove rpc
2161 */
2162APPLESTATIC int
2163nfsrpc_remove(vnode_t dvp, char *name, int namelen, vnode_t vp,
2164    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp,
2165    void *dstuff)
2166{
2167	u_int32_t *tl;
2168	struct nfsrv_descript nfsd, *nd = &nfsd;
2169	struct nfsnode *np;
2170	struct nfsmount *nmp;
2171	nfsv4stateid_t dstateid;
2172	int error, ret = 0, i;
2173
2174	*dattrflagp = 0;
2175	if (namelen > NFS_MAXNAMLEN)
2176		return (ENAMETOOLONG);
2177	nmp = VFSTONFS(vnode_mount(dvp));
2178tryagain:
2179	if (NFSHASNFSV4(nmp) && ret == 0) {
2180		ret = nfscl_removedeleg(vp, p, &dstateid);
2181		if (ret == 1) {
2182			NFSCL_REQSTART(nd, NFSPROC_RETDELEGREMOVE, vp);
2183			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
2184			    NFSX_UNSIGNED);
2185			if (NFSHASNFSV4N(nmp))
2186				*tl++ = 0;
2187			else
2188				*tl++ = dstateid.seqid;
2189			*tl++ = dstateid.other[0];
2190			*tl++ = dstateid.other[1];
2191			*tl++ = dstateid.other[2];
2192			*tl = txdr_unsigned(NFSV4OP_PUTFH);
2193			np = VTONFS(dvp);
2194			(void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2195			    np->n_fhp->nfh_len, 0);
2196			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2197			*tl = txdr_unsigned(NFSV4OP_REMOVE);
2198		}
2199	} else {
2200		ret = 0;
2201	}
2202	if (ret == 0)
2203		NFSCL_REQSTART(nd, NFSPROC_REMOVE, dvp);
2204	(void) nfsm_strtom(nd, name, namelen);
2205	error = nfscl_request(nd, dvp, p, cred, dstuff);
2206	if (error)
2207		return (error);
2208	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2209		/* For NFSv4, parse out any Delereturn replies. */
2210		if (ret > 0 && nd->nd_repstat != 0 &&
2211		    (nd->nd_flag & ND_NOMOREDATA)) {
2212			/*
2213			 * If the Delegreturn failed, try again without
2214			 * it. The server will Recall, as required.
2215			 */
2216			mbuf_freem(nd->nd_mrep);
2217			goto tryagain;
2218		}
2219		for (i = 0; i < (ret * 2); i++) {
2220			if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2221			    ND_NFSV4) {
2222			    NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2223			    if (*(tl + 1))
2224				nd->nd_flag |= ND_NOMOREDATA;
2225			}
2226		}
2227		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2228	}
2229	if (nd->nd_repstat && !error)
2230		error = nd->nd_repstat;
2231nfsmout:
2232	mbuf_freem(nd->nd_mrep);
2233	return (error);
2234}
2235
2236/*
2237 * Do an nfs rename rpc.
2238 */
2239APPLESTATIC int
2240nfsrpc_rename(vnode_t fdvp, vnode_t fvp, char *fnameptr, int fnamelen,
2241    vnode_t tdvp, vnode_t tvp, char *tnameptr, int tnamelen, struct ucred *cred,
2242    NFSPROC_T *p, struct nfsvattr *fnap, struct nfsvattr *tnap,
2243    int *fattrflagp, int *tattrflagp, void *fstuff, void *tstuff)
2244{
2245	u_int32_t *tl;
2246	struct nfsrv_descript nfsd, *nd = &nfsd;
2247	struct nfsmount *nmp;
2248	struct nfsnode *np;
2249	nfsattrbit_t attrbits;
2250	nfsv4stateid_t fdstateid, tdstateid;
2251	int error = 0, ret = 0, gottd = 0, gotfd = 0, i;
2252
2253	*fattrflagp = 0;
2254	*tattrflagp = 0;
2255	nmp = VFSTONFS(vnode_mount(fdvp));
2256	if (fnamelen > NFS_MAXNAMLEN || tnamelen > NFS_MAXNAMLEN)
2257		return (ENAMETOOLONG);
2258tryagain:
2259	if (NFSHASNFSV4(nmp) && ret == 0) {
2260		ret = nfscl_renamedeleg(fvp, &fdstateid, &gotfd, tvp,
2261		    &tdstateid, &gottd, p);
2262		if (gotfd && gottd) {
2263			NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME2, fvp);
2264		} else if (gotfd) {
2265			NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, fvp);
2266		} else if (gottd) {
2267			NFSCL_REQSTART(nd, NFSPROC_RETDELEGRENAME1, tvp);
2268		}
2269		if (gotfd) {
2270			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2271			if (NFSHASNFSV4N(nmp))
2272				*tl++ = 0;
2273			else
2274				*tl++ = fdstateid.seqid;
2275			*tl++ = fdstateid.other[0];
2276			*tl++ = fdstateid.other[1];
2277			*tl = fdstateid.other[2];
2278			if (gottd) {
2279				NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2280				*tl = txdr_unsigned(NFSV4OP_PUTFH);
2281				np = VTONFS(tvp);
2282				(void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2283				    np->n_fhp->nfh_len, 0);
2284				NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2285				*tl = txdr_unsigned(NFSV4OP_DELEGRETURN);
2286			}
2287		}
2288		if (gottd) {
2289			NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
2290			if (NFSHASNFSV4N(nmp))
2291				*tl++ = 0;
2292			else
2293				*tl++ = tdstateid.seqid;
2294			*tl++ = tdstateid.other[0];
2295			*tl++ = tdstateid.other[1];
2296			*tl = tdstateid.other[2];
2297		}
2298		if (ret > 0) {
2299			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2300			*tl = txdr_unsigned(NFSV4OP_PUTFH);
2301			np = VTONFS(fdvp);
2302			(void) nfsm_fhtom(nd, np->n_fhp->nfh_fh,
2303			    np->n_fhp->nfh_len, 0);
2304			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2305			*tl = txdr_unsigned(NFSV4OP_SAVEFH);
2306		}
2307	} else {
2308		ret = 0;
2309	}
2310	if (ret == 0)
2311		NFSCL_REQSTART(nd, NFSPROC_RENAME, fdvp);
2312	if (nd->nd_flag & ND_NFSV4) {
2313		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2314		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2315		NFSWCCATTR_ATTRBIT(&attrbits);
2316		(void) nfsrv_putattrbit(nd, &attrbits);
2317		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2318		*tl = txdr_unsigned(NFSV4OP_PUTFH);
2319		(void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2320		    VTONFS(tdvp)->n_fhp->nfh_len, 0);
2321		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2322		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2323		(void) nfsrv_putattrbit(nd, &attrbits);
2324		nd->nd_flag |= ND_V4WCCATTR;
2325		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2326		*tl = txdr_unsigned(NFSV4OP_RENAME);
2327	}
2328	(void) nfsm_strtom(nd, fnameptr, fnamelen);
2329	if (!(nd->nd_flag & ND_NFSV4))
2330		(void) nfsm_fhtom(nd, VTONFS(tdvp)->n_fhp->nfh_fh,
2331			VTONFS(tdvp)->n_fhp->nfh_len, 0);
2332	(void) nfsm_strtom(nd, tnameptr, tnamelen);
2333	error = nfscl_request(nd, fdvp, p, cred, fstuff);
2334	if (error)
2335		return (error);
2336	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4)) {
2337		/* For NFSv4, parse out any Delereturn replies. */
2338		if (ret > 0 && nd->nd_repstat != 0 &&
2339		    (nd->nd_flag & ND_NOMOREDATA)) {
2340			/*
2341			 * If the Delegreturn failed, try again without
2342			 * it. The server will Recall, as required.
2343			 */
2344			mbuf_freem(nd->nd_mrep);
2345			goto tryagain;
2346		}
2347		for (i = 0; i < (ret * 2); i++) {
2348			if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) ==
2349			    ND_NFSV4) {
2350			    NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2351			    if (*(tl + 1)) {
2352				if (i == 0 && ret > 1) {
2353				    /*
2354				     * If the Delegreturn failed, try again
2355				     * without it. The server will Recall, as
2356				     * required.
2357				     * If ret > 1, the first iteration of this
2358				     * loop is the second DelegReturn result.
2359				     */
2360				    mbuf_freem(nd->nd_mrep);
2361				    goto tryagain;
2362				} else {
2363				    nd->nd_flag |= ND_NOMOREDATA;
2364				}
2365			    }
2366			}
2367		}
2368		/* Now, the first wcc attribute reply. */
2369		if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2370			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2371			if (*(tl + 1))
2372				nd->nd_flag |= ND_NOMOREDATA;
2373		}
2374		error = nfscl_wcc_data(nd, fdvp, fnap, fattrflagp, NULL,
2375		    fstuff);
2376		/* and the second wcc attribute reply. */
2377		if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4 &&
2378		    !error) {
2379			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2380			if (*(tl + 1))
2381				nd->nd_flag |= ND_NOMOREDATA;
2382		}
2383		if (!error)
2384			error = nfscl_wcc_data(nd, tdvp, tnap, tattrflagp,
2385			    NULL, tstuff);
2386	}
2387	if (nd->nd_repstat && !error)
2388		error = nd->nd_repstat;
2389nfsmout:
2390	mbuf_freem(nd->nd_mrep);
2391	return (error);
2392}
2393
2394/*
2395 * nfs hard link create rpc
2396 */
2397APPLESTATIC int
2398nfsrpc_link(vnode_t dvp, vnode_t vp, char *name, int namelen,
2399    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2400    struct nfsvattr *nap, int *attrflagp, int *dattrflagp, void *dstuff)
2401{
2402	u_int32_t *tl;
2403	struct nfsrv_descript nfsd, *nd = &nfsd;
2404	nfsattrbit_t attrbits;
2405	int error = 0;
2406
2407	*attrflagp = 0;
2408	*dattrflagp = 0;
2409	if (namelen > NFS_MAXNAMLEN)
2410		return (ENAMETOOLONG);
2411	NFSCL_REQSTART(nd, NFSPROC_LINK, vp);
2412	if (nd->nd_flag & ND_NFSV4) {
2413		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2414		*tl = txdr_unsigned(NFSV4OP_PUTFH);
2415	}
2416	(void) nfsm_fhtom(nd, VTONFS(dvp)->n_fhp->nfh_fh,
2417		VTONFS(dvp)->n_fhp->nfh_len, 0);
2418	if (nd->nd_flag & ND_NFSV4) {
2419		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2420		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2421		NFSWCCATTR_ATTRBIT(&attrbits);
2422		(void) nfsrv_putattrbit(nd, &attrbits);
2423		nd->nd_flag |= ND_V4WCCATTR;
2424		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2425		*tl = txdr_unsigned(NFSV4OP_LINK);
2426	}
2427	(void) nfsm_strtom(nd, name, namelen);
2428	error = nfscl_request(nd, vp, p, cred, dstuff);
2429	if (error)
2430		return (error);
2431	if (nd->nd_flag & ND_NFSV3) {
2432		error = nfscl_postop_attr(nd, nap, attrflagp, dstuff);
2433		if (!error)
2434			error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
2435			    NULL, dstuff);
2436	} else if ((nd->nd_flag & (ND_NFSV4 | ND_NOMOREDATA)) == ND_NFSV4) {
2437		/*
2438		 * First, parse out the PutFH and Getattr result.
2439		 */
2440		NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2441		if (!(*(tl + 1)))
2442			NFSM_DISSECT(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2443		if (*(tl + 1))
2444			nd->nd_flag |= ND_NOMOREDATA;
2445		/*
2446		 * Get the pre-op attributes.
2447		 */
2448		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2449	}
2450	if (nd->nd_repstat && !error)
2451		error = nd->nd_repstat;
2452nfsmout:
2453	mbuf_freem(nd->nd_mrep);
2454	return (error);
2455}
2456
2457/*
2458 * nfs symbolic link create rpc
2459 */
2460APPLESTATIC int
2461nfsrpc_symlink(vnode_t dvp, char *name, int namelen, char *target,
2462    struct vattr *vap, struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2463    struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2464    int *dattrflagp, void *dstuff)
2465{
2466	u_int32_t *tl;
2467	struct nfsrv_descript nfsd, *nd = &nfsd;
2468	struct nfsmount *nmp;
2469	int slen, error = 0;
2470
2471	*nfhpp = NULL;
2472	*attrflagp = 0;
2473	*dattrflagp = 0;
2474	nmp = VFSTONFS(vnode_mount(dvp));
2475	slen = strlen(target);
2476	if (slen > NFS_MAXPATHLEN || namelen > NFS_MAXNAMLEN)
2477		return (ENAMETOOLONG);
2478	NFSCL_REQSTART(nd, NFSPROC_SYMLINK, dvp);
2479	if (nd->nd_flag & ND_NFSV4) {
2480		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2481		*tl = txdr_unsigned(NFLNK);
2482		(void) nfsm_strtom(nd, target, slen);
2483	}
2484	(void) nfsm_strtom(nd, name, namelen);
2485	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2486		nfscl_fillsattr(nd, vap, dvp, 0, 0);
2487	if (!(nd->nd_flag & ND_NFSV4))
2488		(void) nfsm_strtom(nd, target, slen);
2489	if (nd->nd_flag & ND_NFSV2)
2490		nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
2491	error = nfscl_request(nd, dvp, p, cred, dstuff);
2492	if (error)
2493		return (error);
2494	if (nd->nd_flag & ND_NFSV4)
2495		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2496	if ((nd->nd_flag & ND_NFSV3) && !error) {
2497		if (!nd->nd_repstat)
2498			error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2499		if (!error)
2500			error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp,
2501			    NULL, dstuff);
2502	}
2503	if (nd->nd_repstat && !error)
2504		error = nd->nd_repstat;
2505	mbuf_freem(nd->nd_mrep);
2506	/*
2507	 * Kludge: Map EEXIST => 0 assuming that it is a reply to a retry.
2508	 */
2509	if (error == EEXIST)
2510		error = 0;
2511	return (error);
2512}
2513
2514/*
2515 * nfs make dir rpc
2516 */
2517APPLESTATIC int
2518nfsrpc_mkdir(vnode_t dvp, char *name, int namelen, struct vattr *vap,
2519    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *dnap,
2520    struct nfsvattr *nnap, struct nfsfh **nfhpp, int *attrflagp,
2521    int *dattrflagp, void *dstuff)
2522{
2523	u_int32_t *tl;
2524	struct nfsrv_descript nfsd, *nd = &nfsd;
2525	nfsattrbit_t attrbits;
2526	int error = 0;
2527
2528	*nfhpp = NULL;
2529	*attrflagp = 0;
2530	*dattrflagp = 0;
2531	if (namelen > NFS_MAXNAMLEN)
2532		return (ENAMETOOLONG);
2533	NFSCL_REQSTART(nd, NFSPROC_MKDIR, dvp);
2534	if (nd->nd_flag & ND_NFSV4) {
2535		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2536		*tl = txdr_unsigned(NFDIR);
2537	}
2538	(void) nfsm_strtom(nd, name, namelen);
2539	nfscl_fillsattr(nd, vap, dvp, NFSSATTR_SIZENEG1, 0);
2540	if (nd->nd_flag & ND_NFSV4) {
2541		NFSGETATTR_ATTRBIT(&attrbits);
2542		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2543		*tl++ = txdr_unsigned(NFSV4OP_GETFH);
2544		*tl = txdr_unsigned(NFSV4OP_GETATTR);
2545		(void) nfsrv_putattrbit(nd, &attrbits);
2546	}
2547	error = nfscl_request(nd, dvp, p, cred, dstuff);
2548	if (error)
2549		return (error);
2550	if (nd->nd_flag & ND_NFSV4)
2551		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2552	if (!nd->nd_repstat && !error) {
2553		if (nd->nd_flag & ND_NFSV4) {
2554			NFSM_DISSECT(tl, u_int32_t *, 5 * NFSX_UNSIGNED);
2555			error = nfsrv_getattrbits(nd, &attrbits, NULL, NULL);
2556		}
2557		if (!error)
2558			error = nfscl_mtofh(nd, nfhpp, nnap, attrflagp);
2559	}
2560	if ((nd->nd_flag & ND_NFSV3) && !error)
2561		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2562	if (nd->nd_repstat && !error)
2563		error = nd->nd_repstat;
2564nfsmout:
2565	mbuf_freem(nd->nd_mrep);
2566	/*
2567	 * Kludge: Map EEXIST => 0 assuming that you have a reply to a retry.
2568	 */
2569	if (error == EEXIST)
2570		error = 0;
2571	return (error);
2572}
2573
2574/*
2575 * nfs remove directory call
2576 */
2577APPLESTATIC int
2578nfsrpc_rmdir(vnode_t dvp, char *name, int namelen, struct ucred *cred,
2579    NFSPROC_T *p, struct nfsvattr *dnap, int *dattrflagp, void *dstuff)
2580{
2581	struct nfsrv_descript nfsd, *nd = &nfsd;
2582	int error = 0;
2583
2584	*dattrflagp = 0;
2585	if (namelen > NFS_MAXNAMLEN)
2586		return (ENAMETOOLONG);
2587	NFSCL_REQSTART(nd, NFSPROC_RMDIR, dvp);
2588	(void) nfsm_strtom(nd, name, namelen);
2589	error = nfscl_request(nd, dvp, p, cred, dstuff);
2590	if (error)
2591		return (error);
2592	if (nd->nd_flag & (ND_NFSV3 | ND_NFSV4))
2593		error = nfscl_wcc_data(nd, dvp, dnap, dattrflagp, NULL, dstuff);
2594	if (nd->nd_repstat && !error)
2595		error = nd->nd_repstat;
2596	mbuf_freem(nd->nd_mrep);
2597	/*
2598	 * Kludge: Map ENOENT => 0 assuming that you have a reply to a retry.
2599	 */
2600	if (error == ENOENT)
2601		error = 0;
2602	return (error);
2603}
2604
2605/*
2606 * Readdir rpc.
2607 * Always returns with either uio_resid unchanged, if you are at the
2608 * end of the directory, or uio_resid == 0, with all DIRBLKSIZ chunks
2609 * filled in.
2610 * I felt this would allow caching of directory blocks more easily
2611 * than returning a pertially filled block.
2612 * Directory offset cookies:
2613 * Oh my, what to do with them...
2614 * I can think of three ways to deal with them:
2615 * 1 - have the layer above these RPCs maintain a map between logical
2616 *     directory byte offsets and the NFS directory offset cookies
2617 * 2 - pass the opaque directory offset cookies up into userland
2618 *     and let the libc functions deal with them, via the system call
2619 * 3 - return them to userland in the "struct dirent", so future versions
2620 *     of libc can use them and do whatever is necessary to amke things work
2621 *     above these rpc calls, in the meantime
2622 * For now, I do #3 by "hiding" the directory offset cookies after the
2623 * d_name field in struct dirent. This is space inside d_reclen that
2624 * will be ignored by anything that doesn't know about them.
2625 * The directory offset cookies are filled in as the last 8 bytes of
2626 * each directory entry, after d_name. Someday, the userland libc
2627 * functions may be able to use these. In the meantime, it satisfies
2628 * OpenBSD's requirements for cookies being returned.
2629 * If expects the directory offset cookie for the read to be in uio_offset
2630 * and returns the one for the next entry after this directory block in
2631 * there, as well.
2632 */
2633APPLESTATIC int
2634nfsrpc_readdir(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
2635    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
2636    int *eofp, void *stuff)
2637{
2638	int len, left;
2639	struct dirent *dp = NULL;
2640	u_int32_t *tl;
2641	nfsquad_t cookie, ncookie;
2642	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
2643	struct nfsnode *dnp = VTONFS(vp);
2644	struct nfsvattr nfsva;
2645	struct nfsrv_descript nfsd, *nd = &nfsd;
2646	int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
2647	int reqsize, tryformoredirs = 1, readsize, eof = 0, gotmnton = 0;
2648	long dotfileid, dotdotfileid = 0;
2649	u_int32_t fakefileno = 0xffffffff, rderr;
2650	char *cp;
2651	nfsattrbit_t attrbits, dattrbits;
2652	u_int32_t *tl2 = NULL;
2653	size_t tresid;
2654
2655	KASSERT(uiop->uio_iovcnt == 1 &&
2656	    (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
2657	    ("nfs readdirrpc bad uio"));
2658
2659	/*
2660	 * There is no point in reading a lot more than uio_resid, however
2661	 * adding one additional DIRBLKSIZ makes sense. Since uio_resid
2662	 * and nm_readdirsize are both exact multiples of DIRBLKSIZ, this
2663	 * will never make readsize > nm_readdirsize.
2664	 */
2665	readsize = nmp->nm_readdirsize;
2666	if (readsize > uio_uio_resid(uiop))
2667		readsize = uio_uio_resid(uiop) + DIRBLKSIZ;
2668
2669	*attrflagp = 0;
2670	if (eofp)
2671		*eofp = 0;
2672	tresid = uio_uio_resid(uiop);
2673	cookie.lval[0] = cookiep->nfsuquad[0];
2674	cookie.lval[1] = cookiep->nfsuquad[1];
2675	nd->nd_mrep = NULL;
2676
2677	/*
2678	 * For NFSv4, first create the "." and ".." entries.
2679	 */
2680	if (NFSHASNFSV4(nmp)) {
2681		reqsize = 6 * NFSX_UNSIGNED;
2682		NFSGETATTR_ATTRBIT(&dattrbits);
2683		NFSZERO_ATTRBIT(&attrbits);
2684		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
2685		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_TYPE);
2686		if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
2687		    NFSATTRBIT_MOUNTEDONFILEID)) {
2688			NFSSETBIT_ATTRBIT(&attrbits,
2689			    NFSATTRBIT_MOUNTEDONFILEID);
2690			gotmnton = 1;
2691		} else {
2692			/*
2693			 * Must fake it. Use the fileno, except when the
2694			 * fsid is != to that of the directory. For that
2695			 * case, generate a fake fileno that is not the same.
2696			 */
2697			NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
2698			gotmnton = 0;
2699		}
2700
2701		/*
2702		 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
2703		 */
2704		if (uiop->uio_offset == 0) {
2705#if defined(__FreeBSD_version) && __FreeBSD_version >= 800000
2706			error = VOP_GETATTR(vp, &nfsva.na_vattr, cred);
2707#else
2708			error = VOP_GETATTR(vp, &nfsva.na_vattr, cred, p);
2709#endif
2710			if (error)
2711			    return (error);
2712			dotfileid = nfsva.na_fileid;
2713			NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
2714			NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2715			*tl++ = txdr_unsigned(NFSV4OP_GETFH);
2716			*tl = txdr_unsigned(NFSV4OP_GETATTR);
2717			(void) nfsrv_putattrbit(nd, &attrbits);
2718			error = nfscl_request(nd, vp, p, cred, stuff);
2719			if (error)
2720			    return (error);
2721			if (nd->nd_repstat == 0) {
2722			    NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2723			    len = fxdr_unsigned(int, *(tl + 2));
2724			    if (len > 0 && len <= NFSX_V4FHMAX)
2725				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
2726			    else
2727				error = EPERM;
2728			    if (!error) {
2729				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2730				nfsva.na_mntonfileno = 0xffffffff;
2731				error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
2732				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
2733				    NULL, NULL, NULL, p, cred);
2734				if (error) {
2735				    dotdotfileid = dotfileid;
2736				} else if (gotmnton) {
2737				    if (nfsva.na_mntonfileno != 0xffffffff)
2738					dotdotfileid = nfsva.na_mntonfileno;
2739				    else
2740					dotdotfileid = nfsva.na_fileid;
2741				} else if (nfsva.na_filesid[0] ==
2742				    dnp->n_vattr.na_filesid[0] &&
2743				    nfsva.na_filesid[1] ==
2744				    dnp->n_vattr.na_filesid[1]) {
2745				    dotdotfileid = nfsva.na_fileid;
2746				} else {
2747				    do {
2748					fakefileno--;
2749				    } while (fakefileno ==
2750					nfsva.na_fileid);
2751				    dotdotfileid = fakefileno;
2752				}
2753			    }
2754			} else if (nd->nd_repstat == NFSERR_NOENT) {
2755			    /*
2756			     * Lookupp returns NFSERR_NOENT when we are
2757			     * at the root, so just use the current dir.
2758			     */
2759			    nd->nd_repstat = 0;
2760			    dotdotfileid = dotfileid;
2761			} else {
2762			    error = nd->nd_repstat;
2763			}
2764			mbuf_freem(nd->nd_mrep);
2765			if (error)
2766			    return (error);
2767			nd->nd_mrep = NULL;
2768			dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2769			dp->d_type = DT_DIR;
2770			dp->d_fileno = dotfileid;
2771			dp->d_namlen = 1;
2772			dp->d_name[0] = '.';
2773			dp->d_name[1] = '\0';
2774			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
2775			/*
2776			 * Just make these offset cookie 0.
2777			 */
2778			tl = (u_int32_t *)&dp->d_name[4];
2779			*tl++ = 0;
2780			*tl = 0;
2781			blksiz += dp->d_reclen;
2782			uio_uio_resid_add(uiop, -(dp->d_reclen));
2783			uiop->uio_offset += dp->d_reclen;
2784			uio_iov_base_add(uiop, dp->d_reclen);
2785			uio_iov_len_add(uiop, -(dp->d_reclen));
2786			dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2787			dp->d_type = DT_DIR;
2788			dp->d_fileno = dotdotfileid;
2789			dp->d_namlen = 2;
2790			dp->d_name[0] = '.';
2791			dp->d_name[1] = '.';
2792			dp->d_name[2] = '\0';
2793			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
2794			/*
2795			 * Just make these offset cookie 0.
2796			 */
2797			tl = (u_int32_t *)&dp->d_name[4];
2798			*tl++ = 0;
2799			*tl = 0;
2800			blksiz += dp->d_reclen;
2801			uio_uio_resid_add(uiop, -(dp->d_reclen));
2802			uiop->uio_offset += dp->d_reclen;
2803			uio_iov_base_add(uiop, dp->d_reclen);
2804			uio_iov_len_add(uiop, -(dp->d_reclen));
2805		}
2806		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_RDATTRERROR);
2807	} else {
2808		reqsize = 5 * NFSX_UNSIGNED;
2809	}
2810
2811
2812	/*
2813	 * Loop around doing readdir rpc's of size readsize.
2814	 * The stopping criteria is EOF or buffer full.
2815	 */
2816	while (more_dirs && bigenough) {
2817		*attrflagp = 0;
2818		NFSCL_REQSTART(nd, NFSPROC_READDIR, vp);
2819		if (nd->nd_flag & ND_NFSV2) {
2820			NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
2821			*tl++ = cookie.lval[1];
2822			*tl = txdr_unsigned(readsize);
2823		} else {
2824			NFSM_BUILD(tl, u_int32_t *, reqsize);
2825			*tl++ = cookie.lval[0];
2826			*tl++ = cookie.lval[1];
2827			if (cookie.qval == 0) {
2828				*tl++ = 0;
2829				*tl++ = 0;
2830			} else {
2831				NFSLOCKNODE(dnp);
2832				*tl++ = dnp->n_cookieverf.nfsuquad[0];
2833				*tl++ = dnp->n_cookieverf.nfsuquad[1];
2834				NFSUNLOCKNODE(dnp);
2835			}
2836			if (nd->nd_flag & ND_NFSV4) {
2837				*tl++ = txdr_unsigned(readsize);
2838				*tl = txdr_unsigned(readsize);
2839				(void) nfsrv_putattrbit(nd, &attrbits);
2840				NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
2841				*tl = txdr_unsigned(NFSV4OP_GETATTR);
2842				(void) nfsrv_putattrbit(nd, &dattrbits);
2843			} else {
2844				*tl = txdr_unsigned(readsize);
2845			}
2846		}
2847		error = nfscl_request(nd, vp, p, cred, stuff);
2848		if (error)
2849			return (error);
2850		if (!(nd->nd_flag & ND_NFSV2)) {
2851			if (nd->nd_flag & ND_NFSV3)
2852				error = nfscl_postop_attr(nd, nap, attrflagp,
2853				    stuff);
2854			if (!nd->nd_repstat && !error) {
2855				NFSM_DISSECT(tl, u_int32_t *, NFSX_HYPER);
2856				NFSLOCKNODE(dnp);
2857				dnp->n_cookieverf.nfsuquad[0] = *tl++;
2858				dnp->n_cookieverf.nfsuquad[1] = *tl;
2859				NFSUNLOCKNODE(dnp);
2860			}
2861		}
2862		if (nd->nd_repstat || error) {
2863			if (!error)
2864				error = nd->nd_repstat;
2865			goto nfsmout;
2866		}
2867		NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2868		more_dirs = fxdr_unsigned(int, *tl);
2869		if (!more_dirs)
2870			tryformoredirs = 0;
2871
2872		/* loop thru the dir entries, doctoring them to 4bsd form */
2873		while (more_dirs && bigenough) {
2874			if (nd->nd_flag & ND_NFSV4) {
2875				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2876				ncookie.lval[0] = *tl++;
2877				ncookie.lval[1] = *tl++;
2878				len = fxdr_unsigned(int, *tl);
2879			} else if (nd->nd_flag & ND_NFSV3) {
2880				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2881				nfsva.na_fileid = fxdr_hyper(tl);
2882				tl += 2;
2883				len = fxdr_unsigned(int, *tl);
2884			} else {
2885				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2886				nfsva.na_fileid =
2887				    fxdr_unsigned(long, *tl++);
2888				len = fxdr_unsigned(int, *tl);
2889			}
2890			if (len <= 0 || len > NFS_MAXNAMLEN) {
2891				error = EBADRPC;
2892				goto nfsmout;
2893			}
2894			tlen = NFSM_RNDUP(len);
2895			if (tlen == len)
2896				tlen += 4;  /* To ensure null termination */
2897			left = DIRBLKSIZ - blksiz;
2898			if ((int)(tlen + DIRHDSIZ + NFSX_HYPER) > left) {
2899				dp->d_reclen += left;
2900				uio_iov_base_add(uiop, left);
2901				uio_iov_len_add(uiop, -(left));
2902				uio_uio_resid_add(uiop, -(left));
2903				uiop->uio_offset += left;
2904				blksiz = 0;
2905			}
2906			if ((int)(tlen + DIRHDSIZ + NFSX_HYPER) > uio_uio_resid(uiop))
2907				bigenough = 0;
2908			if (bigenough) {
2909				dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
2910				dp->d_namlen = len;
2911				dp->d_reclen = tlen + DIRHDSIZ + NFSX_HYPER;
2912				dp->d_type = DT_UNKNOWN;
2913				blksiz += dp->d_reclen;
2914				if (blksiz == DIRBLKSIZ)
2915					blksiz = 0;
2916				uio_uio_resid_add(uiop, -(DIRHDSIZ));
2917				uiop->uio_offset += DIRHDSIZ;
2918				uio_iov_base_add(uiop, DIRHDSIZ);
2919				uio_iov_len_add(uiop, -(DIRHDSIZ));
2920				error = nfsm_mbufuio(nd, uiop, len);
2921				if (error)
2922					goto nfsmout;
2923				cp = CAST_DOWN(caddr_t, uio_iov_base(uiop));
2924				tlen -= len;
2925				*cp = '\0';	/* null terminate */
2926				cp += tlen;	/* points to cookie storage */
2927				tl2 = (u_int32_t *)cp;
2928				uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
2929				uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
2930				uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
2931				uiop->uio_offset += (tlen + NFSX_HYPER);
2932			} else {
2933				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
2934				if (error)
2935					goto nfsmout;
2936			}
2937			if (nd->nd_flag & ND_NFSV4) {
2938				rderr = 0;
2939				nfsva.na_mntonfileno = 0xffffffff;
2940				error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
2941				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
2942				    NULL, NULL, &rderr, p, cred);
2943				if (error)
2944					goto nfsmout;
2945				NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2946			} else if (nd->nd_flag & ND_NFSV3) {
2947				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
2948				ncookie.lval[0] = *tl++;
2949				ncookie.lval[1] = *tl++;
2950			} else {
2951				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
2952				ncookie.lval[0] = 0;
2953				ncookie.lval[1] = *tl++;
2954			}
2955			if (bigenough) {
2956			    if (nd->nd_flag & ND_NFSV4) {
2957				if (rderr) {
2958				    dp->d_fileno = 0;
2959				} else {
2960				    if (gotmnton) {
2961					if (nfsva.na_mntonfileno != 0xffffffff)
2962					    dp->d_fileno = nfsva.na_mntonfileno;
2963					else
2964					    dp->d_fileno = nfsva.na_fileid;
2965				    } else if (nfsva.na_filesid[0] ==
2966					dnp->n_vattr.na_filesid[0] &&
2967					nfsva.na_filesid[1] ==
2968					dnp->n_vattr.na_filesid[1]) {
2969					dp->d_fileno = nfsva.na_fileid;
2970				    } else {
2971					do {
2972					    fakefileno--;
2973					} while (fakefileno ==
2974					    nfsva.na_fileid);
2975					dp->d_fileno = fakefileno;
2976				    }
2977				    dp->d_type = vtonfs_dtype(nfsva.na_type);
2978				}
2979			    } else {
2980				dp->d_fileno = nfsva.na_fileid;
2981			    }
2982			    *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
2983				ncookie.lval[0];
2984			    *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
2985				ncookie.lval[1];
2986			}
2987			more_dirs = fxdr_unsigned(int, *tl);
2988		}
2989		/*
2990		 * If at end of rpc data, get the eof boolean
2991		 */
2992		if (!more_dirs) {
2993			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
2994			eof = fxdr_unsigned(int, *tl);
2995			if (tryformoredirs)
2996				more_dirs = !eof;
2997			if (nd->nd_flag & ND_NFSV4) {
2998				error = nfscl_postop_attr(nd, nap, attrflagp,
2999				    stuff);
3000				if (error)
3001					goto nfsmout;
3002			}
3003		}
3004		mbuf_freem(nd->nd_mrep);
3005		nd->nd_mrep = NULL;
3006	}
3007	/*
3008	 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3009	 * by increasing d_reclen for the last record.
3010	 */
3011	if (blksiz > 0) {
3012		left = DIRBLKSIZ - blksiz;
3013		dp->d_reclen += left;
3014		uio_iov_base_add(uiop, left);
3015		uio_iov_len_add(uiop, -(left));
3016		uio_uio_resid_add(uiop, -(left));
3017		uiop->uio_offset += left;
3018	}
3019
3020	/*
3021	 * If returning no data, assume end of file.
3022	 * If not bigenough, return not end of file, since you aren't
3023	 *    returning all the data
3024	 * Otherwise, return the eof flag from the server.
3025	 */
3026	if (eofp) {
3027		if (tresid == ((size_t)(uio_uio_resid(uiop))))
3028			*eofp = 1;
3029		else if (!bigenough)
3030			*eofp = 0;
3031		else
3032			*eofp = eof;
3033	}
3034
3035	/*
3036	 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3037	 */
3038	while (uio_uio_resid(uiop) > 0 && ((size_t)(uio_uio_resid(uiop))) != tresid) {
3039		dp = (struct dirent *) CAST_DOWN(caddr_t, uio_iov_base(uiop));
3040		dp->d_type = DT_UNKNOWN;
3041		dp->d_fileno = 0;
3042		dp->d_namlen = 0;
3043		dp->d_name[0] = '\0';
3044		tl = (u_int32_t *)&dp->d_name[4];
3045		*tl++ = cookie.lval[0];
3046		*tl = cookie.lval[1];
3047		dp->d_reclen = DIRBLKSIZ;
3048		uio_iov_base_add(uiop, DIRBLKSIZ);
3049		uio_iov_len_add(uiop, -(DIRBLKSIZ));
3050		uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3051		uiop->uio_offset += DIRBLKSIZ;
3052	}
3053
3054nfsmout:
3055	if (nd->nd_mrep != NULL)
3056		mbuf_freem(nd->nd_mrep);
3057	return (error);
3058}
3059
3060#ifndef APPLE
3061/*
3062 * NFS V3 readdir plus RPC. Used in place of nfsrpc_readdir().
3063 * (Also used for NFS V4 when mount flag set.)
3064 * (ditto above w.r.t. multiple of DIRBLKSIZ, etc.)
3065 */
3066APPLESTATIC int
3067nfsrpc_readdirplus(vnode_t vp, struct uio *uiop, nfsuint64 *cookiep,
3068    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
3069    int *eofp, void *stuff)
3070{
3071	int len, left;
3072	struct dirent *dp = NULL;
3073	u_int32_t *tl;
3074	vnode_t newvp = NULLVP;
3075	struct nfsrv_descript nfsd, *nd = &nfsd;
3076	struct nameidata nami, *ndp = &nami;
3077	struct componentname *cnp = &ndp->ni_cnd;
3078	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3079	struct nfsnode *dnp = VTONFS(vp), *np;
3080	struct nfsvattr nfsva;
3081	struct nfsfh *nfhp;
3082	nfsquad_t cookie, ncookie;
3083	int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
3084	int attrflag, tryformoredirs = 1, eof = 0, gotmnton = 0;
3085	int isdotdot = 0, unlocknewvp = 0;
3086	long dotfileid, dotdotfileid = 0, fileno = 0;
3087	char *cp;
3088	nfsattrbit_t attrbits, dattrbits;
3089	size_t tresid;
3090	u_int32_t *tl2 = NULL, fakefileno = 0xffffffff, rderr;
3091	struct timespec dctime;
3092
3093	KASSERT(uiop->uio_iovcnt == 1 &&
3094	    (uio_uio_resid(uiop) & (DIRBLKSIZ - 1)) == 0,
3095	    ("nfs readdirplusrpc bad uio"));
3096	timespecclear(&dctime);
3097	*attrflagp = 0;
3098	if (eofp != NULL)
3099		*eofp = 0;
3100	ndp->ni_dvp = vp;
3101	nd->nd_mrep = NULL;
3102	cookie.lval[0] = cookiep->nfsuquad[0];
3103	cookie.lval[1] = cookiep->nfsuquad[1];
3104	tresid = uio_uio_resid(uiop);
3105
3106	/*
3107	 * For NFSv4, first create the "." and ".." entries.
3108	 */
3109	if (NFSHASNFSV4(nmp)) {
3110		NFSGETATTR_ATTRBIT(&dattrbits);
3111		NFSZERO_ATTRBIT(&attrbits);
3112		NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FILEID);
3113		if (NFSISSET_ATTRBIT(&dnp->n_vattr.na_suppattr,
3114		    NFSATTRBIT_MOUNTEDONFILEID)) {
3115			NFSSETBIT_ATTRBIT(&attrbits,
3116			    NFSATTRBIT_MOUNTEDONFILEID);
3117			gotmnton = 1;
3118		} else {
3119			/*
3120			 * Must fake it. Use the fileno, except when the
3121			 * fsid is != to that of the directory. For that
3122			 * case, generate a fake fileno that is not the same.
3123			 */
3124			NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_FSID);
3125			gotmnton = 0;
3126		}
3127
3128		/*
3129		 * Joy, oh joy. For V4 we get to hand craft '.' and '..'.
3130		 */
3131		if (uiop->uio_offset == 0) {
3132#if defined(__FreeBSD_version) && __FreeBSD_version >= 800000
3133			error = VOP_GETATTR(vp, &nfsva.na_vattr, cred);
3134#else
3135			error = VOP_GETATTR(vp, &nfsva.na_vattr, cred, p);
3136#endif
3137			if (error)
3138			    return (error);
3139			dctime = nfsva.na_ctime;
3140			dotfileid = nfsva.na_fileid;
3141			NFSCL_REQSTART(nd, NFSPROC_LOOKUPP, vp);
3142			NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
3143			*tl++ = txdr_unsigned(NFSV4OP_GETFH);
3144			*tl = txdr_unsigned(NFSV4OP_GETATTR);
3145			(void) nfsrv_putattrbit(nd, &attrbits);
3146			error = nfscl_request(nd, vp, p, cred, stuff);
3147			if (error)
3148			    return (error);
3149			if (nd->nd_repstat == 0) {
3150			    NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
3151			    len = fxdr_unsigned(int, *(tl + 2));
3152			    if (len > 0 && len <= NFSX_V4FHMAX)
3153				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3154			    else
3155				error = EPERM;
3156			    if (!error) {
3157				NFSM_DISSECT(tl, u_int32_t *, 2*NFSX_UNSIGNED);
3158				nfsva.na_mntonfileno = 0xffffffff;
3159				error = nfsv4_loadattr(nd, NULL, &nfsva, NULL,
3160				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3161				    NULL, NULL, NULL, p, cred);
3162				if (error) {
3163				    dotdotfileid = dotfileid;
3164				} else if (gotmnton) {
3165				    if (nfsva.na_mntonfileno != 0xffffffff)
3166					dotdotfileid = nfsva.na_mntonfileno;
3167				    else
3168					dotdotfileid = nfsva.na_fileid;
3169				} else if (nfsva.na_filesid[0] ==
3170				    dnp->n_vattr.na_filesid[0] &&
3171				    nfsva.na_filesid[1] ==
3172				    dnp->n_vattr.na_filesid[1]) {
3173				    dotdotfileid = nfsva.na_fileid;
3174				} else {
3175				    do {
3176					fakefileno--;
3177				    } while (fakefileno ==
3178					nfsva.na_fileid);
3179				    dotdotfileid = fakefileno;
3180				}
3181			    }
3182			} else if (nd->nd_repstat == NFSERR_NOENT) {
3183			    /*
3184			     * Lookupp returns NFSERR_NOENT when we are
3185			     * at the root, so just use the current dir.
3186			     */
3187			    nd->nd_repstat = 0;
3188			    dotdotfileid = dotfileid;
3189			} else {
3190			    error = nd->nd_repstat;
3191			}
3192			mbuf_freem(nd->nd_mrep);
3193			if (error)
3194			    return (error);
3195			nd->nd_mrep = NULL;
3196			dp = (struct dirent *)uio_iov_base(uiop);
3197			dp->d_type = DT_DIR;
3198			dp->d_fileno = dotfileid;
3199			dp->d_namlen = 1;
3200			dp->d_name[0] = '.';
3201			dp->d_name[1] = '\0';
3202			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
3203			/*
3204			 * Just make these offset cookie 0.
3205			 */
3206			tl = (u_int32_t *)&dp->d_name[4];
3207			*tl++ = 0;
3208			*tl = 0;
3209			blksiz += dp->d_reclen;
3210			uio_uio_resid_add(uiop, -(dp->d_reclen));
3211			uiop->uio_offset += dp->d_reclen;
3212			uio_iov_base_add(uiop, dp->d_reclen);
3213			uio_iov_len_add(uiop, -(dp->d_reclen));
3214			dp = (struct dirent *)uio_iov_base(uiop);
3215			dp->d_type = DT_DIR;
3216			dp->d_fileno = dotdotfileid;
3217			dp->d_namlen = 2;
3218			dp->d_name[0] = '.';
3219			dp->d_name[1] = '.';
3220			dp->d_name[2] = '\0';
3221			dp->d_reclen = DIRENT_SIZE(dp) + NFSX_HYPER;
3222			/*
3223			 * Just make these offset cookie 0.
3224			 */
3225			tl = (u_int32_t *)&dp->d_name[4];
3226			*tl++ = 0;
3227			*tl = 0;
3228			blksiz += dp->d_reclen;
3229			uio_uio_resid_add(uiop, -(dp->d_reclen));
3230			uiop->uio_offset += dp->d_reclen;
3231			uio_iov_base_add(uiop, dp->d_reclen);
3232			uio_iov_len_add(uiop, -(dp->d_reclen));
3233		}
3234		NFSREADDIRPLUS_ATTRBIT(&attrbits);
3235		if (gotmnton)
3236			NFSSETBIT_ATTRBIT(&attrbits,
3237			    NFSATTRBIT_MOUNTEDONFILEID);
3238	}
3239
3240	/*
3241	 * Loop around doing readdir rpc's of size nm_readdirsize.
3242	 * The stopping criteria is EOF or buffer full.
3243	 */
3244	while (more_dirs && bigenough) {
3245		*attrflagp = 0;
3246		NFSCL_REQSTART(nd, NFSPROC_READDIRPLUS, vp);
3247 		NFSM_BUILD(tl, u_int32_t *, 6 * NFSX_UNSIGNED);
3248		*tl++ = cookie.lval[0];
3249		*tl++ = cookie.lval[1];
3250		if (cookie.qval == 0) {
3251			*tl++ = 0;
3252			*tl++ = 0;
3253		} else {
3254			NFSLOCKNODE(dnp);
3255			*tl++ = dnp->n_cookieverf.nfsuquad[0];
3256			*tl++ = dnp->n_cookieverf.nfsuquad[1];
3257			NFSUNLOCKNODE(dnp);
3258		}
3259		*tl++ = txdr_unsigned(nmp->nm_readdirsize);
3260		*tl = txdr_unsigned(nmp->nm_readdirsize);
3261		if (nd->nd_flag & ND_NFSV4) {
3262			(void) nfsrv_putattrbit(nd, &attrbits);
3263			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3264			*tl = txdr_unsigned(NFSV4OP_GETATTR);
3265			(void) nfsrv_putattrbit(nd, &dattrbits);
3266		}
3267		error = nfscl_request(nd, vp, p, cred, stuff);
3268		if (error)
3269			return (error);
3270		if (nd->nd_flag & ND_NFSV3)
3271			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3272		if (nd->nd_repstat || error) {
3273			if (!error)
3274				error = nd->nd_repstat;
3275			goto nfsmout;
3276		}
3277		if ((nd->nd_flag & ND_NFSV3) != 0 && *attrflagp != 0)
3278			dctime = nap->na_ctime;
3279		NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3280		NFSLOCKNODE(dnp);
3281		dnp->n_cookieverf.nfsuquad[0] = *tl++;
3282		dnp->n_cookieverf.nfsuquad[1] = *tl++;
3283		NFSUNLOCKNODE(dnp);
3284		more_dirs = fxdr_unsigned(int, *tl);
3285		if (!more_dirs)
3286			tryformoredirs = 0;
3287
3288		/* loop thru the dir entries, doctoring them to 4bsd form */
3289		while (more_dirs && bigenough) {
3290			NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3291			if (nd->nd_flag & ND_NFSV4) {
3292				ncookie.lval[0] = *tl++;
3293				ncookie.lval[1] = *tl++;
3294			} else {
3295				fileno = fxdr_unsigned(long, *++tl);
3296				tl++;
3297			}
3298			len = fxdr_unsigned(int, *tl);
3299			if (len <= 0 || len > NFS_MAXNAMLEN) {
3300				error = EBADRPC;
3301				goto nfsmout;
3302			}
3303			tlen = NFSM_RNDUP(len);
3304			if (tlen == len)
3305				tlen += 4;  /* To ensure null termination */
3306			left = DIRBLKSIZ - blksiz;
3307			if ((tlen + DIRHDSIZ + NFSX_HYPER) > left) {
3308				dp->d_reclen += left;
3309				uio_iov_base_add(uiop, left);
3310				uio_iov_len_add(uiop, -(left));
3311				uio_uio_resid_add(uiop, -(left));
3312				uiop->uio_offset += left;
3313				blksiz = 0;
3314			}
3315			if ((tlen + DIRHDSIZ + NFSX_HYPER) > uio_uio_resid(uiop))
3316				bigenough = 0;
3317			if (bigenough) {
3318				dp = (struct dirent *)uio_iov_base(uiop);
3319				dp->d_namlen = len;
3320				dp->d_reclen = tlen + DIRHDSIZ + NFSX_HYPER;
3321				dp->d_type = DT_UNKNOWN;
3322				blksiz += dp->d_reclen;
3323				if (blksiz == DIRBLKSIZ)
3324					blksiz = 0;
3325				uio_uio_resid_add(uiop, -(DIRHDSIZ));
3326				uiop->uio_offset += DIRHDSIZ;
3327				uio_iov_base_add(uiop, DIRHDSIZ);
3328				uio_iov_len_add(uiop, -(DIRHDSIZ));
3329				cnp->cn_nameptr = uio_iov_base(uiop);
3330				cnp->cn_namelen = len;
3331				NFSCNHASHZERO(cnp);
3332				error = nfsm_mbufuio(nd, uiop, len);
3333				if (error)
3334					goto nfsmout;
3335				cp = uio_iov_base(uiop);
3336				tlen -= len;
3337				*cp = '\0';
3338				cp += tlen;	/* points to cookie storage */
3339				tl2 = (u_int32_t *)cp;
3340				if (len == 2 && cnp->cn_nameptr[0] == '.' &&
3341				    cnp->cn_nameptr[1] == '.')
3342					isdotdot = 1;
3343				else
3344					isdotdot = 0;
3345				uio_iov_base_add(uiop, (tlen + NFSX_HYPER));
3346				uio_iov_len_add(uiop, -(tlen + NFSX_HYPER));
3347				uio_uio_resid_add(uiop, -(tlen + NFSX_HYPER));
3348				uiop->uio_offset += (tlen + NFSX_HYPER);
3349			} else {
3350				error = nfsm_advance(nd, NFSM_RNDUP(len), -1);
3351				if (error)
3352					goto nfsmout;
3353			}
3354			nfhp = NULL;
3355			if (nd->nd_flag & ND_NFSV3) {
3356				NFSM_DISSECT(tl, u_int32_t *, 3*NFSX_UNSIGNED);
3357				ncookie.lval[0] = *tl++;
3358				ncookie.lval[1] = *tl++;
3359				attrflag = fxdr_unsigned(int, *tl);
3360				if (attrflag) {
3361				  error = nfsm_loadattr(nd, &nfsva);
3362				  if (error)
3363					goto nfsmout;
3364				}
3365				NFSM_DISSECT(tl,u_int32_t *,NFSX_UNSIGNED);
3366				if (*tl) {
3367					error = nfsm_getfh(nd, &nfhp);
3368					if (error)
3369					    goto nfsmout;
3370				}
3371				if (!attrflag && nfhp != NULL) {
3372					FREE((caddr_t)nfhp, M_NFSFH);
3373					nfhp = NULL;
3374				}
3375			} else {
3376				rderr = 0;
3377				nfsva.na_mntonfileno = 0xffffffff;
3378				error = nfsv4_loadattr(nd, NULL, &nfsva, &nfhp,
3379				    NULL, 0, NULL, NULL, NULL, NULL, NULL, 0,
3380				    NULL, NULL, &rderr, p, cred);
3381				if (error)
3382					goto nfsmout;
3383			}
3384
3385			if (bigenough) {
3386			    if (nd->nd_flag & ND_NFSV4) {
3387				if (rderr) {
3388				    dp->d_fileno = 0;
3389				} else if (gotmnton) {
3390				    if (nfsva.na_mntonfileno != 0xffffffff)
3391					dp->d_fileno = nfsva.na_mntonfileno;
3392				    else
3393					dp->d_fileno = nfsva.na_fileid;
3394				} else if (nfsva.na_filesid[0] ==
3395				    dnp->n_vattr.na_filesid[0] &&
3396				    nfsva.na_filesid[1] ==
3397				    dnp->n_vattr.na_filesid[1]) {
3398				    dp->d_fileno = nfsva.na_fileid;
3399				} else {
3400				    do {
3401					fakefileno--;
3402				    } while (fakefileno ==
3403					nfsva.na_fileid);
3404				    dp->d_fileno = fakefileno;
3405				}
3406			    } else {
3407				dp->d_fileno = fileno;
3408			    }
3409			    *tl2++ = cookiep->nfsuquad[0] = cookie.lval[0] =
3410				ncookie.lval[0];
3411			    *tl2 = cookiep->nfsuquad[1] = cookie.lval[1] =
3412				ncookie.lval[1];
3413
3414			    if (nfhp != NULL) {
3415				if (NFSRV_CMPFH(nfhp->nfh_fh, nfhp->nfh_len,
3416				    dnp->n_fhp->nfh_fh, dnp->n_fhp->nfh_len)) {
3417				    VREF(vp);
3418				    newvp = vp;
3419				    unlocknewvp = 0;
3420				    FREE((caddr_t)nfhp, M_NFSFH);
3421				    np = dnp;
3422				} else if (isdotdot != 0) {
3423				    /*
3424				     * Skip doing a nfscl_nget() call for "..".
3425				     * There's a race between acquiring the nfs
3426				     * node here and lookups that look for the
3427				     * directory being read (in the parent).
3428				     * It would try to get a lock on ".." here,
3429				     * owning the lock on the directory being
3430				     * read. Lookup will hold the lock on ".."
3431				     * and try to acquire the lock on the
3432				     * directory being read.
3433				     * If the directory is unlocked/relocked,
3434				     * then there is a LOR with the buflock
3435				     * vp is relocked.
3436				     */
3437				    free(nfhp, M_NFSFH);
3438				} else {
3439				    error = nfscl_nget(vnode_mount(vp), vp,
3440				      nfhp, cnp, p, &np, NULL, LK_EXCLUSIVE);
3441				    if (!error) {
3442					newvp = NFSTOV(np);
3443					unlocknewvp = 1;
3444				    }
3445				}
3446				nfhp = NULL;
3447				if (newvp != NULLVP) {
3448				    error = nfscl_loadattrcache(&newvp,
3449					&nfsva, NULL, NULL, 0, 0);
3450				    if (error) {
3451					if (unlocknewvp)
3452					    vput(newvp);
3453					else
3454					    vrele(newvp);
3455					goto nfsmout;
3456				    }
3457				    dp->d_type =
3458					vtonfs_dtype(np->n_vattr.na_type);
3459				    ndp->ni_vp = newvp;
3460				    NFSCNHASH(cnp, HASHINIT);
3461				    if (cnp->cn_namelen <= NCHNAMLEN &&
3462					(newvp->v_type != VDIR ||
3463					 dctime.tv_sec != 0)) {
3464					cache_enter_time(ndp->ni_dvp,
3465					    ndp->ni_vp, cnp,
3466					    &nfsva.na_ctime,
3467					    newvp->v_type != VDIR ? NULL :
3468					    &dctime);
3469				    }
3470				    if (unlocknewvp)
3471					vput(newvp);
3472				    else
3473					vrele(newvp);
3474				    newvp = NULLVP;
3475				}
3476			    }
3477			} else if (nfhp != NULL) {
3478			    FREE((caddr_t)nfhp, M_NFSFH);
3479			}
3480			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3481			more_dirs = fxdr_unsigned(int, *tl);
3482		}
3483		/*
3484		 * If at end of rpc data, get the eof boolean
3485		 */
3486		if (!more_dirs) {
3487			NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED);
3488			eof = fxdr_unsigned(int, *tl);
3489			if (tryformoredirs)
3490				more_dirs = !eof;
3491			if (nd->nd_flag & ND_NFSV4) {
3492				error = nfscl_postop_attr(nd, nap, attrflagp,
3493				    stuff);
3494				if (error)
3495					goto nfsmout;
3496			}
3497		}
3498		mbuf_freem(nd->nd_mrep);
3499		nd->nd_mrep = NULL;
3500	}
3501	/*
3502	 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
3503	 * by increasing d_reclen for the last record.
3504	 */
3505	if (blksiz > 0) {
3506		left = DIRBLKSIZ - blksiz;
3507		dp->d_reclen += left;
3508		uio_iov_base_add(uiop, left);
3509		uio_iov_len_add(uiop, -(left));
3510		uio_uio_resid_add(uiop, -(left));
3511		uiop->uio_offset += left;
3512	}
3513
3514	/*
3515	 * If returning no data, assume end of file.
3516	 * If not bigenough, return not end of file, since you aren't
3517	 *    returning all the data
3518	 * Otherwise, return the eof flag from the server.
3519	 */
3520	if (eofp != NULL) {
3521		if (tresid == uio_uio_resid(uiop))
3522			*eofp = 1;
3523		else if (!bigenough)
3524			*eofp = 0;
3525		else
3526			*eofp = eof;
3527	}
3528
3529	/*
3530	 * Add extra empty records to any remaining DIRBLKSIZ chunks.
3531	 */
3532	while (uio_uio_resid(uiop) > 0 && uio_uio_resid(uiop) != tresid) {
3533		dp = (struct dirent *)uio_iov_base(uiop);
3534		dp->d_type = DT_UNKNOWN;
3535		dp->d_fileno = 0;
3536		dp->d_namlen = 0;
3537		dp->d_name[0] = '\0';
3538		tl = (u_int32_t *)&dp->d_name[4];
3539		*tl++ = cookie.lval[0];
3540		*tl = cookie.lval[1];
3541		dp->d_reclen = DIRBLKSIZ;
3542		uio_iov_base_add(uiop, DIRBLKSIZ);
3543		uio_iov_len_add(uiop, -(DIRBLKSIZ));
3544		uio_uio_resid_add(uiop, -(DIRBLKSIZ));
3545		uiop->uio_offset += DIRBLKSIZ;
3546	}
3547
3548nfsmout:
3549	if (nd->nd_mrep != NULL)
3550		mbuf_freem(nd->nd_mrep);
3551	return (error);
3552}
3553#endif	/* !APPLE */
3554
3555/*
3556 * Nfs commit rpc
3557 */
3558APPLESTATIC int
3559nfsrpc_commit(vnode_t vp, u_quad_t offset, int cnt, struct ucred *cred,
3560    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
3561{
3562	u_int32_t *tl;
3563	struct nfsrv_descript nfsd, *nd = &nfsd;
3564	nfsattrbit_t attrbits;
3565	int error;
3566	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3567
3568	*attrflagp = 0;
3569	NFSCL_REQSTART(nd, NFSPROC_COMMIT, vp);
3570	NFSM_BUILD(tl, u_int32_t *, 3 * NFSX_UNSIGNED);
3571	txdr_hyper(offset, tl);
3572	tl += 2;
3573	*tl = txdr_unsigned(cnt);
3574	if (nd->nd_flag & ND_NFSV4) {
3575		/*
3576		 * And do a Getattr op.
3577		 */
3578		NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
3579		*tl = txdr_unsigned(NFSV4OP_GETATTR);
3580		NFSGETATTR_ATTRBIT(&attrbits);
3581		(void) nfsrv_putattrbit(nd, &attrbits);
3582	}
3583	error = nfscl_request(nd, vp, p, cred, stuff);
3584	if (error)
3585		return (error);
3586	error = nfscl_wcc_data(nd, vp, nap, attrflagp, NULL, stuff);
3587	if (!error && !nd->nd_repstat) {
3588		NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
3589		NFSLOCKMNT(nmp);
3590		if (NFSBCMP(nmp->nm_verf, tl, NFSX_VERF)) {
3591			NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
3592			nd->nd_repstat = NFSERR_STALEWRITEVERF;
3593		}
3594		NFSUNLOCKMNT(nmp);
3595		if (nd->nd_flag & ND_NFSV4)
3596			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
3597	}
3598nfsmout:
3599	if (!error && nd->nd_repstat)
3600		error = nd->nd_repstat;
3601	mbuf_freem(nd->nd_mrep);
3602	return (error);
3603}
3604
3605/*
3606 * NFS byte range lock rpc.
3607 * (Mostly just calls one of the three lower level RPC routines.)
3608 */
3609APPLESTATIC int
3610nfsrpc_advlock(vnode_t vp, off_t size, int op, struct flock *fl,
3611    int reclaim, struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3612{
3613	struct nfscllockowner *lp;
3614	struct nfsclclient *clp;
3615	struct nfsfh *nfhp;
3616	struct nfsrv_descript nfsd, *nd = &nfsd;
3617	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
3618	u_int64_t off, len;
3619	off_t start, end;
3620	u_int32_t clidrev = 0;
3621	int error = 0, newone = 0, expireret = 0, retrycnt, donelocally;
3622	int callcnt, dorpc;
3623
3624	/*
3625	 * Convert the flock structure into a start and end and do POSIX
3626	 * bounds checking.
3627	 */
3628	switch (fl->l_whence) {
3629	case SEEK_SET:
3630	case SEEK_CUR:
3631		/*
3632		 * Caller is responsible for adding any necessary offset
3633		 * when SEEK_CUR is used.
3634		 */
3635		start = fl->l_start;
3636		off = fl->l_start;
3637		break;
3638	case SEEK_END:
3639		start = size + fl->l_start;
3640		off = size + fl->l_start;
3641		break;
3642	default:
3643		return (EINVAL);
3644	};
3645	if (start < 0)
3646		return (EINVAL);
3647	if (fl->l_len != 0) {
3648		end = start + fl->l_len - 1;
3649		if (end < start)
3650			return (EINVAL);
3651	}
3652
3653	len = fl->l_len;
3654	if (len == 0)
3655		len = NFS64BITSSET;
3656	retrycnt = 0;
3657	do {
3658	    nd->nd_repstat = 0;
3659	    if (op == F_GETLK) {
3660		error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3661		if (error)
3662			return (error);
3663		error = nfscl_lockt(vp, clp, off, len, fl, p, id, flags);
3664		if (!error) {
3665			clidrev = clp->nfsc_clientidrev;
3666			error = nfsrpc_lockt(nd, vp, clp, off, len, fl, cred,
3667			    p, id, flags);
3668		} else if (error == -1) {
3669			error = 0;
3670		}
3671		nfscl_clientrelease(clp);
3672	    } else if (op == F_UNLCK && fl->l_type == F_UNLCK) {
3673		/*
3674		 * We must loop around for all lockowner cases.
3675		 */
3676		callcnt = 0;
3677		error = nfscl_getcl(vnode_mount(vp), cred, p, 1, &clp);
3678		if (error)
3679			return (error);
3680		do {
3681		    error = nfscl_relbytelock(vp, off, len, cred, p, callcnt,
3682			clp, id, flags, &lp, &dorpc);
3683		    /*
3684		     * If it returns a NULL lp, we're done.
3685		     */
3686		    if (lp == NULL) {
3687			if (callcnt == 0)
3688			    nfscl_clientrelease(clp);
3689			else
3690			    nfscl_releasealllocks(clp, vp, p, id, flags);
3691			return (error);
3692		    }
3693		    if (nmp->nm_clp != NULL)
3694			clidrev = nmp->nm_clp->nfsc_clientidrev;
3695		    else
3696			clidrev = 0;
3697		    /*
3698		     * If the server doesn't support Posix lock semantics,
3699		     * only allow locks on the entire file, since it won't
3700		     * handle overlapping byte ranges.
3701		     * There might still be a problem when a lock
3702		     * upgrade/downgrade (read<->write) occurs, since the
3703		     * server "might" expect an unlock first?
3704		     */
3705		    if (dorpc && (lp->nfsl_open->nfso_posixlock ||
3706			(off == 0 && len == NFS64BITSSET))) {
3707			/*
3708			 * Since the lock records will go away, we must
3709			 * wait for grace and delay here.
3710			 */
3711			do {
3712			    error = nfsrpc_locku(nd, nmp, lp, off, len,
3713				NFSV4LOCKT_READ, cred, p, 0);
3714			    if ((nd->nd_repstat == NFSERR_GRACE ||
3715				 nd->nd_repstat == NFSERR_DELAY) &&
3716				error == 0)
3717				(void) nfs_catnap(PZERO, (int)nd->nd_repstat,
3718				    "nfs_advlock");
3719			} while ((nd->nd_repstat == NFSERR_GRACE ||
3720			    nd->nd_repstat == NFSERR_DELAY) && error == 0);
3721		    }
3722		    callcnt++;
3723		} while (error == 0 && nd->nd_repstat == 0);
3724		nfscl_releasealllocks(clp, vp, p, id, flags);
3725	    } else if (op == F_SETLK) {
3726		error = nfscl_getbytelock(vp, off, len, fl->l_type, cred, p,
3727		    NULL, 0, id, flags, NULL, NULL, &lp, &newone, &donelocally);
3728		if (error || donelocally) {
3729			return (error);
3730		}
3731		if (nmp->nm_clp != NULL)
3732			clidrev = nmp->nm_clp->nfsc_clientidrev;
3733		else
3734			clidrev = 0;
3735		nfhp = VTONFS(vp)->n_fhp;
3736		if (!lp->nfsl_open->nfso_posixlock &&
3737		    (off != 0 || len != NFS64BITSSET)) {
3738			error = EINVAL;
3739		} else {
3740			error = nfsrpc_lock(nd, nmp, vp, nfhp->nfh_fh,
3741			    nfhp->nfh_len, lp, newone, reclaim, off,
3742			    len, fl->l_type, cred, p, 0);
3743		}
3744		if (!error)
3745			error = nd->nd_repstat;
3746		nfscl_lockrelease(lp, error, newone);
3747	    } else {
3748		error = EINVAL;
3749	    }
3750	    if (!error)
3751	        error = nd->nd_repstat;
3752	    if (error == NFSERR_GRACE || error == NFSERR_STALESTATEID ||
3753		error == NFSERR_STALEDONTRECOVER ||
3754		error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3755		error == NFSERR_BADSESSION) {
3756		(void) nfs_catnap(PZERO, error, "nfs_advlock");
3757	    } else if ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID)
3758		&& clidrev != 0) {
3759		expireret = nfscl_hasexpired(nmp->nm_clp, clidrev, p);
3760		retrycnt++;
3761	    }
3762	} while (error == NFSERR_GRACE ||
3763	    error == NFSERR_STALECLIENTID || error == NFSERR_DELAY ||
3764	    error == NFSERR_STALEDONTRECOVER || error == NFSERR_STALESTATEID ||
3765	    error == NFSERR_BADSESSION ||
3766	    ((error == NFSERR_EXPIRED || error == NFSERR_BADSTATEID) &&
3767	     expireret == 0 && clidrev != 0 && retrycnt < 4));
3768	if (error && retrycnt >= 4)
3769		error = EIO;
3770	return (error);
3771}
3772
3773/*
3774 * The lower level routine for the LockT case.
3775 */
3776APPLESTATIC int
3777nfsrpc_lockt(struct nfsrv_descript *nd, vnode_t vp,
3778    struct nfsclclient *clp, u_int64_t off, u_int64_t len, struct flock *fl,
3779    struct ucred *cred, NFSPROC_T *p, void *id, int flags)
3780{
3781	u_int32_t *tl;
3782	int error, type, size;
3783	uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
3784	struct nfsnode *np;
3785	struct nfsmount *nmp;
3786
3787	nmp = VFSTONFS(vp->v_mount);
3788	NFSCL_REQSTART(nd, NFSPROC_LOCKT, vp);
3789	NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
3790	if (fl->l_type == F_RDLCK)
3791		*tl++ = txdr_unsigned(NFSV4LOCKT_READ);
3792	else
3793		*tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
3794	txdr_hyper(off, tl);
3795	tl += 2;
3796	txdr_hyper(len, tl);
3797	tl += 2;
3798	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
3799	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
3800	nfscl_filllockowner(id, own, flags);
3801	np = VTONFS(vp);
3802	NFSBCOPY(np->n_fhp->nfh_fh, &own[NFSV4CL_LOCKNAMELEN],
3803	    np->n_fhp->nfh_len);
3804	(void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + np->n_fhp->nfh_len);
3805	error = nfscl_request(nd, vp, p, cred, NULL);
3806	if (error)
3807		return (error);
3808	if (nd->nd_repstat == 0) {
3809		fl->l_type = F_UNLCK;
3810	} else if (nd->nd_repstat == NFSERR_DENIED) {
3811		nd->nd_repstat = 0;
3812		fl->l_whence = SEEK_SET;
3813		NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
3814		fl->l_start = fxdr_hyper(tl);
3815		tl += 2;
3816		len = fxdr_hyper(tl);
3817		tl += 2;
3818		if (len == NFS64BITSSET)
3819			fl->l_len = 0;
3820		else
3821			fl->l_len = len;
3822		type = fxdr_unsigned(int, *tl++);
3823		if (type == NFSV4LOCKT_WRITE)
3824			fl->l_type = F_WRLCK;
3825		else
3826			fl->l_type = F_RDLCK;
3827		/*
3828		 * XXX For now, I have no idea what to do with the
3829		 * conflicting lock_owner, so I'll just set the pid == 0
3830		 * and skip over the lock_owner.
3831		 */
3832		fl->l_pid = (pid_t)0;
3833		tl += 2;
3834		size = fxdr_unsigned(int, *tl);
3835		if (size < 0 || size > NFSV4_OPAQUELIMIT)
3836			error = EBADRPC;
3837		if (!error)
3838			error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
3839	} else if (nd->nd_repstat == NFSERR_STALECLIENTID ||
3840	    nd->nd_repstat == NFSERR_BADSESSION)
3841		nfscl_initiate_recovery(clp);
3842nfsmout:
3843	mbuf_freem(nd->nd_mrep);
3844	return (error);
3845}
3846
3847/*
3848 * Lower level function that performs the LockU RPC.
3849 */
3850static int
3851nfsrpc_locku(struct nfsrv_descript *nd, struct nfsmount *nmp,
3852    struct nfscllockowner *lp, u_int64_t off, u_int64_t len,
3853    u_int32_t type, struct ucred *cred, NFSPROC_T *p, int syscred)
3854{
3855	u_int32_t *tl;
3856	int error;
3857
3858	nfscl_reqstart(nd, NFSPROC_LOCKU, nmp, lp->nfsl_open->nfso_fh,
3859	    lp->nfsl_open->nfso_fhlen, NULL, NULL);
3860	NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + 6 * NFSX_UNSIGNED);
3861	*tl++ = txdr_unsigned(type);
3862	*tl = txdr_unsigned(lp->nfsl_seqid);
3863	if (nfstest_outofseq &&
3864	    (arc4random() % nfstest_outofseq) == 0)
3865		*tl = txdr_unsigned(lp->nfsl_seqid + 1);
3866	tl++;
3867	if (NFSHASNFSV4N(nmp))
3868		*tl++ = 0;
3869	else
3870		*tl++ = lp->nfsl_stateid.seqid;
3871	*tl++ = lp->nfsl_stateid.other[0];
3872	*tl++ = lp->nfsl_stateid.other[1];
3873	*tl++ = lp->nfsl_stateid.other[2];
3874	txdr_hyper(off, tl);
3875	tl += 2;
3876	txdr_hyper(len, tl);
3877	if (syscred)
3878		nd->nd_flag |= ND_USEGSSNAME;
3879	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
3880	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
3881	NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
3882	if (error)
3883		return (error);
3884	if (nd->nd_repstat == 0) {
3885		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
3886		lp->nfsl_stateid.seqid = *tl++;
3887		lp->nfsl_stateid.other[0] = *tl++;
3888		lp->nfsl_stateid.other[1] = *tl++;
3889		lp->nfsl_stateid.other[2] = *tl;
3890	} else if (nd->nd_repstat == NFSERR_STALESTATEID ||
3891	    nd->nd_repstat == NFSERR_BADSESSION)
3892		nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
3893nfsmout:
3894	mbuf_freem(nd->nd_mrep);
3895	return (error);
3896}
3897
3898/*
3899 * The actual Lock RPC.
3900 */
3901APPLESTATIC int
3902nfsrpc_lock(struct nfsrv_descript *nd, struct nfsmount *nmp, vnode_t vp,
3903    u_int8_t *nfhp, int fhlen, struct nfscllockowner *lp, int newone,
3904    int reclaim, u_int64_t off, u_int64_t len, short type, struct ucred *cred,
3905    NFSPROC_T *p, int syscred)
3906{
3907	u_int32_t *tl;
3908	int error, size;
3909	uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
3910
3911	nfscl_reqstart(nd, NFSPROC_LOCK, nmp, nfhp, fhlen, NULL, NULL);
3912	NFSM_BUILD(tl, u_int32_t *, 7 * NFSX_UNSIGNED);
3913	if (type == F_RDLCK)
3914		*tl++ = txdr_unsigned(NFSV4LOCKT_READ);
3915	else
3916		*tl++ = txdr_unsigned(NFSV4LOCKT_WRITE);
3917	*tl++ = txdr_unsigned(reclaim);
3918	txdr_hyper(off, tl);
3919	tl += 2;
3920	txdr_hyper(len, tl);
3921	tl += 2;
3922	if (newone) {
3923	    *tl = newnfs_true;
3924	    NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID +
3925		2 * NFSX_UNSIGNED + NFSX_HYPER);
3926	    *tl++ = txdr_unsigned(lp->nfsl_open->nfso_own->nfsow_seqid);
3927	    if (NFSHASNFSV4N(nmp))
3928		*tl++ = 0;
3929	    else
3930		*tl++ = lp->nfsl_open->nfso_stateid.seqid;
3931	    *tl++ = lp->nfsl_open->nfso_stateid.other[0];
3932	    *tl++ = lp->nfsl_open->nfso_stateid.other[1];
3933	    *tl++ = lp->nfsl_open->nfso_stateid.other[2];
3934	    *tl++ = txdr_unsigned(lp->nfsl_seqid);
3935	    *tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
3936	    *tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
3937	    NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
3938	    NFSBCOPY(nfhp, &own[NFSV4CL_LOCKNAMELEN], fhlen);
3939	    (void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
3940	} else {
3941	    *tl = newnfs_false;
3942	    NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID + NFSX_UNSIGNED);
3943	    if (NFSHASNFSV4N(nmp))
3944		*tl++ = 0;
3945	    else
3946		*tl++ = lp->nfsl_stateid.seqid;
3947	    *tl++ = lp->nfsl_stateid.other[0];
3948	    *tl++ = lp->nfsl_stateid.other[1];
3949	    *tl++ = lp->nfsl_stateid.other[2];
3950	    *tl = txdr_unsigned(lp->nfsl_seqid);
3951	    if (nfstest_outofseq &&
3952		(arc4random() % nfstest_outofseq) == 0)
3953		    *tl = txdr_unsigned(lp->nfsl_seqid + 1);
3954	}
3955	if (syscred)
3956		nd->nd_flag |= ND_USEGSSNAME;
3957	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, vp, p, cred,
3958	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
3959	if (error)
3960		return (error);
3961	if (newone)
3962	    NFSCL_INCRSEQID(lp->nfsl_open->nfso_own->nfsow_seqid, nd);
3963	NFSCL_INCRSEQID(lp->nfsl_seqid, nd);
3964	if (nd->nd_repstat == 0) {
3965		NFSM_DISSECT(tl, u_int32_t *, NFSX_STATEID);
3966		lp->nfsl_stateid.seqid = *tl++;
3967		lp->nfsl_stateid.other[0] = *tl++;
3968		lp->nfsl_stateid.other[1] = *tl++;
3969		lp->nfsl_stateid.other[2] = *tl;
3970	} else if (nd->nd_repstat == NFSERR_DENIED) {
3971		NFSM_DISSECT(tl, u_int32_t *, 8 * NFSX_UNSIGNED);
3972		size = fxdr_unsigned(int, *(tl + 7));
3973		if (size < 0 || size > NFSV4_OPAQUELIMIT)
3974			error = EBADRPC;
3975		if (!error)
3976			error = nfsm_advance(nd, NFSM_RNDUP(size), -1);
3977	} else if (nd->nd_repstat == NFSERR_STALESTATEID ||
3978	    nd->nd_repstat == NFSERR_BADSESSION)
3979		nfscl_initiate_recovery(lp->nfsl_open->nfso_own->nfsow_clp);
3980nfsmout:
3981	mbuf_freem(nd->nd_mrep);
3982	return (error);
3983}
3984
3985/*
3986 * nfs statfs rpc
3987 * (always called with the vp for the mount point)
3988 */
3989APPLESTATIC int
3990nfsrpc_statfs(vnode_t vp, struct nfsstatfs *sbp, struct nfsfsinfo *fsp,
3991    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
3992    void *stuff)
3993{
3994	u_int32_t *tl = NULL;
3995	struct nfsrv_descript nfsd, *nd = &nfsd;
3996	struct nfsmount *nmp;
3997	nfsattrbit_t attrbits;
3998	int error;
3999
4000	*attrflagp = 0;
4001	nmp = VFSTONFS(vnode_mount(vp));
4002	if (NFSHASNFSV4(nmp)) {
4003		/*
4004		 * For V4, you actually do a getattr.
4005		 */
4006		NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4007		NFSSTATFS_GETATTRBIT(&attrbits);
4008		(void) nfsrv_putattrbit(nd, &attrbits);
4009		nd->nd_flag |= ND_USEGSSNAME;
4010		error = nfscl_request(nd, vp, p, cred, stuff);
4011		if (error)
4012			return (error);
4013		if (nd->nd_repstat == 0) {
4014			error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4015			    NULL, NULL, sbp, fsp, NULL, 0, NULL, NULL, NULL, p,
4016			    cred);
4017			if (!error) {
4018				nmp->nm_fsid[0] = nap->na_filesid[0];
4019				nmp->nm_fsid[1] = nap->na_filesid[1];
4020				NFSSETHASSETFSID(nmp);
4021				*attrflagp = 1;
4022			}
4023		} else {
4024			error = nd->nd_repstat;
4025		}
4026		if (error)
4027			goto nfsmout;
4028	} else {
4029		NFSCL_REQSTART(nd, NFSPROC_FSSTAT, vp);
4030		error = nfscl_request(nd, vp, p, cred, stuff);
4031		if (error)
4032			return (error);
4033		if (nd->nd_flag & ND_NFSV3) {
4034			error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4035			if (error)
4036				goto nfsmout;
4037		}
4038		if (nd->nd_repstat) {
4039			error = nd->nd_repstat;
4040			goto nfsmout;
4041		}
4042		NFSM_DISSECT(tl, u_int32_t *,
4043		    NFSX_STATFS(nd->nd_flag & ND_NFSV3));
4044	}
4045	if (NFSHASNFSV3(nmp)) {
4046		sbp->sf_tbytes = fxdr_hyper(tl); tl += 2;
4047		sbp->sf_fbytes = fxdr_hyper(tl); tl += 2;
4048		sbp->sf_abytes = fxdr_hyper(tl); tl += 2;
4049		sbp->sf_tfiles = fxdr_hyper(tl); tl += 2;
4050		sbp->sf_ffiles = fxdr_hyper(tl); tl += 2;
4051		sbp->sf_afiles = fxdr_hyper(tl); tl += 2;
4052		sbp->sf_invarsec = fxdr_unsigned(u_int32_t, *tl);
4053	} else if (NFSHASNFSV4(nmp) == 0) {
4054		sbp->sf_tsize = fxdr_unsigned(u_int32_t, *tl++);
4055		sbp->sf_bsize = fxdr_unsigned(u_int32_t, *tl++);
4056		sbp->sf_blocks = fxdr_unsigned(u_int32_t, *tl++);
4057		sbp->sf_bfree = fxdr_unsigned(u_int32_t, *tl++);
4058		sbp->sf_bavail = fxdr_unsigned(u_int32_t, *tl);
4059	}
4060nfsmout:
4061	mbuf_freem(nd->nd_mrep);
4062	return (error);
4063}
4064
4065/*
4066 * nfs pathconf rpc
4067 */
4068APPLESTATIC int
4069nfsrpc_pathconf(vnode_t vp, struct nfsv3_pathconf *pc,
4070    struct ucred *cred, NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp,
4071    void *stuff)
4072{
4073	struct nfsrv_descript nfsd, *nd = &nfsd;
4074	struct nfsmount *nmp;
4075	u_int32_t *tl;
4076	nfsattrbit_t attrbits;
4077	int error;
4078
4079	*attrflagp = 0;
4080	nmp = VFSTONFS(vnode_mount(vp));
4081	if (NFSHASNFSV4(nmp)) {
4082		/*
4083		 * For V4, you actually do a getattr.
4084		 */
4085		NFSCL_REQSTART(nd, NFSPROC_GETATTR, vp);
4086		NFSPATHCONF_GETATTRBIT(&attrbits);
4087		(void) nfsrv_putattrbit(nd, &attrbits);
4088		nd->nd_flag |= ND_USEGSSNAME;
4089		error = nfscl_request(nd, vp, p, cred, stuff);
4090		if (error)
4091			return (error);
4092		if (nd->nd_repstat == 0) {
4093			error = nfsv4_loadattr(nd, NULL, nap, NULL, NULL, 0,
4094			    pc, NULL, NULL, NULL, NULL, 0, NULL, NULL, NULL, p,
4095			    cred);
4096			if (!error)
4097				*attrflagp = 1;
4098		} else {
4099			error = nd->nd_repstat;
4100		}
4101	} else {
4102		NFSCL_REQSTART(nd, NFSPROC_PATHCONF, vp);
4103		error = nfscl_request(nd, vp, p, cred, stuff);
4104		if (error)
4105			return (error);
4106		error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4107		if (nd->nd_repstat && !error)
4108			error = nd->nd_repstat;
4109		if (!error) {
4110			NFSM_DISSECT(tl, u_int32_t *, NFSX_V3PATHCONF);
4111			pc->pc_linkmax = fxdr_unsigned(u_int32_t, *tl++);
4112			pc->pc_namemax = fxdr_unsigned(u_int32_t, *tl++);
4113			pc->pc_notrunc = fxdr_unsigned(u_int32_t, *tl++);
4114			pc->pc_chownrestricted =
4115			    fxdr_unsigned(u_int32_t, *tl++);
4116			pc->pc_caseinsensitive =
4117			    fxdr_unsigned(u_int32_t, *tl++);
4118			pc->pc_casepreserving = fxdr_unsigned(u_int32_t, *tl);
4119		}
4120	}
4121nfsmout:
4122	mbuf_freem(nd->nd_mrep);
4123	return (error);
4124}
4125
4126/*
4127 * nfs version 3 fsinfo rpc call
4128 */
4129APPLESTATIC int
4130nfsrpc_fsinfo(vnode_t vp, struct nfsfsinfo *fsp, struct ucred *cred,
4131    NFSPROC_T *p, struct nfsvattr *nap, int *attrflagp, void *stuff)
4132{
4133	u_int32_t *tl;
4134	struct nfsrv_descript nfsd, *nd = &nfsd;
4135	int error;
4136
4137	*attrflagp = 0;
4138	NFSCL_REQSTART(nd, NFSPROC_FSINFO, vp);
4139	error = nfscl_request(nd, vp, p, cred, stuff);
4140	if (error)
4141		return (error);
4142	error = nfscl_postop_attr(nd, nap, attrflagp, stuff);
4143	if (nd->nd_repstat && !error)
4144		error = nd->nd_repstat;
4145	if (!error) {
4146		NFSM_DISSECT(tl, u_int32_t *, NFSX_V3FSINFO);
4147		fsp->fs_rtmax = fxdr_unsigned(u_int32_t, *tl++);
4148		fsp->fs_rtpref = fxdr_unsigned(u_int32_t, *tl++);
4149		fsp->fs_rtmult = fxdr_unsigned(u_int32_t, *tl++);
4150		fsp->fs_wtmax = fxdr_unsigned(u_int32_t, *tl++);
4151		fsp->fs_wtpref = fxdr_unsigned(u_int32_t, *tl++);
4152		fsp->fs_wtmult = fxdr_unsigned(u_int32_t, *tl++);
4153		fsp->fs_dtpref = fxdr_unsigned(u_int32_t, *tl++);
4154		fsp->fs_maxfilesize = fxdr_hyper(tl);
4155		tl += 2;
4156		fxdr_nfsv3time(tl, &fsp->fs_timedelta);
4157		tl += 2;
4158		fsp->fs_properties = fxdr_unsigned(u_int32_t, *tl);
4159	}
4160nfsmout:
4161	mbuf_freem(nd->nd_mrep);
4162	return (error);
4163}
4164
4165/*
4166 * This function performs the Renew RPC.
4167 */
4168APPLESTATIC int
4169nfsrpc_renew(struct nfsclclient *clp, struct nfsclds *dsp, struct ucred *cred,
4170    NFSPROC_T *p)
4171{
4172	u_int32_t *tl;
4173	struct nfsrv_descript nfsd;
4174	struct nfsrv_descript *nd = &nfsd;
4175	struct nfsmount *nmp;
4176	int error;
4177	struct nfssockreq *nrp;
4178
4179	nmp = clp->nfsc_nmp;
4180	if (nmp == NULL)
4181		return (0);
4182	nfscl_reqstart(nd, NFSPROC_RENEW, nmp, NULL, 0, NULL,
4183	    &dsp->nfsclds_sess);
4184	if (!NFSHASNFSV4N(nmp)) {
4185		/* NFSv4.1 just uses a Sequence Op and not a Renew. */
4186		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4187		*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4188		*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4189	}
4190	nrp = dsp->nfsclds_sockp;
4191	if (nrp == NULL)
4192		/* If NULL, use the MDS socket. */
4193		nrp = &nmp->nm_sockreq;
4194	nd->nd_flag |= ND_USEGSSNAME;
4195	error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4196	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
4197	if (error)
4198		return (error);
4199	error = nd->nd_repstat;
4200	mbuf_freem(nd->nd_mrep);
4201	return (error);
4202}
4203
4204/*
4205 * This function performs the Releaselockowner RPC.
4206 */
4207APPLESTATIC int
4208nfsrpc_rellockown(struct nfsmount *nmp, struct nfscllockowner *lp,
4209    uint8_t *fh, int fhlen, struct ucred *cred, NFSPROC_T *p)
4210{
4211	struct nfsrv_descript nfsd, *nd = &nfsd;
4212	u_int32_t *tl;
4213	int error;
4214	uint8_t own[NFSV4CL_LOCKNAMELEN + NFSX_V4FHMAX];
4215
4216	if (NFSHASNFSV4N(nmp)) {
4217		/* For NFSv4.1, do a FreeStateID. */
4218		nfscl_reqstart(nd, NFSPROC_FREESTATEID, nmp, NULL, 0, NULL,
4219		    NULL);
4220		nfsm_stateidtom(nd, &lp->nfsl_stateid, NFSSTATEID_PUTSTATEID);
4221	} else {
4222		nfscl_reqstart(nd, NFSPROC_RELEASELCKOWN, nmp, NULL, 0, NULL,
4223		    NULL);
4224		NFSM_BUILD(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
4225		*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4226		*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4227		NFSBCOPY(lp->nfsl_owner, own, NFSV4CL_LOCKNAMELEN);
4228		NFSBCOPY(fh, &own[NFSV4CL_LOCKNAMELEN], fhlen);
4229		(void)nfsm_strtom(nd, own, NFSV4CL_LOCKNAMELEN + fhlen);
4230	}
4231	nd->nd_flag |= ND_USEGSSNAME;
4232	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4233	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4234	if (error)
4235		return (error);
4236	error = nd->nd_repstat;
4237	mbuf_freem(nd->nd_mrep);
4238	return (error);
4239}
4240
4241/*
4242 * This function performs the Compound to get the mount pt FH.
4243 */
4244APPLESTATIC int
4245nfsrpc_getdirpath(struct nfsmount *nmp, u_char *dirpath, struct ucred *cred,
4246    NFSPROC_T *p)
4247{
4248	u_int32_t *tl;
4249	struct nfsrv_descript nfsd;
4250	struct nfsrv_descript *nd = &nfsd;
4251	u_char *cp, *cp2;
4252	int error, cnt, len, setnil;
4253	u_int32_t *opcntp;
4254
4255	nfscl_reqstart(nd, NFSPROC_PUTROOTFH, nmp, NULL, 0, &opcntp, NULL);
4256	cp = dirpath;
4257	cnt = 0;
4258	do {
4259		setnil = 0;
4260		while (*cp == '/')
4261			cp++;
4262		cp2 = cp;
4263		while (*cp2 != '\0' && *cp2 != '/')
4264			cp2++;
4265		if (*cp2 == '/') {
4266			setnil = 1;
4267			*cp2 = '\0';
4268		}
4269		if (cp2 != cp) {
4270			NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4271			*tl = txdr_unsigned(NFSV4OP_LOOKUP);
4272			nfsm_strtom(nd, cp, strlen(cp));
4273			cnt++;
4274		}
4275		if (setnil)
4276			*cp2++ = '/';
4277		cp = cp2;
4278	} while (*cp != '\0');
4279	if (NFSHASNFSV4N(nmp))
4280		/* Has a Sequence Op done by nfscl_reqstart(). */
4281		*opcntp = txdr_unsigned(3 + cnt);
4282	else
4283		*opcntp = txdr_unsigned(2 + cnt);
4284	NFSM_BUILD(tl, u_int32_t *, NFSX_UNSIGNED);
4285	*tl = txdr_unsigned(NFSV4OP_GETFH);
4286	nd->nd_flag |= ND_USEGSSNAME;
4287	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4288		NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4289	if (error)
4290		return (error);
4291	if (nd->nd_repstat == 0) {
4292		NFSM_DISSECT(tl, u_int32_t *, (3 + 2 * cnt) * NFSX_UNSIGNED);
4293		tl += (2 + 2 * cnt);
4294		if ((len = fxdr_unsigned(int, *tl)) <= 0 ||
4295			len > NFSX_FHMAX) {
4296			nd->nd_repstat = NFSERR_BADXDR;
4297		} else {
4298			nd->nd_repstat = nfsrv_mtostr(nd, nmp->nm_fh, len);
4299			if (nd->nd_repstat == 0)
4300				nmp->nm_fhsize = len;
4301		}
4302	}
4303	error = nd->nd_repstat;
4304nfsmout:
4305	mbuf_freem(nd->nd_mrep);
4306	return (error);
4307}
4308
4309/*
4310 * This function performs the Delegreturn RPC.
4311 */
4312APPLESTATIC int
4313nfsrpc_delegreturn(struct nfscldeleg *dp, struct ucred *cred,
4314    struct nfsmount *nmp, NFSPROC_T *p, int syscred)
4315{
4316	u_int32_t *tl;
4317	struct nfsrv_descript nfsd;
4318	struct nfsrv_descript *nd = &nfsd;
4319	int error;
4320
4321	nfscl_reqstart(nd, NFSPROC_DELEGRETURN, nmp, dp->nfsdl_fh,
4322	    dp->nfsdl_fhlen, NULL, NULL);
4323	NFSM_BUILD(tl, u_int32_t *, NFSX_STATEID);
4324	if (NFSHASNFSV4N(nmp))
4325		*tl++ = 0;
4326	else
4327		*tl++ = dp->nfsdl_stateid.seqid;
4328	*tl++ = dp->nfsdl_stateid.other[0];
4329	*tl++ = dp->nfsdl_stateid.other[1];
4330	*tl = dp->nfsdl_stateid.other[2];
4331	if (syscred)
4332		nd->nd_flag |= ND_USEGSSNAME;
4333	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4334	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4335	if (error)
4336		return (error);
4337	error = nd->nd_repstat;
4338	mbuf_freem(nd->nd_mrep);
4339	return (error);
4340}
4341
4342/*
4343 * nfs getacl call.
4344 */
4345APPLESTATIC int
4346nfsrpc_getacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4347    struct acl *aclp, void *stuff)
4348{
4349	struct nfsrv_descript nfsd, *nd = &nfsd;
4350	int error;
4351	nfsattrbit_t attrbits;
4352	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4353
4354	if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4355		return (EOPNOTSUPP);
4356	NFSCL_REQSTART(nd, NFSPROC_GETACL, vp);
4357	NFSZERO_ATTRBIT(&attrbits);
4358	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4359	(void) nfsrv_putattrbit(nd, &attrbits);
4360	error = nfscl_request(nd, vp, p, cred, stuff);
4361	if (error)
4362		return (error);
4363	if (!nd->nd_repstat)
4364		error = nfsv4_loadattr(nd, vp, NULL, NULL, NULL, 0, NULL,
4365		    NULL, NULL, NULL, aclp, 0, NULL, NULL, NULL, p, cred);
4366	else
4367		error = nd->nd_repstat;
4368	mbuf_freem(nd->nd_mrep);
4369	return (error);
4370}
4371
4372/*
4373 * nfs setacl call.
4374 */
4375APPLESTATIC int
4376nfsrpc_setacl(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4377    struct acl *aclp, void *stuff)
4378{
4379	int error;
4380	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4381
4382	if (nfsrv_useacl == 0 || !NFSHASNFSV4(nmp))
4383		return (EOPNOTSUPP);
4384	error = nfsrpc_setattr(vp, NULL, aclp, cred, p, NULL, NULL, stuff);
4385	return (error);
4386}
4387
4388/*
4389 * nfs setacl call.
4390 */
4391static int
4392nfsrpc_setaclrpc(vnode_t vp, struct ucred *cred, NFSPROC_T *p,
4393    struct acl *aclp, nfsv4stateid_t *stateidp, void *stuff)
4394{
4395	struct nfsrv_descript nfsd, *nd = &nfsd;
4396	int error;
4397	nfsattrbit_t attrbits;
4398	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
4399
4400	if (!NFSHASNFSV4(nmp))
4401		return (EOPNOTSUPP);
4402	NFSCL_REQSTART(nd, NFSPROC_SETACL, vp);
4403	nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSTATEID);
4404	NFSZERO_ATTRBIT(&attrbits);
4405	NFSSETBIT_ATTRBIT(&attrbits, NFSATTRBIT_ACL);
4406	(void) nfsv4_fillattr(nd, vnode_mount(vp), vp, aclp, NULL, NULL, 0,
4407	    &attrbits, NULL, NULL, 0, 0, 0, 0, (uint64_t)0);
4408	error = nfscl_request(nd, vp, p, cred, stuff);
4409	if (error)
4410		return (error);
4411	/* Don't care about the pre/postop attributes */
4412	mbuf_freem(nd->nd_mrep);
4413	return (nd->nd_repstat);
4414}
4415
4416/*
4417 * Do the NFSv4.1 Exchange ID.
4418 */
4419int
4420nfsrpc_exchangeid(struct nfsmount *nmp, struct nfsclclient *clp,
4421    struct nfssockreq *nrp, uint32_t exchflags, struct nfsclds **dspp,
4422    struct ucred *cred, NFSPROC_T *p)
4423{
4424	uint32_t *tl, v41flags;
4425	struct nfsrv_descript nfsd;
4426	struct nfsrv_descript *nd = &nfsd;
4427	struct nfsclds *dsp;
4428	struct timespec verstime;
4429	int error, len;
4430
4431	*dspp = NULL;
4432	nfscl_reqstart(nd, NFSPROC_EXCHANGEID, nmp, NULL, 0, NULL, NULL);
4433	NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4434	*tl++ = txdr_unsigned(nfsboottime.tv_sec);	/* Client owner */
4435	*tl = txdr_unsigned(clp->nfsc_rev);
4436	(void) nfsm_strtom(nd, clp->nfsc_id, clp->nfsc_idlen);
4437
4438	NFSM_BUILD(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4439	*tl++ = txdr_unsigned(exchflags);
4440	*tl++ = txdr_unsigned(NFSV4EXCH_SP4NONE);
4441
4442	/* Set the implementation id4 */
4443	*tl = txdr_unsigned(1);
4444	(void) nfsm_strtom(nd, "freebsd.org", strlen("freebsd.org"));
4445	(void) nfsm_strtom(nd, version, strlen(version));
4446	NFSM_BUILD(tl, uint32_t *, NFSX_V4TIME);
4447	verstime.tv_sec = 1293840000;		/* Jan 1, 2011 */
4448	verstime.tv_nsec = 0;
4449	txdr_nfsv4time(&verstime, tl);
4450	nd->nd_flag |= ND_USEGSSNAME;
4451	error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred,
4452	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4453	NFSCL_DEBUG(1, "exchangeid err=%d reps=%d\n", error,
4454	    (int)nd->nd_repstat);
4455	if (error != 0)
4456		return (error);
4457	if (nd->nd_repstat == 0) {
4458		NFSM_DISSECT(tl, uint32_t *, 6 * NFSX_UNSIGNED + NFSX_HYPER);
4459		len = fxdr_unsigned(int, *(tl + 7));
4460		if (len < 0 || len > NFSV4_OPAQUELIMIT) {
4461			error = NFSERR_BADXDR;
4462			goto nfsmout;
4463		}
4464		dsp = malloc(sizeof(struct nfsclds) + len, M_NFSCLDS,
4465		    M_WAITOK | M_ZERO);
4466		dsp->nfsclds_expire = NFSD_MONOSEC + clp->nfsc_renew;
4467		dsp->nfsclds_servownlen = len;
4468		dsp->nfsclds_sess.nfsess_clientid.lval[0] = *tl++;
4469		dsp->nfsclds_sess.nfsess_clientid.lval[1] = *tl++;
4470		dsp->nfsclds_sess.nfsess_sequenceid =
4471		    fxdr_unsigned(uint32_t, *tl++);
4472		v41flags = fxdr_unsigned(uint32_t, *tl);
4473		if ((v41flags & NFSV4EXCH_USEPNFSMDS) != 0 &&
4474		    NFSHASPNFSOPT(nmp)) {
4475			NFSCL_DEBUG(1, "set PNFS\n");
4476			NFSLOCKMNT(nmp);
4477			nmp->nm_state |= NFSSTA_PNFS;
4478			NFSUNLOCKMNT(nmp);
4479			dsp->nfsclds_flags |= NFSCLDS_MDS;
4480		}
4481		if ((v41flags & NFSV4EXCH_USEPNFSDS) != 0)
4482			dsp->nfsclds_flags |= NFSCLDS_DS;
4483		if (len > 0)
4484			nd->nd_repstat = nfsrv_mtostr(nd,
4485			    dsp->nfsclds_serverown, len);
4486		if (nd->nd_repstat == 0) {
4487			mtx_init(&dsp->nfsclds_mtx, "nfsds", NULL, MTX_DEF);
4488			mtx_init(&dsp->nfsclds_sess.nfsess_mtx, "nfssession",
4489			    NULL, MTX_DEF);
4490			nfscl_initsessionslots(&dsp->nfsclds_sess);
4491			*dspp = dsp;
4492		} else
4493			free(dsp, M_NFSCLDS);
4494	}
4495	error = nd->nd_repstat;
4496nfsmout:
4497	mbuf_freem(nd->nd_mrep);
4498	return (error);
4499}
4500
4501/*
4502 * Do the NFSv4.1 Create Session.
4503 */
4504int
4505nfsrpc_createsession(struct nfsmount *nmp, struct nfsclsession *sep,
4506    struct nfssockreq *nrp, uint32_t sequenceid, int mds, struct ucred *cred,
4507    NFSPROC_T *p)
4508{
4509	uint32_t crflags, *tl;
4510	struct nfsrv_descript nfsd;
4511	struct nfsrv_descript *nd = &nfsd;
4512	int error, irdcnt;
4513
4514	nfscl_reqstart(nd, NFSPROC_CREATESESSION, nmp, NULL, 0, NULL, NULL);
4515	NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
4516	*tl++ = sep->nfsess_clientid.lval[0];
4517	*tl++ = sep->nfsess_clientid.lval[1];
4518	*tl++ = txdr_unsigned(sequenceid);
4519	crflags = (NFSMNT_RDONLY(nmp->nm_mountp) ? 0 : NFSV4CRSESS_PERSIST);
4520	if (nfscl_enablecallb != 0 && nfs_numnfscbd > 0)
4521		crflags |= NFSV4CRSESS_CONNBACKCHAN;
4522	*tl = txdr_unsigned(crflags);
4523
4524	/* Fill in fore channel attributes. */
4525	NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4526	*tl++ = 0;				/* Header pad size */
4527	*tl++ = txdr_unsigned(100000);		/* Max request size */
4528	*tl++ = txdr_unsigned(100000);		/* Max response size */
4529	*tl++ = txdr_unsigned(4096);		/* Max response size cached */
4530	*tl++ = txdr_unsigned(20);		/* Max operations */
4531	*tl++ = txdr_unsigned(64);		/* Max slots */
4532	*tl = 0;				/* No rdma ird */
4533
4534	/* Fill in back channel attributes. */
4535	NFSM_BUILD(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4536	*tl++ = 0;				/* Header pad size */
4537	*tl++ = txdr_unsigned(10000);		/* Max request size */
4538	*tl++ = txdr_unsigned(10000);		/* Max response size */
4539	*tl++ = txdr_unsigned(4096);		/* Max response size cached */
4540	*tl++ = txdr_unsigned(4);		/* Max operations */
4541	*tl++ = txdr_unsigned(NFSV4_CBSLOTS);	/* Max slots */
4542	*tl = 0;				/* No rdma ird */
4543
4544	NFSM_BUILD(tl, uint32_t *, 8 * NFSX_UNSIGNED);
4545	*tl++ = txdr_unsigned(NFS_CALLBCKPROG);	/* Call back prog # */
4546
4547	/* Allow AUTH_SYS callbacks as uid, gid == 0. */
4548	*tl++ = txdr_unsigned(1);		/* Auth_sys only */
4549	*tl++ = txdr_unsigned(AUTH_SYS);	/* AUTH_SYS type */
4550	*tl++ = txdr_unsigned(nfsboottime.tv_sec); /* time stamp */
4551	*tl++ = 0;				/* Null machine name */
4552	*tl++ = 0;				/* Uid == 0 */
4553	*tl++ = 0;				/* Gid == 0 */
4554	*tl = 0;				/* No additional gids */
4555	nd->nd_flag |= ND_USEGSSNAME;
4556	error = newnfs_request(nd, nmp, NULL, nrp, NULL, p, cred, NFS_PROG,
4557	    NFS_VER4, NULL, 1, NULL, NULL);
4558	if (error != 0)
4559		return (error);
4560	if (nd->nd_repstat == 0) {
4561		NFSM_DISSECT(tl, uint32_t *, NFSX_V4SESSIONID +
4562		    2 * NFSX_UNSIGNED);
4563		bcopy(tl, sep->nfsess_sessionid, NFSX_V4SESSIONID);
4564		tl += NFSX_V4SESSIONID / NFSX_UNSIGNED;
4565		sep->nfsess_sequenceid = fxdr_unsigned(uint32_t, *tl++);
4566		crflags = fxdr_unsigned(uint32_t, *tl);
4567		if ((crflags & NFSV4CRSESS_PERSIST) != 0 && mds != 0) {
4568			NFSLOCKMNT(nmp);
4569			nmp->nm_state |= NFSSTA_SESSPERSIST;
4570			NFSUNLOCKMNT(nmp);
4571		}
4572
4573		/* Get the fore channel slot count. */
4574		NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4575		tl += 3;		/* Skip the other counts. */
4576		sep->nfsess_maxcache = fxdr_unsigned(int, *tl++);
4577		tl++;
4578		sep->nfsess_foreslots = fxdr_unsigned(uint16_t, *tl++);
4579		NFSCL_DEBUG(4, "fore slots=%d\n", (int)sep->nfsess_foreslots);
4580		irdcnt = fxdr_unsigned(int, *tl);
4581		if (irdcnt > 0)
4582			NFSM_DISSECT(tl, uint32_t *, irdcnt * NFSX_UNSIGNED);
4583
4584		/* and the back channel slot count. */
4585		NFSM_DISSECT(tl, uint32_t *, 7 * NFSX_UNSIGNED);
4586		tl += 5;
4587		sep->nfsess_backslots = fxdr_unsigned(uint16_t, *tl);
4588		NFSCL_DEBUG(4, "back slots=%d\n", (int)sep->nfsess_backslots);
4589	}
4590	error = nd->nd_repstat;
4591nfsmout:
4592	mbuf_freem(nd->nd_mrep);
4593	return (error);
4594}
4595
4596/*
4597 * Do the NFSv4.1 Destroy Session.
4598 */
4599int
4600nfsrpc_destroysession(struct nfsmount *nmp, struct nfsclclient *clp,
4601    struct ucred *cred, NFSPROC_T *p)
4602{
4603	uint32_t *tl;
4604	struct nfsrv_descript nfsd;
4605	struct nfsrv_descript *nd = &nfsd;
4606	int error;
4607
4608	nfscl_reqstart(nd, NFSPROC_DESTROYSESSION, nmp, NULL, 0, NULL, NULL);
4609	NFSM_BUILD(tl, uint32_t *, NFSX_V4SESSIONID);
4610	bcopy(NFSMNT_MDSSESSION(nmp)->nfsess_sessionid, tl, NFSX_V4SESSIONID);
4611	nd->nd_flag |= ND_USEGSSNAME;
4612	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4613	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4614	if (error != 0)
4615		return (error);
4616	error = nd->nd_repstat;
4617	mbuf_freem(nd->nd_mrep);
4618	return (error);
4619}
4620
4621/*
4622 * Do the NFSv4.1 Destroy Client.
4623 */
4624int
4625nfsrpc_destroyclient(struct nfsmount *nmp, struct nfsclclient *clp,
4626    struct ucred *cred, NFSPROC_T *p)
4627{
4628	uint32_t *tl;
4629	struct nfsrv_descript nfsd;
4630	struct nfsrv_descript *nd = &nfsd;
4631	int error;
4632
4633	nfscl_reqstart(nd, NFSPROC_DESTROYCLIENT, nmp, NULL, 0, NULL, NULL);
4634	NFSM_BUILD(tl, uint32_t *, 2 * NFSX_UNSIGNED);
4635	*tl++ = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[0];
4636	*tl = NFSMNT_MDSSESSION(nmp)->nfsess_clientid.lval[1];
4637	nd->nd_flag |= ND_USEGSSNAME;
4638	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4639	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4640	if (error != 0)
4641		return (error);
4642	error = nd->nd_repstat;
4643	mbuf_freem(nd->nd_mrep);
4644	return (error);
4645}
4646
4647/*
4648 * Do the NFSv4.1 LayoutGet.
4649 */
4650int
4651nfsrpc_layoutget(struct nfsmount *nmp, uint8_t *fhp, int fhlen, int iomode,
4652    uint64_t offset, uint64_t len, uint64_t minlen, int layoutlen,
4653    nfsv4stateid_t *stateidp, int *retonclosep, struct nfsclflayouthead *flhp,
4654    struct ucred *cred, NFSPROC_T *p, void *stuff)
4655{
4656	uint32_t *tl;
4657	struct nfsrv_descript nfsd, *nd = &nfsd;
4658	struct nfsfh *nfhp;
4659	struct nfsclflayout *flp, *prevflp, *tflp;
4660	int cnt, error, gotiomode, fhcnt, nfhlen, i, j;
4661	uint8_t *cp;
4662	uint64_t retlen;
4663
4664	flp = NULL;
4665	gotiomode = -1;
4666	nfscl_reqstart(nd, NFSPROC_LAYOUTGET, nmp, fhp, fhlen, NULL, NULL);
4667	NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
4668	    NFSX_STATEID);
4669	*tl++ = newnfs_false;		/* Don't signal availability. */
4670	*tl++ = txdr_unsigned(NFSLAYOUT_NFSV4_1_FILES);
4671	*tl++ = txdr_unsigned(iomode);
4672	txdr_hyper(offset, tl);
4673	tl += 2;
4674	txdr_hyper(len, tl);
4675	tl += 2;
4676	txdr_hyper(minlen, tl);
4677	tl += 2;
4678	*tl++ = txdr_unsigned(stateidp->seqid);
4679	NFSCL_DEBUG(4, "layget seq=%d\n", (int)stateidp->seqid);
4680	*tl++ = stateidp->other[0];
4681	*tl++ = stateidp->other[1];
4682	*tl++ = stateidp->other[2];
4683	*tl = txdr_unsigned(layoutlen);
4684	nd->nd_flag |= ND_USEGSSNAME;
4685	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4686	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4687	if (error != 0)
4688		return (error);
4689	if (nd->nd_repstat == 0) {
4690		NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_STATEID);
4691		if (*tl++ != 0)
4692			*retonclosep = 1;
4693		else
4694			*retonclosep = 0;
4695		stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
4696		NFSCL_DEBUG(4, "retoncls=%d stseq=%d\n", *retonclosep,
4697		    (int)stateidp->seqid);
4698		stateidp->other[0] = *tl++;
4699		stateidp->other[1] = *tl++;
4700		stateidp->other[2] = *tl++;
4701		cnt = fxdr_unsigned(int, *tl);
4702		NFSCL_DEBUG(4, "layg cnt=%d\n", cnt);
4703		if (cnt <= 0 || cnt > 10000) {
4704			/* Don't accept more than 10000 layouts in reply. */
4705			error = NFSERR_BADXDR;
4706			goto nfsmout;
4707		}
4708		for (i = 0; i < cnt; i++) {
4709			/* Dissect all the way to the file handle cnt. */
4710			NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_HYPER +
4711			    6 * NFSX_UNSIGNED + NFSX_V4DEVICEID);
4712			fhcnt = fxdr_unsigned(int, *(tl + 11 +
4713			    NFSX_V4DEVICEID / NFSX_UNSIGNED));
4714			NFSCL_DEBUG(4, "fhcnt=%d\n", fhcnt);
4715			if (fhcnt < 0 || fhcnt > 100) {
4716				/* Don't accept more than 100 file handles. */
4717				error = NFSERR_BADXDR;
4718				goto nfsmout;
4719			}
4720			if (fhcnt > 1)
4721				flp = malloc(sizeof(*flp) + (fhcnt - 1) *
4722				    sizeof(struct nfsfh *),
4723				    M_NFSFLAYOUT, M_WAITOK);
4724			else
4725				flp = malloc(sizeof(*flp),
4726				    M_NFSFLAYOUT, M_WAITOK);
4727			flp->nfsfl_flags = 0;
4728			flp->nfsfl_fhcnt = 0;
4729			flp->nfsfl_devp = NULL;
4730			flp->nfsfl_off = fxdr_hyper(tl); tl += 2;
4731			retlen = fxdr_hyper(tl); tl += 2;
4732			if (flp->nfsfl_off + retlen < flp->nfsfl_off)
4733				flp->nfsfl_end = UINT64_MAX - flp->nfsfl_off;
4734			else
4735				flp->nfsfl_end = flp->nfsfl_off + retlen;
4736			flp->nfsfl_iomode = fxdr_unsigned(int, *tl++);
4737			if (gotiomode == -1)
4738				gotiomode = flp->nfsfl_iomode;
4739			NFSCL_DEBUG(4, "layg reqiom=%d retiom=%d\n", iomode,
4740			    (int)flp->nfsfl_iomode);
4741			if (fxdr_unsigned(int, *tl++) !=
4742			    NFSLAYOUT_NFSV4_1_FILES) {
4743				printf("NFSv4.1: got non-files layout\n");
4744				error = NFSERR_BADXDR;
4745				goto nfsmout;
4746			}
4747			NFSBCOPY(++tl, flp->nfsfl_dev, NFSX_V4DEVICEID);
4748			tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4749			flp->nfsfl_util = fxdr_unsigned(uint32_t, *tl++);
4750			NFSCL_DEBUG(4, "flutil=0x%x\n", flp->nfsfl_util);
4751			flp->nfsfl_stripe1 = fxdr_unsigned(uint32_t, *tl++);
4752			flp->nfsfl_patoff = fxdr_hyper(tl); tl += 2;
4753			if (fxdr_unsigned(int, *tl) != fhcnt) {
4754				printf("EEK! bad fhcnt\n");
4755				error = NFSERR_BADXDR;
4756				goto nfsmout;
4757			}
4758			for (j = 0; j < fhcnt; j++) {
4759				NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4760				nfhlen = fxdr_unsigned(int, *tl);
4761				if (nfhlen <= 0 || nfhlen > NFSX_V4FHMAX) {
4762					error = NFSERR_BADXDR;
4763					goto nfsmout;
4764				}
4765				nfhp = malloc(sizeof(*nfhp) + nfhlen - 1,
4766				    M_NFSFH, M_WAITOK);
4767				flp->nfsfl_fh[j] = nfhp;
4768				flp->nfsfl_fhcnt++;
4769				nfhp->nfh_len = nfhlen;
4770				NFSM_DISSECT(cp, uint8_t *, NFSM_RNDUP(nfhlen));
4771				NFSBCOPY(cp, nfhp->nfh_fh, nfhlen);
4772			}
4773			if (flp->nfsfl_iomode == gotiomode) {
4774				/* Keep the list in increasing offset order. */
4775				tflp = LIST_FIRST(flhp);
4776				prevflp = NULL;
4777				while (tflp != NULL &&
4778				    tflp->nfsfl_off < flp->nfsfl_off) {
4779					prevflp = tflp;
4780					tflp = LIST_NEXT(tflp, nfsfl_list);
4781				}
4782				if (prevflp == NULL)
4783					LIST_INSERT_HEAD(flhp, flp, nfsfl_list);
4784				else
4785					LIST_INSERT_AFTER(prevflp, flp,
4786					    nfsfl_list);
4787			} else {
4788				printf("nfscl_layoutget(): got wrong iomode\n");
4789				nfscl_freeflayout(flp);
4790			}
4791			flp = NULL;
4792		}
4793	}
4794	if (nd->nd_repstat != 0 && error == 0)
4795		error = nd->nd_repstat;
4796nfsmout:
4797	if (error != 0 && flp != NULL)
4798		nfscl_freeflayout(flp);
4799	mbuf_freem(nd->nd_mrep);
4800	return (error);
4801}
4802
4803/*
4804 * Do the NFSv4.1 Get Device Info.
4805 */
4806int
4807nfsrpc_getdeviceinfo(struct nfsmount *nmp, uint8_t *deviceid, int layouttype,
4808    uint32_t *notifybitsp, struct nfscldevinfo **ndip, struct ucred *cred,
4809    NFSPROC_T *p)
4810{
4811	uint32_t cnt, *tl;
4812	struct nfsrv_descript nfsd;
4813	struct nfsrv_descript *nd = &nfsd;
4814	struct sockaddr_storage ss;
4815	struct nfsclds *dsp = NULL, **dspp;
4816	struct nfscldevinfo *ndi;
4817	int addrcnt, bitcnt, error, i, isudp, j, pos, safilled, stripecnt;
4818	uint8_t stripeindex;
4819
4820	*ndip = NULL;
4821	ndi = NULL;
4822	nfscl_reqstart(nd, NFSPROC_GETDEVICEINFO, nmp, NULL, 0, NULL, NULL);
4823	NFSM_BUILD(tl, uint32_t *, NFSX_V4DEVICEID + 3 * NFSX_UNSIGNED);
4824	NFSBCOPY(deviceid, tl, NFSX_V4DEVICEID);
4825	tl += (NFSX_V4DEVICEID / NFSX_UNSIGNED);
4826	*tl++ = txdr_unsigned(layouttype);
4827	*tl++ = txdr_unsigned(100000);
4828	if (notifybitsp != NULL && *notifybitsp != 0) {
4829		*tl = txdr_unsigned(1);		/* One word of bits. */
4830		NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
4831		*tl = txdr_unsigned(*notifybitsp);
4832	} else
4833		*tl = txdr_unsigned(0);
4834	nd->nd_flag |= ND_USEGSSNAME;
4835	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
4836	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
4837	if (error != 0)
4838		return (error);
4839	if (nd->nd_repstat == 0) {
4840		NFSM_DISSECT(tl, uint32_t *, 3 * NFSX_UNSIGNED);
4841		if (layouttype != fxdr_unsigned(int, *tl++))
4842			printf("EEK! devinfo layout type not same!\n");
4843		stripecnt = fxdr_unsigned(int, *++tl);
4844		NFSCL_DEBUG(4, "stripecnt=%d\n", stripecnt);
4845		if (stripecnt < 1 || stripecnt > 4096) {
4846			printf("NFS devinfo stripecnt %d: out of range\n",
4847			    stripecnt);
4848			error = NFSERR_BADXDR;
4849			goto nfsmout;
4850		}
4851		NFSM_DISSECT(tl, uint32_t *, (stripecnt + 1) * NFSX_UNSIGNED);
4852		addrcnt = fxdr_unsigned(int, *(tl + stripecnt));
4853		NFSCL_DEBUG(4, "addrcnt=%d\n", addrcnt);
4854		if (addrcnt < 1 || addrcnt > 128) {
4855			printf("NFS devinfo addrcnt %d: out of range\n",
4856			    addrcnt);
4857			error = NFSERR_BADXDR;
4858			goto nfsmout;
4859		}
4860
4861		/*
4862		 * Now we know how many stripe indices and addresses, so
4863		 * we can allocate the structure the correct size.
4864		 */
4865		i = (stripecnt * sizeof(uint8_t)) / sizeof(struct nfsclds *)
4866		    + 1;
4867		NFSCL_DEBUG(4, "stripeindices=%d\n", i);
4868		ndi = malloc(sizeof(*ndi) + (addrcnt + i) *
4869		    sizeof(struct nfsclds *), M_NFSDEVINFO, M_WAITOK | M_ZERO);
4870		NFSBCOPY(deviceid, ndi->nfsdi_deviceid, NFSX_V4DEVICEID);
4871		ndi->nfsdi_refcnt = 0;
4872		ndi->nfsdi_stripecnt = stripecnt;
4873		ndi->nfsdi_addrcnt = addrcnt;
4874		/* Fill in the stripe indices. */
4875		for (i = 0; i < stripecnt; i++) {
4876			stripeindex = fxdr_unsigned(uint8_t, *tl++);
4877			NFSCL_DEBUG(4, "stripeind=%d\n", stripeindex);
4878			if (stripeindex >= addrcnt) {
4879				printf("NFS devinfo stripeindex %d: too big\n",
4880				    (int)stripeindex);
4881				error = NFSERR_BADXDR;
4882				goto nfsmout;
4883			}
4884			nfsfldi_setstripeindex(ndi, i, stripeindex);
4885		}
4886
4887		/* Now, dissect the server address(es). */
4888		safilled = 0;
4889		for (i = 0; i < addrcnt; i++) {
4890			NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4891			cnt = fxdr_unsigned(uint32_t, *tl);
4892			if (cnt == 0) {
4893				printf("NFS devinfo 0 len addrlist\n");
4894				error = NFSERR_BADXDR;
4895				goto nfsmout;
4896			}
4897			dspp = nfsfldi_addr(ndi, i);
4898			pos = arc4random() % cnt;	/* Choose one. */
4899			safilled = 0;
4900			for (j = 0; j < cnt; j++) {
4901				error = nfsv4_getipaddr(nd, &ss, &isudp);
4902				if (error != 0 && error != EPERM) {
4903					error = NFSERR_BADXDR;
4904					goto nfsmout;
4905				}
4906				if (error == 0 && isudp == 0) {
4907					/*
4908					 * The algorithm is:
4909					 * - use "pos" entry if it is of the
4910					 *   same af_family or none of them
4911					 *   is of the same af_family
4912					 * else
4913					 * - use the first one of the same
4914					 *   af_family.
4915					 */
4916					if ((safilled == 0 && ss.ss_family ==
4917					     nmp->nm_nam->sa_family) ||
4918					    (j == pos &&
4919					     (safilled == 0 || ss.ss_family ==
4920					      nmp->nm_nam->sa_family)) ||
4921					    (safilled == 1 && ss.ss_family ==
4922					     nmp->nm_nam->sa_family)) {
4923						error = nfsrpc_fillsa(nmp, &ss,
4924						    &dsp, p);
4925						if (error == 0) {
4926							*dspp = dsp;
4927							if (ss.ss_family ==
4928							 nmp->nm_nam->sa_family)
4929								safilled = 2;
4930							else
4931								safilled = 1;
4932						}
4933					}
4934				}
4935			}
4936			if (safilled == 0)
4937				break;
4938		}
4939
4940		/* And the notify bits. */
4941		NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4942		if (safilled != 0) {
4943			bitcnt = fxdr_unsigned(int, *tl);
4944			if (bitcnt > 0) {
4945				NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
4946				if (notifybitsp != NULL)
4947					*notifybitsp =
4948					    fxdr_unsigned(uint32_t, *tl);
4949			}
4950			*ndip = ndi;
4951		} else
4952			error = EPERM;
4953	}
4954	if (nd->nd_repstat != 0)
4955		error = nd->nd_repstat;
4956nfsmout:
4957	if (error != 0 && ndi != NULL)
4958		nfscl_freedevinfo(ndi);
4959	mbuf_freem(nd->nd_mrep);
4960	return (error);
4961}
4962
4963/*
4964 * Do the NFSv4.1 LayoutCommit.
4965 */
4966int
4967nfsrpc_layoutcommit(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
4968    uint64_t off, uint64_t len, uint64_t lastbyte, nfsv4stateid_t *stateidp,
4969    int layouttype, int layoutupdatecnt, uint8_t *layp, struct ucred *cred,
4970    NFSPROC_T *p, void *stuff)
4971{
4972	uint32_t *tl;
4973	struct nfsrv_descript nfsd, *nd = &nfsd;
4974	int error, outcnt, i;
4975	uint8_t *cp;
4976
4977	nfscl_reqstart(nd, NFSPROC_LAYOUTCOMMIT, nmp, fh, fhlen, NULL, NULL);
4978	NFSM_BUILD(tl, uint32_t *, 5 * NFSX_UNSIGNED + 3 * NFSX_HYPER +
4979	    NFSX_STATEID);
4980	txdr_hyper(off, tl);
4981	tl += 2;
4982	txdr_hyper(len, tl);
4983	tl += 2;
4984	if (reclaim != 0)
4985		*tl++ = newnfs_true;
4986	else
4987		*tl++ = newnfs_false;
4988	*tl++ = txdr_unsigned(stateidp->seqid);
4989	*tl++ = stateidp->other[0];
4990	*tl++ = stateidp->other[1];
4991	*tl++ = stateidp->other[2];
4992	*tl++ = newnfs_true;
4993	if (lastbyte < off)
4994		lastbyte = off;
4995	else if (lastbyte >= (off + len))
4996		lastbyte = off + len - 1;
4997	txdr_hyper(lastbyte, tl);
4998	tl += 2;
4999	*tl++ = newnfs_false;
5000	*tl++ = txdr_unsigned(layouttype);
5001	*tl = txdr_unsigned(layoutupdatecnt);
5002	if (layoutupdatecnt > 0) {
5003		KASSERT(layouttype != NFSLAYOUT_NFSV4_1_FILES,
5004		    ("Must be nil for Files Layout"));
5005		outcnt = NFSM_RNDUP(layoutupdatecnt);
5006		NFSM_BUILD(cp, uint8_t *, outcnt);
5007		NFSBCOPY(layp, cp, layoutupdatecnt);
5008		cp += layoutupdatecnt;
5009		for (i = 0; i < (outcnt - layoutupdatecnt); i++)
5010			*cp++ = 0x0;
5011	}
5012	nd->nd_flag |= ND_USEGSSNAME;
5013	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5014	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5015	if (error != 0)
5016		return (error);
5017	error = nd->nd_repstat;
5018	mbuf_freem(nd->nd_mrep);
5019	return (error);
5020}
5021
5022/*
5023 * Do the NFSv4.1 LayoutReturn.
5024 */
5025int
5026nfsrpc_layoutreturn(struct nfsmount *nmp, uint8_t *fh, int fhlen, int reclaim,
5027    int layouttype, uint32_t iomode, int layoutreturn, uint64_t offset,
5028    uint64_t len, nfsv4stateid_t *stateidp, int layoutcnt, uint32_t *layp,
5029    struct ucred *cred, NFSPROC_T *p, void *stuff)
5030{
5031	uint32_t *tl;
5032	struct nfsrv_descript nfsd, *nd = &nfsd;
5033	int error, outcnt, i;
5034	uint8_t *cp;
5035
5036	nfscl_reqstart(nd, NFSPROC_LAYOUTRETURN, nmp, fh, fhlen, NULL, NULL);
5037	NFSM_BUILD(tl, uint32_t *, 4 * NFSX_UNSIGNED);
5038	if (reclaim != 0)
5039		*tl++ = newnfs_true;
5040	else
5041		*tl++ = newnfs_false;
5042	*tl++ = txdr_unsigned(layouttype);
5043	*tl++ = txdr_unsigned(iomode);
5044	*tl = txdr_unsigned(layoutreturn);
5045	if (layoutreturn == NFSLAYOUTRETURN_FILE) {
5046		NFSM_BUILD(tl, uint32_t *, 2 * NFSX_HYPER + NFSX_STATEID +
5047		    NFSX_UNSIGNED);
5048		txdr_hyper(offset, tl);
5049		tl += 2;
5050		txdr_hyper(len, tl);
5051		tl += 2;
5052		NFSCL_DEBUG(4, "layoutret stseq=%d\n", (int)stateidp->seqid);
5053		*tl++ = txdr_unsigned(stateidp->seqid);
5054		*tl++ = stateidp->other[0];
5055		*tl++ = stateidp->other[1];
5056		*tl++ = stateidp->other[2];
5057		*tl = txdr_unsigned(layoutcnt);
5058		if (layoutcnt > 0) {
5059			outcnt = NFSM_RNDUP(layoutcnt);
5060			NFSM_BUILD(cp, uint8_t *, outcnt);
5061			NFSBCOPY(layp, cp, layoutcnt);
5062			cp += layoutcnt;
5063			for (i = 0; i < (outcnt - layoutcnt); i++)
5064				*cp++ = 0x0;
5065		}
5066	}
5067	nd->nd_flag |= ND_USEGSSNAME;
5068	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5069	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5070	if (error != 0)
5071		return (error);
5072	if (nd->nd_repstat == 0) {
5073		NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5074		if (*tl != 0) {
5075			NFSM_DISSECT(tl, uint32_t *, NFSX_STATEID);
5076			stateidp->seqid = fxdr_unsigned(uint32_t, *tl++);
5077			stateidp->other[0] = *tl++;
5078			stateidp->other[1] = *tl++;
5079			stateidp->other[2] = *tl;
5080		}
5081	} else
5082		error = nd->nd_repstat;
5083nfsmout:
5084	mbuf_freem(nd->nd_mrep);
5085	return (error);
5086}
5087
5088/*
5089 * Acquire a layout and devinfo, if possible. The caller must have acquired
5090 * a reference count on the nfsclclient structure before calling this.
5091 * Return the layout in lypp with a reference count on it, if successful.
5092 */
5093static int
5094nfsrpc_getlayout(struct nfsmount *nmp, vnode_t vp, struct nfsfh *nfhp,
5095    int iomode, uint32_t *notifybitsp, nfsv4stateid_t *stateidp, uint64_t off,
5096    struct nfscllayout **lypp, struct ucred *cred, NFSPROC_T *p)
5097{
5098	struct nfscllayout *lyp;
5099	struct nfsclflayout *flp, *tflp;
5100	struct nfscldevinfo *dip;
5101	struct nfsclflayouthead flh;
5102	int error = 0, islocked, layoutlen, recalled, retonclose;
5103	nfsv4stateid_t stateid;
5104
5105	*lypp = NULL;
5106	/*
5107	 * If lyp is returned non-NULL, there will be a refcnt (shared lock)
5108	 * on it, iff flp != NULL or a lock (exclusive lock) on it iff
5109	 * flp == NULL.
5110	 */
5111	lyp = nfscl_getlayout(nmp->nm_clp, nfhp->nfh_fh, nfhp->nfh_len,
5112	    off, &flp, &recalled);
5113	islocked = 0;
5114	if (lyp == NULL || flp == NULL) {
5115		if (recalled != 0)
5116			return (EIO);
5117		LIST_INIT(&flh);
5118		layoutlen = NFSMNT_MDSSESSION(nmp)->nfsess_maxcache -
5119		    (NFSX_STATEID + 3 * NFSX_UNSIGNED);
5120		if (lyp == NULL) {
5121			stateid.seqid = 0;
5122			stateid.other[0] = stateidp->other[0];
5123			stateid.other[1] = stateidp->other[1];
5124			stateid.other[2] = stateidp->other[2];
5125			error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5126			    nfhp->nfh_len, iomode, (uint64_t)0, INT64_MAX,
5127			    (uint64_t)0, layoutlen, &stateid, &retonclose,
5128			    &flh, cred, p, NULL);
5129		} else {
5130			islocked = 1;
5131			stateid.seqid = lyp->nfsly_stateid.seqid;
5132			stateid.other[0] = lyp->nfsly_stateid.other[0];
5133			stateid.other[1] = lyp->nfsly_stateid.other[1];
5134			stateid.other[2] = lyp->nfsly_stateid.other[2];
5135			error = nfsrpc_layoutget(nmp, nfhp->nfh_fh,
5136			    nfhp->nfh_len, iomode, off, INT64_MAX,
5137			    (uint64_t)0, layoutlen, &stateid, &retonclose,
5138			    &flh, cred, p, NULL);
5139		}
5140		if (error == 0)
5141			LIST_FOREACH(tflp, &flh, nfsfl_list) {
5142				error = nfscl_adddevinfo(nmp, NULL, tflp);
5143				if (error != 0) {
5144					error = nfsrpc_getdeviceinfo(nmp,
5145					    tflp->nfsfl_dev,
5146					    NFSLAYOUT_NFSV4_1_FILES,
5147					    notifybitsp, &dip, cred, p);
5148					if (error != 0)
5149						break;
5150					error = nfscl_adddevinfo(nmp, dip,
5151					    tflp);
5152					if (error != 0)
5153						printf(
5154						    "getlayout: cannot add\n");
5155				}
5156			}
5157		if (error == 0) {
5158			/*
5159			 * nfscl_layout() always returns with the nfsly_lock
5160			 * set to a refcnt (shared lock).
5161			 */
5162			error = nfscl_layout(nmp, vp, nfhp->nfh_fh,
5163			    nfhp->nfh_len, &stateid, retonclose, &flh, &lyp,
5164			    cred, p);
5165			if (error == 0)
5166				*lypp = lyp;
5167		} else if (islocked != 0)
5168			nfsv4_unlock(&lyp->nfsly_lock, 0);
5169	} else
5170		*lypp = lyp;
5171	return (error);
5172}
5173
5174/*
5175 * Do a TCP connection plus exchange id and create session.
5176 * If successful, a "struct nfsclds" is linked into the list for the
5177 * mount point and a pointer to it is returned.
5178 */
5179static int
5180nfsrpc_fillsa(struct nfsmount *nmp, struct sockaddr_storage *ssp,
5181    struct nfsclds **dspp, NFSPROC_T *p)
5182{
5183	struct sockaddr_in *msad, *sad, *ssd;
5184	struct sockaddr_in6 *msad6, *sad6, *ssd6;
5185	struct nfsclclient *clp;
5186	struct nfssockreq *nrp;
5187	struct nfsclds *dsp, *tdsp;
5188	int error;
5189	enum nfsclds_state retv;
5190	uint32_t sequenceid;
5191
5192	KASSERT(nmp->nm_sockreq.nr_cred != NULL,
5193	    ("nfsrpc_fillsa: NULL nr_cred"));
5194	NFSLOCKCLSTATE();
5195	clp = nmp->nm_clp;
5196	NFSUNLOCKCLSTATE();
5197	if (clp == NULL)
5198		return (EPERM);
5199	if (ssp->ss_family == AF_INET) {
5200		ssd = (struct sockaddr_in *)ssp;
5201		NFSLOCKMNT(nmp);
5202
5203		/*
5204		 * Check to see if we already have a session for this
5205		 * address that is usable for a DS.
5206		 * Note that the MDS's address is in a different place
5207		 * than the sessions already acquired for DS's.
5208		 */
5209		msad = (struct sockaddr_in *)nmp->nm_sockreq.nr_nam;
5210		tdsp = TAILQ_FIRST(&nmp->nm_sess);
5211		while (tdsp != NULL) {
5212			if (msad != NULL && msad->sin_family == AF_INET &&
5213			    ssd->sin_addr.s_addr == msad->sin_addr.s_addr &&
5214			    ssd->sin_port == msad->sin_port &&
5215			    (tdsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5216				*dspp = tdsp;
5217				NFSUNLOCKMNT(nmp);
5218				NFSCL_DEBUG(4, "fnd same addr\n");
5219				return (0);
5220			}
5221			tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5222			if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5223				msad = (struct sockaddr_in *)
5224				    tdsp->nfsclds_sockp->nr_nam;
5225			else
5226				msad = NULL;
5227		}
5228		NFSUNLOCKMNT(nmp);
5229
5230		/* No IP address match, so look for new/trunked one. */
5231		sad = malloc(sizeof(*sad), M_SONAME, M_WAITOK | M_ZERO);
5232		sad->sin_len = sizeof(*sad);
5233		sad->sin_family = AF_INET;
5234		sad->sin_port = ssd->sin_port;
5235		sad->sin_addr.s_addr = ssd->sin_addr.s_addr;
5236		nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5237		nrp->nr_nam = (struct sockaddr *)sad;
5238	} else if (ssp->ss_family == AF_INET6) {
5239		ssd6 = (struct sockaddr_in6 *)ssp;
5240		NFSLOCKMNT(nmp);
5241
5242		/*
5243		 * Check to see if we already have a session for this
5244		 * address that is usable for a DS.
5245		 * Note that the MDS's address is in a different place
5246		 * than the sessions already acquired for DS's.
5247		 */
5248		msad6 = (struct sockaddr_in6 *)nmp->nm_sockreq.nr_nam;
5249		tdsp = TAILQ_FIRST(&nmp->nm_sess);
5250		while (tdsp != NULL) {
5251			if (msad6 != NULL && msad6->sin6_family == AF_INET6 &&
5252			    IN6_ARE_ADDR_EQUAL(&ssd6->sin6_addr,
5253			    &msad6->sin6_addr) &&
5254			    ssd6->sin6_port == msad6->sin6_port &&
5255			    (tdsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5256				*dspp = tdsp;
5257				NFSUNLOCKMNT(nmp);
5258				return (0);
5259			}
5260			tdsp = TAILQ_NEXT(tdsp, nfsclds_list);
5261			if (tdsp != NULL && tdsp->nfsclds_sockp != NULL)
5262				msad6 = (struct sockaddr_in6 *)
5263				    tdsp->nfsclds_sockp->nr_nam;
5264			else
5265				msad6 = NULL;
5266		}
5267		NFSUNLOCKMNT(nmp);
5268
5269		/* No IP address match, so look for new/trunked one. */
5270		sad6 = malloc(sizeof(*sad6), M_SONAME, M_WAITOK | M_ZERO);
5271		sad6->sin6_len = sizeof(*sad6);
5272		sad6->sin6_family = AF_INET6;
5273		sad6->sin6_port = ssd6->sin6_port;
5274		NFSBCOPY(&ssd6->sin6_addr, &sad6->sin6_addr,
5275		    sizeof(struct in6_addr));
5276		nrp = malloc(sizeof(*nrp), M_NFSSOCKREQ, M_WAITOK | M_ZERO);
5277		nrp->nr_nam = (struct sockaddr *)sad6;
5278	} else
5279		return (EPERM);
5280
5281	nrp->nr_sotype = SOCK_STREAM;
5282	mtx_init(&nrp->nr_mtx, "nfssock", NULL, MTX_DEF);
5283	nrp->nr_prog = NFS_PROG;
5284	nrp->nr_vers = NFS_VER4;
5285
5286	/*
5287	 * Use the credentials that were used for the mount, which are
5288	 * in nmp->nm_sockreq.nr_cred for newnfs_connect() etc.
5289	 * Ref. counting the credentials with crhold() is probably not
5290	 * necessary, since nm_sockreq.nr_cred won't be crfree()'d until
5291	 * unmount, but I did it anyhow.
5292	 */
5293	nrp->nr_cred = crhold(nmp->nm_sockreq.nr_cred);
5294	error = newnfs_connect(nmp, nrp, NULL, p, 0);
5295	NFSCL_DEBUG(3, "DS connect=%d\n", error);
5296
5297	/* Now, do the exchangeid and create session. */
5298	if (error == 0)
5299		error = nfsrpc_exchangeid(nmp, clp, nrp, NFSV4EXCH_USEPNFSDS,
5300		    &dsp, nrp->nr_cred, p);
5301	NFSCL_DEBUG(3, "DS exchangeid=%d\n", error);
5302	if (error == 0) {
5303		dsp->nfsclds_sockp = nrp;
5304		NFSLOCKMNT(nmp);
5305		retv = nfscl_getsameserver(nmp, dsp, &tdsp);
5306		NFSCL_DEBUG(3, "getsame ret=%d\n", retv);
5307		if (retv == NFSDSP_USETHISSESSION) {
5308			NFSUNLOCKMNT(nmp);
5309			/*
5310			 * If there is already a session for this server,
5311			 * use it.
5312			 */
5313			(void)newnfs_disconnect(nrp);
5314			nfscl_freenfsclds(dsp);
5315			*dspp = tdsp;
5316			return (0);
5317		}
5318		if (retv == NFSDSP_SEQTHISSESSION)
5319			sequenceid = tdsp->nfsclds_sess.nfsess_sequenceid;
5320		else
5321			sequenceid = dsp->nfsclds_sess.nfsess_sequenceid;
5322		NFSUNLOCKMNT(nmp);
5323		error = nfsrpc_createsession(nmp, &dsp->nfsclds_sess,
5324		    nrp, sequenceid, 0, nrp->nr_cred, p);
5325		NFSCL_DEBUG(3, "DS createsess=%d\n", error);
5326	} else {
5327		NFSFREECRED(nrp->nr_cred);
5328		NFSFREEMUTEX(&nrp->nr_mtx);
5329		free(nrp->nr_nam, M_SONAME);
5330		free(nrp, M_NFSSOCKREQ);
5331	}
5332	if (error == 0) {
5333		NFSCL_DEBUG(3, "add DS session\n");
5334		/*
5335		 * Put it at the end of the list. That way the list
5336		 * is ordered by when the entry was added. This matters
5337		 * since the one done first is the one that should be
5338		 * used for sequencid'ing any subsequent create sessions.
5339		 */
5340		NFSLOCKMNT(nmp);
5341		TAILQ_INSERT_TAIL(&nmp->nm_sess, dsp, nfsclds_list);
5342		NFSUNLOCKMNT(nmp);
5343		*dspp = dsp;
5344	} else if (dsp != NULL)
5345		nfscl_freenfsclds(dsp);
5346	return (error);
5347}
5348
5349/*
5350 * Do the NFSv4.1 Reclaim Complete.
5351 */
5352int
5353nfsrpc_reclaimcomplete(struct nfsmount *nmp, struct ucred *cred, NFSPROC_T *p)
5354{
5355	uint32_t *tl;
5356	struct nfsrv_descript nfsd;
5357	struct nfsrv_descript *nd = &nfsd;
5358	int error;
5359
5360	nfscl_reqstart(nd, NFSPROC_RECLAIMCOMPL, nmp, NULL, 0, NULL, NULL);
5361	NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED);
5362	*tl = newnfs_false;
5363	nd->nd_flag |= ND_USEGSSNAME;
5364	error = newnfs_request(nd, nmp, NULL, &nmp->nm_sockreq, NULL, p, cred,
5365	    NFS_PROG, NFS_VER4, NULL, 1, NULL, NULL);
5366	if (error != 0)
5367		return (error);
5368	error = nd->nd_repstat;
5369	mbuf_freem(nd->nd_mrep);
5370	return (error);
5371}
5372
5373/*
5374 * Initialize the slot tables for a session.
5375 */
5376static void
5377nfscl_initsessionslots(struct nfsclsession *sep)
5378{
5379	int i;
5380
5381	for (i = 0; i < NFSV4_CBSLOTS; i++) {
5382		if (sep->nfsess_cbslots[i].nfssl_reply != NULL)
5383			m_freem(sep->nfsess_cbslots[i].nfssl_reply);
5384		NFSBZERO(&sep->nfsess_cbslots[i], sizeof(struct nfsslot));
5385	}
5386	for (i = 0; i < 64; i++)
5387		sep->nfsess_slotseq[i] = 0;
5388	sep->nfsess_slots = 0;
5389}
5390
5391/*
5392 * Called to try and do an I/O operation via an NFSv4.1 Data Server (DS).
5393 */
5394int
5395nfscl_doiods(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5396    uint32_t rwaccess, struct ucred *cred, NFSPROC_T *p)
5397{
5398	struct nfsnode *np = VTONFS(vp);
5399	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5400	struct nfscllayout *layp;
5401	struct nfscldevinfo *dip;
5402	struct nfsclflayout *rflp;
5403	nfsv4stateid_t stateid;
5404	struct ucred *newcred;
5405	uint64_t lastbyte, len, off, oresid, xfer;
5406	int eof, error, iolaymode, recalled;
5407	void *lckp;
5408
5409	if (!NFSHASPNFS(nmp) || nfscl_enablecallb == 0 || nfs_numnfscbd == 0 ||
5410	    (np->n_flag & NNOLAYOUT) != 0)
5411		return (EIO);
5412	/* Now, get a reference cnt on the clientid for this mount. */
5413	if (nfscl_getref(nmp) == 0)
5414		return (EIO);
5415
5416	/* Find an appropriate stateid. */
5417	newcred = NFSNEWCRED(cred);
5418	error = nfscl_getstateid(vp, np->n_fhp->nfh_fh, np->n_fhp->nfh_len,
5419	    rwaccess, 1, newcred, p, &stateid, &lckp);
5420	if (error != 0) {
5421		NFSFREECRED(newcred);
5422		nfscl_relref(nmp);
5423		return (error);
5424	}
5425	/* Search for a layout for this file. */
5426	off = uiop->uio_offset;
5427	layp = nfscl_getlayout(nmp->nm_clp, np->n_fhp->nfh_fh,
5428	    np->n_fhp->nfh_len, off, &rflp, &recalled);
5429	if (layp == NULL || rflp == NULL) {
5430		if (recalled != 0) {
5431			NFSFREECRED(newcred);
5432			nfscl_relref(nmp);
5433			return (EIO);
5434		}
5435		if (layp != NULL) {
5436			nfscl_rellayout(layp, (rflp == NULL) ? 1 : 0);
5437			layp = NULL;
5438		}
5439		/* Try and get a Layout, if it is supported. */
5440		if (rwaccess == NFSV4OPEN_ACCESSWRITE ||
5441		    (np->n_flag & NWRITEOPENED) != 0)
5442			iolaymode = NFSLAYOUTIOMODE_RW;
5443		else
5444			iolaymode = NFSLAYOUTIOMODE_READ;
5445		error = nfsrpc_getlayout(nmp, vp, np->n_fhp, iolaymode,
5446		    NULL, &stateid, off, &layp, newcred, p);
5447		if (error != 0) {
5448			NFSLOCKNODE(np);
5449			np->n_flag |= NNOLAYOUT;
5450			NFSUNLOCKNODE(np);
5451			if (lckp != NULL)
5452				nfscl_lockderef(lckp);
5453			NFSFREECRED(newcred);
5454			if (layp != NULL)
5455				nfscl_rellayout(layp, 0);
5456			nfscl_relref(nmp);
5457			return (error);
5458		}
5459	}
5460
5461	/*
5462	 * Loop around finding a layout that works for the first part of
5463	 * this I/O operation, and then call the function that actually
5464	 * does the RPC.
5465	 */
5466	eof = 0;
5467	len = (uint64_t)uiop->uio_resid;
5468	while (len > 0 && error == 0 && eof == 0) {
5469		off = uiop->uio_offset;
5470		error = nfscl_findlayoutforio(layp, off, rwaccess, &rflp);
5471		if (error == 0) {
5472			oresid = xfer = (uint64_t)uiop->uio_resid;
5473			if (xfer > (rflp->nfsfl_end - rflp->nfsfl_off))
5474				xfer = rflp->nfsfl_end - rflp->nfsfl_off;
5475			dip = nfscl_getdevinfo(nmp->nm_clp, rflp->nfsfl_dev,
5476			    rflp->nfsfl_devp);
5477			if (dip != NULL) {
5478				error = nfscl_doflayoutio(vp, uiop, iomode,
5479				    must_commit, &eof, &stateid, rwaccess, dip,
5480				    layp, rflp, off, xfer, newcred, p);
5481				nfscl_reldevinfo(dip);
5482				lastbyte = off + xfer - 1;
5483				if (error == 0) {
5484					NFSLOCKCLSTATE();
5485					if (lastbyte > layp->nfsly_lastbyte)
5486						layp->nfsly_lastbyte = lastbyte;
5487					NFSUNLOCKCLSTATE();
5488				}
5489			} else
5490				error = EIO;
5491			if (error == 0)
5492				len -= (oresid - (uint64_t)uiop->uio_resid);
5493		}
5494	}
5495	if (lckp != NULL)
5496		nfscl_lockderef(lckp);
5497	NFSFREECRED(newcred);
5498	nfscl_rellayout(layp, 0);
5499	nfscl_relref(nmp);
5500	return (error);
5501}
5502
5503/*
5504 * Find a file layout that will handle the first bytes of the requested
5505 * range and return the information from it needed to to the I/O operation.
5506 */
5507int
5508nfscl_findlayoutforio(struct nfscllayout *lyp, uint64_t off, uint32_t rwaccess,
5509    struct nfsclflayout **retflpp)
5510{
5511	struct nfsclflayout *flp, *nflp, *rflp;
5512	uint32_t rw;
5513
5514	rflp = NULL;
5515	rw = rwaccess;
5516	/* For reading, do the Read list first and then the Write list. */
5517	do {
5518		if (rw == NFSV4OPEN_ACCESSREAD)
5519			flp = LIST_FIRST(&lyp->nfsly_flayread);
5520		else
5521			flp = LIST_FIRST(&lyp->nfsly_flayrw);
5522		while (flp != NULL) {
5523			nflp = LIST_NEXT(flp, nfsfl_list);
5524			if (flp->nfsfl_off > off)
5525				break;
5526			if (flp->nfsfl_end > off &&
5527			    (rflp == NULL || rflp->nfsfl_end < flp->nfsfl_end))
5528				rflp = flp;
5529			flp = nflp;
5530		}
5531		if (rw == NFSV4OPEN_ACCESSREAD)
5532			rw = NFSV4OPEN_ACCESSWRITE;
5533		else
5534			rw = 0;
5535	} while (rw != 0);
5536	if (rflp != NULL) {
5537		/* This one covers the most bytes starting at off. */
5538		*retflpp = rflp;
5539		return (0);
5540	}
5541	return (EIO);
5542}
5543
5544/*
5545 * Do I/O using an NFSv4.1 file layout.
5546 */
5547static int
5548nfscl_doflayoutio(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5549    int *eofp, nfsv4stateid_t *stateidp, int rwflag, struct nfscldevinfo *dp,
5550    struct nfscllayout *lyp, struct nfsclflayout *flp, uint64_t off,
5551    uint64_t len, struct ucred *cred, NFSPROC_T *p)
5552{
5553	uint64_t io_off, rel_off, stripe_unit_size, transfer, xfer;
5554	int commit_thru_mds, error = 0, stripe_index, stripe_pos;
5555	struct nfsnode *np;
5556	struct nfsfh *fhp;
5557	struct nfsclds **dspp;
5558
5559	np = VTONFS(vp);
5560	rel_off = off - flp->nfsfl_patoff;
5561	stripe_unit_size = (flp->nfsfl_util >> 6) & 0x3ffffff;
5562	stripe_pos = (rel_off / stripe_unit_size + flp->nfsfl_stripe1) %
5563	    dp->nfsdi_stripecnt;
5564	transfer = stripe_unit_size - (rel_off % stripe_unit_size);
5565
5566	/* Loop around, doing I/O for each stripe unit. */
5567	while (len > 0 && error == 0) {
5568		stripe_index = nfsfldi_stripeindex(dp, stripe_pos);
5569		dspp = nfsfldi_addr(dp, stripe_index);
5570		if (len > transfer)
5571			xfer = transfer;
5572		else
5573			xfer = len;
5574		if ((flp->nfsfl_util & NFSFLAYUTIL_DENSE) != 0) {
5575			/* Dense layout. */
5576			if (stripe_pos >= flp->nfsfl_fhcnt)
5577				return (EIO);
5578			fhp = flp->nfsfl_fh[stripe_pos];
5579			io_off = (rel_off / (stripe_unit_size *
5580			    dp->nfsdi_stripecnt)) * stripe_unit_size +
5581			    rel_off % stripe_unit_size;
5582		} else {
5583			/* Sparse layout. */
5584			if (flp->nfsfl_fhcnt > 1) {
5585				if (stripe_index >= flp->nfsfl_fhcnt)
5586					return (EIO);
5587				fhp = flp->nfsfl_fh[stripe_index];
5588			} else if (flp->nfsfl_fhcnt == 1)
5589				fhp = flp->nfsfl_fh[0];
5590			else
5591				fhp = np->n_fhp;
5592			io_off = off;
5593		}
5594		if ((flp->nfsfl_util & NFSFLAYUTIL_COMMIT_THRU_MDS) != 0)
5595			commit_thru_mds = 1;
5596		else
5597			commit_thru_mds = 0;
5598		if (rwflag == FREAD)
5599			error = nfsrpc_readds(vp, uiop, stateidp, eofp, *dspp,
5600			    io_off, xfer, fhp, cred, p);
5601		else {
5602			error = nfsrpc_writeds(vp, uiop, iomode, must_commit,
5603			    stateidp, *dspp, io_off, xfer, fhp, commit_thru_mds,
5604			    cred, p);
5605			if (error == 0) {
5606				NFSLOCKCLSTATE();
5607				lyp->nfsly_flags |= NFSLY_WRITTEN;
5608				NFSUNLOCKCLSTATE();
5609			}
5610		}
5611		if (error == 0) {
5612			transfer = stripe_unit_size;
5613			stripe_pos = (stripe_pos + 1) % dp->nfsdi_stripecnt;
5614			len -= xfer;
5615			off += xfer;
5616		}
5617	}
5618	return (error);
5619}
5620
5621/*
5622 * The actual read RPC done to a DS.
5623 */
5624static int
5625nfsrpc_readds(vnode_t vp, struct uio *uiop, nfsv4stateid_t *stateidp, int *eofp,
5626    struct nfsclds *dsp, uint64_t io_off, int len, struct nfsfh *fhp,
5627    struct ucred *cred, NFSPROC_T *p)
5628{
5629	uint32_t *tl;
5630	int error, retlen;
5631	struct nfsrv_descript nfsd;
5632	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5633	struct nfsrv_descript *nd = &nfsd;
5634	struct nfssockreq *nrp;
5635
5636	nd->nd_mrep = NULL;
5637	nfscl_reqstart(nd, NFSPROC_READDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5638	    NULL, &dsp->nfsclds_sess);
5639	nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
5640	NFSM_BUILD(tl, uint32_t *, NFSX_UNSIGNED * 3);
5641	txdr_hyper(io_off, tl);
5642	*(tl + 2) = txdr_unsigned(len);
5643	nrp = dsp->nfsclds_sockp;
5644	if (nrp == NULL)
5645		/* If NULL, use the MDS socket. */
5646		nrp = &nmp->nm_sockreq;
5647	error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5648	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5649	if (error != 0)
5650		return (error);
5651	if (nd->nd_repstat != 0) {
5652		error = nd->nd_repstat;
5653		goto nfsmout;
5654	}
5655	NFSM_DISSECT(tl, uint32_t *, NFSX_UNSIGNED);
5656	*eofp = fxdr_unsigned(int, *tl);
5657	NFSM_STRSIZ(retlen, len);
5658	error = nfsm_mbufuio(nd, uiop, retlen);
5659nfsmout:
5660	if (nd->nd_mrep != NULL)
5661		mbuf_freem(nd->nd_mrep);
5662	return (error);
5663}
5664
5665/*
5666 * The actual write RPC done to a DS.
5667 */
5668static int
5669nfsrpc_writeds(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
5670    nfsv4stateid_t *stateidp, struct nfsclds *dsp, uint64_t io_off, int len,
5671    struct nfsfh *fhp, int commit_thru_mds, struct ucred *cred, NFSPROC_T *p)
5672{
5673	uint32_t *tl;
5674	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5675	int error, rlen, commit, committed = NFSWRITE_FILESYNC;
5676	int32_t backup;
5677	struct nfsrv_descript nfsd;
5678	struct nfsrv_descript *nd = &nfsd;
5679	struct nfssockreq *nrp;
5680
5681	KASSERT(uiop->uio_iovcnt == 1, ("nfs: writerpc iovcnt > 1"));
5682	nd->nd_mrep = NULL;
5683	nfscl_reqstart(nd, NFSPROC_WRITEDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5684	    NULL, &dsp->nfsclds_sess);
5685	nfsm_stateidtom(nd, stateidp, NFSSTATEID_PUTSEQIDZERO);
5686	NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + 2 * NFSX_UNSIGNED);
5687	txdr_hyper(io_off, tl);
5688	tl += 2;
5689	*tl++ = txdr_unsigned(*iomode);
5690	*tl = txdr_unsigned(len);
5691	nfsm_uiombuf(nd, uiop, len);
5692	nrp = dsp->nfsclds_sockp;
5693	if (nrp == NULL)
5694		/* If NULL, use the MDS socket. */
5695		nrp = &nmp->nm_sockreq;
5696	error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5697	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5698	if (error != 0)
5699		return (error);
5700	if (nd->nd_repstat != 0) {
5701		/*
5702		 * In case the rpc gets retried, roll
5703		 * the uio fileds changed by nfsm_uiombuf()
5704		 * back.
5705		 */
5706		uiop->uio_offset -= len;
5707		uio_uio_resid_add(uiop, len);
5708		uio_iov_base_add(uiop, -len);
5709		uio_iov_len_add(uiop, len);
5710		error = nd->nd_repstat;
5711	} else {
5712		NFSM_DISSECT(tl, uint32_t *, 2 * NFSX_UNSIGNED + NFSX_VERF);
5713		rlen = fxdr_unsigned(int, *tl++);
5714		if (rlen == 0) {
5715			error = NFSERR_IO;
5716			goto nfsmout;
5717		} else if (rlen < len) {
5718			backup = len - rlen;
5719			uio_iov_base_add(uiop, -(backup));
5720			uio_iov_len_add(uiop, backup);
5721			uiop->uio_offset -= backup;
5722			uio_uio_resid_add(uiop, backup);
5723			len = rlen;
5724		}
5725		commit = fxdr_unsigned(int, *tl++);
5726
5727		/*
5728		 * Return the lowest committment level
5729		 * obtained by any of the RPCs.
5730		 */
5731		if (committed == NFSWRITE_FILESYNC)
5732			committed = commit;
5733		else if (committed == NFSWRITE_DATASYNC &&
5734		    commit == NFSWRITE_UNSTABLE)
5735			committed = commit;
5736		if (commit_thru_mds != 0) {
5737			NFSLOCKMNT(nmp);
5738			if (!NFSHASWRITEVERF(nmp)) {
5739				NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5740				NFSSETWRITEVERF(nmp);
5741	    		} else if (NFSBCMP(tl, nmp->nm_verf, NFSX_VERF)) {
5742				*must_commit = 1;
5743				NFSBCOPY(tl, nmp->nm_verf, NFSX_VERF);
5744			}
5745			NFSUNLOCKMNT(nmp);
5746		} else {
5747			NFSLOCKDS(dsp);
5748			if ((dsp->nfsclds_flags & NFSCLDS_HASWRITEVERF) == 0) {
5749				NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5750				dsp->nfsclds_flags |= NFSCLDS_HASWRITEVERF;
5751			} else if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
5752				*must_commit = 1;
5753				NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5754			}
5755			NFSUNLOCKDS(dsp);
5756		}
5757	}
5758nfsmout:
5759	if (nd->nd_mrep != NULL)
5760		mbuf_freem(nd->nd_mrep);
5761	*iomode = committed;
5762	if (nd->nd_repstat != 0 && error == 0)
5763		error = nd->nd_repstat;
5764	return (error);
5765}
5766
5767/*
5768 * Free up the nfsclds structure.
5769 */
5770void
5771nfscl_freenfsclds(struct nfsclds *dsp)
5772{
5773	int i;
5774
5775	if (dsp == NULL)
5776		return;
5777	if (dsp->nfsclds_sockp != NULL) {
5778		NFSFREECRED(dsp->nfsclds_sockp->nr_cred);
5779		NFSFREEMUTEX(&dsp->nfsclds_sockp->nr_mtx);
5780		free(dsp->nfsclds_sockp->nr_nam, M_SONAME);
5781		free(dsp->nfsclds_sockp, M_NFSSOCKREQ);
5782	}
5783	NFSFREEMUTEX(&dsp->nfsclds_mtx);
5784	NFSFREEMUTEX(&dsp->nfsclds_sess.nfsess_mtx);
5785	for (i = 0; i < NFSV4_CBSLOTS; i++) {
5786		if (dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply != NULL)
5787			m_freem(
5788			    dsp->nfsclds_sess.nfsess_cbslots[i].nfssl_reply);
5789	}
5790	free(dsp, M_NFSCLDS);
5791}
5792
5793static enum nfsclds_state
5794nfscl_getsameserver(struct nfsmount *nmp, struct nfsclds *newdsp,
5795    struct nfsclds **retdspp)
5796{
5797	struct nfsclds *dsp, *cur_dsp;
5798
5799	/*
5800	 * Search the list of nfsclds structures for one with the same
5801	 * server.
5802	 */
5803	cur_dsp = NULL;
5804	TAILQ_FOREACH(dsp, &nmp->nm_sess, nfsclds_list) {
5805		if (dsp->nfsclds_servownlen == newdsp->nfsclds_servownlen &&
5806		    dsp->nfsclds_servownlen != 0 &&
5807		    !NFSBCMP(dsp->nfsclds_serverown, newdsp->nfsclds_serverown,
5808		    dsp->nfsclds_servownlen)) {
5809			NFSCL_DEBUG(4, "fnd same fdsp=%p dsp=%p flg=0x%x\n",
5810			    TAILQ_FIRST(&nmp->nm_sess), dsp,
5811			    dsp->nfsclds_flags);
5812			/* Server major id matches. */
5813			if ((dsp->nfsclds_flags & NFSCLDS_DS) != 0) {
5814				*retdspp = dsp;
5815				return (NFSDSP_USETHISSESSION);
5816			}
5817
5818			/*
5819			 * Note the first match, so it can be used for
5820			 * sequence'ing new sessions.
5821			 */
5822			if (cur_dsp == NULL)
5823				cur_dsp = dsp;
5824		}
5825	}
5826	if (cur_dsp != NULL) {
5827		*retdspp = cur_dsp;
5828		return (NFSDSP_SEQTHISSESSION);
5829	}
5830	return (NFSDSP_NOTFOUND);
5831}
5832
5833#ifdef notyet
5834/*
5835 * NFS commit rpc to a DS.
5836 */
5837static int
5838nfsrpc_commitds(vnode_t vp, uint64_t offset, int cnt, struct nfsclds *dsp,
5839    struct nfsfh *fhp, struct ucred *cred, NFSPROC_T *p, void *stuff)
5840{
5841	uint32_t *tl;
5842	struct nfsrv_descript nfsd, *nd = &nfsd;
5843	struct nfsmount *nmp = VFSTONFS(vnode_mount(vp));
5844	struct nfssockreq *nrp;
5845	int error;
5846
5847	nfscl_reqstart(nd, NFSPROC_COMMITDS, nmp, fhp->nfh_fh, fhp->nfh_len,
5848	    NULL, &dsp->nfsclds_sess);
5849	NFSM_BUILD(tl, uint32_t *, NFSX_HYPER + NFSX_UNSIGNED);
5850	txdr_hyper(offset, tl);
5851	tl += 2;
5852	*tl = txdr_unsigned(cnt);
5853	nrp = dsp->nfsclds_sockp;
5854	if (nrp == NULL)
5855		/* If NULL, use the MDS socket. */
5856		nrp = &nmp->nm_sockreq;
5857	error = newnfs_request(nd, nmp, NULL, nrp, vp, p, cred,
5858	    NFS_PROG, NFS_VER4, NULL, 1, NULL, &dsp->nfsclds_sess);
5859	if (error)
5860		return (error);
5861	if (nd->nd_repstat == 0) {
5862		NFSM_DISSECT(tl, u_int32_t *, NFSX_VERF);
5863		NFSLOCKDS(dsp);
5864		if (NFSBCMP(tl, dsp->nfsclds_verf, NFSX_VERF)) {
5865			NFSBCOPY(tl, dsp->nfsclds_verf, NFSX_VERF);
5866			error = NFSERR_STALEWRITEVERF;
5867		}
5868		NFSUNLOCKDS(dsp);
5869	}
5870nfsmout:
5871	if (error == 0 && nd->nd_repstat != 0)
5872		error = nd->nd_repstat;
5873	mbuf_freem(nd->nd_mrep);
5874	return (error);
5875}
5876#endif
5877
5878