1/*
2 * Copyright (c) 2000-2011 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28/* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29/*
30 * Copyright (c) 1989, 1993
31 *	The Regents of the University of California.  All rights reserved.
32 *
33 * This code is derived from software contributed to Berkeley by
34 * Rick Macklem at The University of Guelph.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 *    notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 *    notice, this list of conditions and the following disclaimer in the
43 *    documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 *    must display the following acknowledgement:
46 *	This product includes software developed by the University of
47 *	California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 *    may be used to endorse or promote products derived from this software
50 *    without specific prior written permission.
51 *
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
63 *
64 *	@(#)nfs_subs.c	8.8 (Berkeley) 5/22/95
65 * FreeBSD-Id: nfs_subs.c,v 1.47 1997/11/07 08:53:24 phk Exp $
66 */
67
68/*
69 * These functions support the macros and help fiddle mbuf chains for
70 * the nfs op functions. They do things like create the rpc header and
71 * copy data between mbuf chains and uio lists.
72 */
73#include <sys/param.h>
74#include <sys/proc.h>
75#include <sys/kauth.h>
76#include <sys/systm.h>
77#include <sys/kernel.h>
78#include <sys/mount_internal.h>
79#include <sys/vnode_internal.h>
80#include <sys/kpi_mbuf.h>
81#include <sys/socket.h>
82#include <sys/stat.h>
83#include <sys/malloc.h>
84#include <sys/syscall.h>
85#include <sys/ubc_internal.h>
86#include <sys/fcntl.h>
87#include <sys/uio.h>
88#include <sys/domain.h>
89#include <libkern/OSAtomic.h>
90#include <kern/thread_call.h>
91
92#include <sys/vm.h>
93#include <sys/vmparam.h>
94
95#include <sys/time.h>
96#include <kern/clock.h>
97
98#include <nfs/rpcv2.h>
99#include <nfs/nfsproto.h>
100#include <nfs/nfs.h>
101#include <nfs/nfsnode.h>
102#if NFSCLIENT
103#define _NFS_XDR_SUBS_FUNCS_ /* define this to get xdrbuf function definitions */
104#endif
105#include <nfs/xdr_subs.h>
106#include <nfs/nfsm_subs.h>
107#include <nfs/nfs_gss.h>
108#include <nfs/nfsmount.h>
109#include <nfs/nfs_lock.h>
110
111#include <miscfs/specfs/specdev.h>
112
113#include <netinet/in.h>
114#include <net/kpi_interface.h>
115
116#include <sys/utfconv.h>
117
118/*
119 * NFS globals
120 */
121struct nfsstats	__attribute__((aligned(8))) nfsstats;
122size_t nfs_mbuf_mhlen = 0, nfs_mbuf_minclsize = 0;
123
124/*
125 * functions to convert between NFS and VFS types
126 */
127nfstype
128vtonfs_type(enum vtype vtype, int nfsvers)
129{
130	switch (vtype) {
131	case VNON:
132		return NFNON;
133	case VREG:
134		return NFREG;
135	case VDIR:
136		return NFDIR;
137	case VBLK:
138		return NFBLK;
139	case VCHR:
140		return NFCHR;
141	case VLNK:
142		return NFLNK;
143	case VSOCK:
144		if (nfsvers > NFS_VER2)
145			return NFSOCK;
146	case VFIFO:
147		if (nfsvers > NFS_VER2)
148			return NFFIFO;
149	case VBAD:
150	case VSTR:
151	case VCPLX:
152	default:
153		return NFNON;
154	}
155}
156
157enum vtype
158nfstov_type(nfstype nvtype, int nfsvers)
159{
160	switch (nvtype) {
161	case NFNON:
162		return VNON;
163	case NFREG:
164		return VREG;
165	case NFDIR:
166		return VDIR;
167	case NFBLK:
168		return VBLK;
169	case NFCHR:
170		return VCHR;
171	case NFLNK:
172		return VLNK;
173	case NFSOCK:
174		if (nfsvers > NFS_VER2)
175			return VSOCK;
176	case NFFIFO:
177		if (nfsvers > NFS_VER2)
178			return VFIFO;
179	case NFATTRDIR:
180		if (nfsvers > NFS_VER3)
181			return VDIR;
182	case NFNAMEDATTR:
183		if (nfsvers > NFS_VER3)
184			return VREG;
185	default:
186		return VNON;
187	}
188}
189
190int
191vtonfsv2_mode(enum vtype vtype, mode_t m)
192{
193	switch (vtype) {
194	case VNON:
195	case VREG:
196	case VDIR:
197	case VBLK:
198	case VCHR:
199	case VLNK:
200	case VSOCK:
201		return vnode_makeimode(vtype, m);
202	case VFIFO:
203		return vnode_makeimode(VCHR, m);
204	case VBAD:
205	case VSTR:
206	case VCPLX:
207	default:
208		return vnode_makeimode(VNON, m);
209	}
210}
211
212#if NFSSERVER
213
214/*
215 * Mapping of old NFS Version 2 RPC numbers to generic numbers.
216 */
217int nfsv3_procid[NFS_NPROCS] = {
218	NFSPROC_NULL,
219	NFSPROC_GETATTR,
220	NFSPROC_SETATTR,
221	NFSPROC_NOOP,
222	NFSPROC_LOOKUP,
223	NFSPROC_READLINK,
224	NFSPROC_READ,
225	NFSPROC_NOOP,
226	NFSPROC_WRITE,
227	NFSPROC_CREATE,
228	NFSPROC_REMOVE,
229	NFSPROC_RENAME,
230	NFSPROC_LINK,
231	NFSPROC_SYMLINK,
232	NFSPROC_MKDIR,
233	NFSPROC_RMDIR,
234	NFSPROC_READDIR,
235	NFSPROC_FSSTAT,
236	NFSPROC_NOOP,
237	NFSPROC_NOOP,
238	NFSPROC_NOOP,
239	NFSPROC_NOOP,
240	NFSPROC_NOOP
241};
242
243#endif /* NFSSERVER */
244
245/*
246 * and the reverse mapping from generic to Version 2 procedure numbers
247 */
248int nfsv2_procid[NFS_NPROCS] = {
249	NFSV2PROC_NULL,
250	NFSV2PROC_GETATTR,
251	NFSV2PROC_SETATTR,
252	NFSV2PROC_LOOKUP,
253	NFSV2PROC_NOOP,
254	NFSV2PROC_READLINK,
255	NFSV2PROC_READ,
256	NFSV2PROC_WRITE,
257	NFSV2PROC_CREATE,
258	NFSV2PROC_MKDIR,
259	NFSV2PROC_SYMLINK,
260	NFSV2PROC_CREATE,
261	NFSV2PROC_REMOVE,
262	NFSV2PROC_RMDIR,
263	NFSV2PROC_RENAME,
264	NFSV2PROC_LINK,
265	NFSV2PROC_READDIR,
266	NFSV2PROC_NOOP,
267	NFSV2PROC_STATFS,
268	NFSV2PROC_NOOP,
269	NFSV2PROC_NOOP,
270	NFSV2PROC_NOOP,
271	NFSV2PROC_NOOP
272};
273
274
275/*
276 * initialize NFS's cache of mbuf constants
277 */
278void
279nfs_mbuf_init(void)
280{
281	struct mbuf_stat ms;
282
283	mbuf_stats(&ms);
284	nfs_mbuf_mhlen = ms.mhlen;
285	nfs_mbuf_minclsize = ms.minclsize;
286}
287
288#if NFSSERVER
289
290/*
291 * allocate a list of mbufs to hold the given amount of data
292 */
293int
294nfsm_mbuf_get_list(size_t size, mbuf_t *mp, int *mbcnt)
295{
296	int error, cnt;
297	mbuf_t mhead, mlast, m;
298	size_t len, mlen;
299
300	error = cnt = 0;
301	mhead = mlast = NULL;
302	len = 0;
303
304	while (len < size) {
305		nfsm_mbuf_get(error, &m, (size - len));
306		if (error)
307			break;
308		if (!mhead)
309			mhead = m;
310		if (mlast && ((error = mbuf_setnext(mlast, m)))) {
311			mbuf_free(m);
312			break;
313		}
314		mlen = mbuf_maxlen(m);
315		if ((len + mlen) > size)
316			mlen = size - len;
317		mbuf_setlen(m, mlen);
318		len += mlen;
319		cnt++;
320		mlast = m;
321	}
322
323	if (!error) {
324		*mp = mhead;
325		*mbcnt = cnt;
326	}
327	return (error);
328}
329
330#endif /* NFSSERVER */
331
332/*
333 * nfsm_chain_new_mbuf()
334 *
335 * Add a new mbuf to the given chain.
336 */
337int
338nfsm_chain_new_mbuf(struct nfsm_chain *nmc, size_t sizehint)
339{
340	mbuf_t mb;
341	int error = 0;
342
343	if (nmc->nmc_flags & NFSM_CHAIN_FLAG_ADD_CLUSTERS)
344		sizehint = nfs_mbuf_minclsize;
345
346	/* allocate a new mbuf */
347	nfsm_mbuf_get(error, &mb, sizehint);
348	if (error)
349		return (error);
350	if (mb == NULL)
351		panic("got NULL mbuf?");
352
353	/* do we have a current mbuf? */
354	if (nmc->nmc_mcur) {
355		/* first cap off current mbuf */
356		mbuf_setlen(nmc->nmc_mcur, nmc->nmc_ptr - (caddr_t)mbuf_data(nmc->nmc_mcur));
357		/* then append the new mbuf */
358		error = mbuf_setnext(nmc->nmc_mcur, mb);
359		if (error) {
360			mbuf_free(mb);
361			return (error);
362		}
363	}
364
365	/* set up for using the new mbuf */
366	nmc->nmc_mcur = mb;
367	nmc->nmc_ptr = mbuf_data(mb);
368	nmc->nmc_left = mbuf_trailingspace(mb);
369
370	return (0);
371}
372
373/*
374 * nfsm_chain_add_opaque_f()
375 *
376 * Add "len" bytes of opaque data pointed to by "buf" to the given chain.
377 */
378int
379nfsm_chain_add_opaque_f(struct nfsm_chain *nmc, const u_char *buf, uint32_t len)
380{
381	uint32_t paddedlen, tlen;
382	int error;
383
384	paddedlen = nfsm_rndup(len);
385
386	while (paddedlen) {
387		if (!nmc->nmc_left) {
388			error = nfsm_chain_new_mbuf(nmc, paddedlen);
389			if (error)
390				return (error);
391		}
392		tlen = MIN(nmc->nmc_left, paddedlen);
393		if (tlen) {
394			if (len) {
395				if (tlen > len)
396					tlen = len;
397				bcopy(buf, nmc->nmc_ptr, tlen);
398			} else {
399				bzero(nmc->nmc_ptr, tlen);
400			}
401			nmc->nmc_ptr += tlen;
402			nmc->nmc_left -= tlen;
403			paddedlen -= tlen;
404			if (len) {
405				buf += tlen;
406				len -= tlen;
407			}
408		}
409	}
410	return (0);
411}
412
413/*
414 * nfsm_chain_add_opaque_nopad_f()
415 *
416 * Add "len" bytes of opaque data pointed to by "buf" to the given chain.
417 * Do not XDR pad.
418 */
419int
420nfsm_chain_add_opaque_nopad_f(struct nfsm_chain *nmc, const u_char *buf, uint32_t len)
421{
422	uint32_t tlen;
423	int error;
424
425	while (len > 0) {
426		if (nmc->nmc_left <= 0) {
427			error = nfsm_chain_new_mbuf(nmc, len);
428			if (error)
429				return (error);
430		}
431		tlen = MIN(nmc->nmc_left, len);
432		bcopy(buf, nmc->nmc_ptr, tlen);
433		nmc->nmc_ptr += tlen;
434		nmc->nmc_left -= tlen;
435		len -= tlen;
436		buf += tlen;
437	}
438	return (0);
439}
440
441/*
442 * nfsm_chain_add_uio()
443 *
444 * Add "len" bytes of data from "uio" to the given chain.
445 */
446int
447nfsm_chain_add_uio(struct nfsm_chain *nmc, uio_t uio, uint32_t len)
448{
449	uint32_t paddedlen, tlen;
450	int error;
451
452	paddedlen = nfsm_rndup(len);
453
454	while (paddedlen) {
455		if (!nmc->nmc_left) {
456			error = nfsm_chain_new_mbuf(nmc, paddedlen);
457			if (error)
458				return (error);
459		}
460		tlen = MIN(nmc->nmc_left, paddedlen);
461		if (tlen) {
462			if (len) {
463				if (tlen > len)
464					tlen = len;
465				uiomove(nmc->nmc_ptr, tlen, uio);
466			} else {
467				bzero(nmc->nmc_ptr, tlen);
468			}
469			nmc->nmc_ptr += tlen;
470			nmc->nmc_left -= tlen;
471			paddedlen -= tlen;
472			if (len)
473				len -= tlen;
474		}
475	}
476	return (0);
477}
478
479/*
480 * Find the length of the NFS mbuf chain
481 * up to the current encoding/decoding offset.
482 */
483int
484nfsm_chain_offset(struct nfsm_chain *nmc)
485{
486	mbuf_t mb;
487	int len = 0;
488
489	for (mb = nmc->nmc_mhead; mb; mb = mbuf_next(mb)) {
490		if (mb == nmc->nmc_mcur)
491			return (len + (nmc->nmc_ptr - (caddr_t) mbuf_data(mb)));
492		len += mbuf_len(mb);
493	}
494
495	return (len);
496}
497
498/*
499 * nfsm_chain_advance()
500 *
501 * Advance an nfsm_chain by "len" bytes.
502 */
503int
504nfsm_chain_advance(struct nfsm_chain *nmc, uint32_t len)
505{
506	mbuf_t mb;
507
508	while (len) {
509		if (nmc->nmc_left >= len) {
510			nmc->nmc_left -= len;
511			nmc->nmc_ptr += len;
512			return (0);
513		}
514		len -= nmc->nmc_left;
515		nmc->nmc_mcur = mb = mbuf_next(nmc->nmc_mcur);
516		if (!mb)
517			return (EBADRPC);
518		nmc->nmc_ptr = mbuf_data(mb);
519		nmc->nmc_left = mbuf_len(mb);
520	}
521
522	return (0);
523}
524
525/*
526 * nfsm_chain_reverse()
527 *
528 * Reverse decode offset in an nfsm_chain by "len" bytes.
529 */
530int
531nfsm_chain_reverse(struct nfsm_chain *nmc, uint32_t len)
532{
533	uint32_t mlen, new_offset;
534	int error = 0;
535
536	mlen = nmc->nmc_ptr - (caddr_t) mbuf_data(nmc->nmc_mcur);
537	if (len <= mlen) {
538		nmc->nmc_ptr -= len;
539		nmc->nmc_left += len;
540		return (0);
541	}
542
543	new_offset = nfsm_chain_offset(nmc) - len;
544	nfsm_chain_dissect_init(error, nmc, nmc->nmc_mhead);
545	if (error)
546		return (error);
547
548	return (nfsm_chain_advance(nmc, new_offset));
549}
550
551/*
552 * nfsm_chain_get_opaque_pointer_f()
553 *
554 * Return a pointer to the next "len" bytes of contiguous data in
555 * the mbuf chain.  If the next "len" bytes are not contiguous, we
556 * try to manipulate the mbuf chain so that it is.
557 *
558 * The nfsm_chain is advanced by nfsm_rndup("len") bytes.
559 */
560int
561nfsm_chain_get_opaque_pointer_f(struct nfsm_chain *nmc, uint32_t len, u_char **pptr)
562{
563	mbuf_t mbcur, mb;
564	uint32_t left, need, mblen, cplen, padlen;
565	u_char *ptr;
566	int error = 0;
567
568	/* move to next mbuf with data */
569	while (nmc->nmc_mcur && (nmc->nmc_left == 0)) {
570		mb = mbuf_next(nmc->nmc_mcur);
571		nmc->nmc_mcur = mb;
572		if (!mb)
573			break;
574		nmc->nmc_ptr = mbuf_data(mb);
575		nmc->nmc_left = mbuf_len(mb);
576	}
577	/* check if we've run out of data */
578	if (!nmc->nmc_mcur)
579		return (EBADRPC);
580
581	/* do we already have a contiguous buffer? */
582	if (nmc->nmc_left >= len) {
583		/* the returned pointer will be the current pointer */
584		*pptr = (u_char*)nmc->nmc_ptr;
585		error = nfsm_chain_advance(nmc, nfsm_rndup(len));
586		return (error);
587	}
588
589	padlen = nfsm_rndup(len) - len;
590
591	/* we need (len - left) more bytes */
592	mbcur = nmc->nmc_mcur;
593	left = nmc->nmc_left;
594	need = len - left;
595
596	if (need > mbuf_trailingspace(mbcur)) {
597		/*
598		 * The needed bytes won't fit in the current mbuf so we'll
599		 * allocate a new mbuf to hold the contiguous range of data.
600		 */
601		nfsm_mbuf_get(error, &mb, len);
602		if (error)
603			return (error);
604		/* double check that this mbuf can hold all the data */
605		if (mbuf_maxlen(mb) < len) {
606			mbuf_free(mb);
607			return (EOVERFLOW);
608		}
609
610		/* the returned pointer will be the new mbuf's data pointer */
611		*pptr = ptr = mbuf_data(mb);
612
613		/* copy "left" bytes to the new mbuf */
614		bcopy(nmc->nmc_ptr, ptr, left);
615		ptr += left;
616		mbuf_setlen(mb, left);
617
618		/* insert the new mbuf between the current and next mbufs */
619		error = mbuf_setnext(mb, mbuf_next(mbcur));
620		if (!error)
621			error = mbuf_setnext(mbcur, mb);
622		if (error) {
623			mbuf_free(mb);
624			return (error);
625		}
626
627		/* reduce current mbuf's length by "left" */
628		mbuf_setlen(mbcur, mbuf_len(mbcur) - left);
629
630		/*
631		 * update nmc's state to point at the end of the mbuf
632		 * where the needed data will be copied to.
633		 */
634		nmc->nmc_mcur = mbcur = mb;
635		nmc->nmc_left = 0;
636		nmc->nmc_ptr = (caddr_t)ptr;
637	} else {
638		/* The rest of the data will fit in this mbuf. */
639
640		/* the returned pointer will be the current pointer */
641		*pptr = (u_char*)nmc->nmc_ptr;
642
643		/*
644		 * update nmc's state to point at the end of the mbuf
645		 * where the needed data will be copied to.
646		 */
647		nmc->nmc_ptr += left;
648		nmc->nmc_left = 0;
649	}
650
651	/*
652	 * move the next "need" bytes into the current
653	 * mbuf from the mbufs that follow
654	 */
655
656	/* extend current mbuf length */
657	mbuf_setlen(mbcur, mbuf_len(mbcur) + need);
658
659	/* mb follows mbufs we're copying/compacting data from */
660	mb = mbuf_next(mbcur);
661
662	while (need && mb) {
663		/* copy as much as we need/can */
664		ptr = mbuf_data(mb);
665		mblen = mbuf_len(mb);
666		cplen = MIN(mblen, need);
667		if (cplen) {
668			bcopy(ptr, nmc->nmc_ptr, cplen);
669			/*
670			 * update the mbuf's pointer and length to reflect that
671			 * the data was shifted to an earlier mbuf in the chain
672			 */
673			error = mbuf_setdata(mb, ptr + cplen, mblen - cplen);
674			if (error) {
675				mbuf_setlen(mbcur, mbuf_len(mbcur) - need);
676				return (error);
677			}
678			/* update pointer/need */
679			nmc->nmc_ptr += cplen;
680			need -= cplen;
681		}
682		/* if more needed, go to next mbuf */
683		if (need)
684			mb = mbuf_next(mb);
685	}
686
687	/* did we run out of data in the mbuf chain? */
688	if (need) {
689		mbuf_setlen(mbcur, mbuf_len(mbcur) - need);
690		return (EBADRPC);
691	}
692
693	/*
694	 * update nmc's state to point after this contiguous data
695	 *
696	 * "mb" points to the last mbuf we copied data from so we
697	 * just set nmc to point at whatever remains in that mbuf.
698	 */
699	nmc->nmc_mcur = mb;
700	nmc->nmc_ptr = mbuf_data(mb);
701	nmc->nmc_left = mbuf_len(mb);
702
703	/* move past any padding */
704	if (padlen)
705		error = nfsm_chain_advance(nmc, padlen);
706
707	return (error);
708}
709
710/*
711 * nfsm_chain_get_opaque_f()
712 *
713 * Read the next "len" bytes in the chain into "buf".
714 * The nfsm_chain is advanced by nfsm_rndup("len") bytes.
715 */
716int
717nfsm_chain_get_opaque_f(struct nfsm_chain *nmc, uint32_t len, u_char *buf)
718{
719	uint32_t cplen, padlen;
720	int error = 0;
721
722	padlen = nfsm_rndup(len) - len;
723
724	/* loop through mbufs copying all the data we need */
725	while (len && nmc->nmc_mcur) {
726		/* copy as much as we need/can */
727		cplen = MIN(nmc->nmc_left, len);
728		if (cplen) {
729			bcopy(nmc->nmc_ptr, buf, cplen);
730			nmc->nmc_ptr += cplen;
731			nmc->nmc_left -= cplen;
732			buf += cplen;
733			len -= cplen;
734		}
735		/* if more needed, go to next mbuf */
736		if (len) {
737			mbuf_t mb = mbuf_next(nmc->nmc_mcur);
738			nmc->nmc_mcur = mb;
739			nmc->nmc_ptr = mb ? mbuf_data(mb) : NULL;
740			nmc->nmc_left = mb ? mbuf_len(mb) : 0;
741		}
742	}
743
744	/* did we run out of data in the mbuf chain? */
745	if (len)
746		return (EBADRPC);
747
748	if (padlen)
749		nfsm_chain_adv(error, nmc, padlen);
750
751	return (error);
752}
753
754/*
755 * nfsm_chain_get_uio()
756 *
757 * Read the next "len" bytes in the chain into the given uio.
758 * The nfsm_chain is advanced by nfsm_rndup("len") bytes.
759 */
760int
761nfsm_chain_get_uio(struct nfsm_chain *nmc, uint32_t len, uio_t uio)
762{
763	uint32_t cplen, padlen;
764	int error = 0;
765
766	padlen = nfsm_rndup(len) - len;
767
768	/* loop through mbufs copying all the data we need */
769	while (len && nmc->nmc_mcur) {
770		/* copy as much as we need/can */
771		cplen = MIN(nmc->nmc_left, len);
772		if (cplen) {
773			error = uiomove(nmc->nmc_ptr, cplen, uio);
774			if (error)
775				return (error);
776			nmc->nmc_ptr += cplen;
777			nmc->nmc_left -= cplen;
778			len -= cplen;
779		}
780		/* if more needed, go to next mbuf */
781		if (len) {
782			mbuf_t mb = mbuf_next(nmc->nmc_mcur);
783			nmc->nmc_mcur = mb;
784			nmc->nmc_ptr = mb ? mbuf_data(mb) : NULL;
785			nmc->nmc_left = mb ? mbuf_len(mb) : 0;
786		}
787	}
788
789	/* did we run out of data in the mbuf chain? */
790	if (len)
791		return (EBADRPC);
792
793	if (padlen)
794		nfsm_chain_adv(error, nmc, padlen);
795
796	return (error);
797}
798
799#if NFSCLIENT
800
801int
802nfsm_chain_add_string_nfc(struct nfsm_chain *nmc, const uint8_t *s, uint32_t slen)
803{
804	uint8_t smallbuf[64];
805	uint8_t *nfcname = smallbuf;
806	size_t buflen = sizeof(smallbuf), nfclen;
807	int error;
808
809	error = utf8_normalizestr(s, slen, nfcname, &nfclen, buflen, UTF_PRECOMPOSED|UTF_NO_NULL_TERM);
810	if (error == ENAMETOOLONG) {
811		buflen = MAXPATHLEN;
812		MALLOC_ZONE(nfcname, uint8_t *, MAXPATHLEN, M_NAMEI, M_WAITOK);
813		if (nfcname)
814			error = utf8_normalizestr(s, slen, nfcname, &nfclen, buflen, UTF_PRECOMPOSED|UTF_NO_NULL_TERM);
815	}
816
817	/* if we got an error, just use the original string */
818	if (error)
819		nfsm_chain_add_string(error, nmc, s, slen);
820	else
821		nfsm_chain_add_string(error, nmc, nfcname, nfclen);
822
823	if (nfcname && (nfcname != smallbuf))
824		FREE_ZONE(nfcname, MAXPATHLEN, M_NAMEI);
825	return (error);
826}
827
828/*
829 * Add an NFSv2 "sattr" structure to an mbuf chain
830 */
831int
832nfsm_chain_add_v2sattr_f(struct nfsm_chain *nmc, struct vnode_attr *vap, uint32_t szrdev)
833{
834	int error = 0;
835
836	nfsm_chain_add_32(error, nmc, vtonfsv2_mode(vap->va_type,
837		(VATTR_IS_ACTIVE(vap, va_mode) ? vap->va_mode : 0600)));
838	nfsm_chain_add_32(error, nmc,
839		VATTR_IS_ACTIVE(vap, va_uid) ? vap->va_uid : (uint32_t)-1);
840	nfsm_chain_add_32(error, nmc,
841		VATTR_IS_ACTIVE(vap, va_gid) ? vap->va_gid : (uint32_t)-1);
842	nfsm_chain_add_32(error, nmc, szrdev);
843	nfsm_chain_add_v2time(error, nmc,
844		VATTR_IS_ACTIVE(vap, va_access_time) ?
845		&vap->va_access_time : NULL);
846	nfsm_chain_add_v2time(error, nmc,
847		VATTR_IS_ACTIVE(vap, va_modify_time) ?
848		&vap->va_modify_time : NULL);
849
850	return (error);
851}
852
853/*
854 * Add an NFSv3 "sattr" structure to an mbuf chain
855 */
856int
857nfsm_chain_add_v3sattr_f(struct nfsm_chain *nmc, struct vnode_attr *vap)
858{
859	int error = 0;
860
861	if (VATTR_IS_ACTIVE(vap, va_mode)) {
862		nfsm_chain_add_32(error, nmc, TRUE);
863		nfsm_chain_add_32(error, nmc, vap->va_mode);
864	} else {
865		nfsm_chain_add_32(error, nmc, FALSE);
866	}
867	if (VATTR_IS_ACTIVE(vap, va_uid)) {
868		nfsm_chain_add_32(error, nmc, TRUE);
869		nfsm_chain_add_32(error, nmc, vap->va_uid);
870	} else {
871		nfsm_chain_add_32(error, nmc, FALSE);
872	}
873	if (VATTR_IS_ACTIVE(vap, va_gid)) {
874		nfsm_chain_add_32(error, nmc, TRUE);
875		nfsm_chain_add_32(error, nmc, vap->va_gid);
876	} else {
877		nfsm_chain_add_32(error, nmc, FALSE);
878	}
879	if (VATTR_IS_ACTIVE(vap, va_data_size)) {
880		nfsm_chain_add_32(error, nmc, TRUE);
881		nfsm_chain_add_64(error, nmc, vap->va_data_size);
882	} else {
883		nfsm_chain_add_32(error, nmc, FALSE);
884	}
885	if (vap->va_vaflags & VA_UTIMES_NULL) {
886		nfsm_chain_add_32(error, nmc, NFS_TIME_SET_TO_SERVER);
887		nfsm_chain_add_32(error, nmc, NFS_TIME_SET_TO_SERVER);
888	} else {
889		if (VATTR_IS_ACTIVE(vap, va_access_time)) {
890			nfsm_chain_add_32(error, nmc, NFS_TIME_SET_TO_CLIENT);
891			nfsm_chain_add_32(error, nmc, vap->va_access_time.tv_sec);
892			nfsm_chain_add_32(error, nmc, vap->va_access_time.tv_nsec);
893		} else {
894			nfsm_chain_add_32(error, nmc, NFS_TIME_DONT_CHANGE);
895		}
896		if (VATTR_IS_ACTIVE(vap, va_modify_time)) {
897			nfsm_chain_add_32(error, nmc, NFS_TIME_SET_TO_CLIENT);
898			nfsm_chain_add_32(error, nmc, vap->va_modify_time.tv_sec);
899			nfsm_chain_add_32(error, nmc, vap->va_modify_time.tv_nsec);
900		} else {
901			nfsm_chain_add_32(error, nmc, NFS_TIME_DONT_CHANGE);
902		}
903	}
904
905	return (error);
906}
907
908
909/*
910 * nfsm_chain_get_fh_attr()
911 *
912 * Get the file handle and attributes from an mbuf chain. (NFSv2/v3)
913 */
914int
915nfsm_chain_get_fh_attr(
916	struct nfsm_chain *nmc,
917	nfsnode_t dnp,
918	vfs_context_t ctx,
919	int nfsvers,
920	uint64_t *xidp,
921	fhandle_t *fhp,
922	struct nfs_vattr *nvap)
923{
924	int error = 0, gotfh, gotattr;
925
926	gotfh = gotattr = 1;
927
928	if (nfsvers == NFS_VER3) /* check for file handle */
929		nfsm_chain_get_32(error, nmc, gotfh);
930	if (!error && gotfh) /* get file handle */
931		nfsm_chain_get_fh(error, nmc, nfsvers, fhp);
932	else
933		fhp->fh_len = 0;
934	if (nfsvers == NFS_VER3) /* check for file attributes */
935		nfsm_chain_get_32(error, nmc, gotattr);
936	nfsmout_if(error);
937	if (gotattr) {
938		if (!gotfh) /* skip attributes */
939			nfsm_chain_adv(error, nmc, NFSX_V3FATTR);
940		else /* get attributes */
941			error = nfs_parsefattr(nmc, nfsvers, nvap);
942	} else if (gotfh) {
943		/* we need valid attributes in order to call nfs_nget() */
944		if (nfs3_getattr_rpc(NULL, NFSTOMP(dnp), fhp->fh_data, fhp->fh_len, 0, ctx, nvap, xidp)) {
945			gotattr = 0;
946			fhp->fh_len = 0;
947		}
948	}
949nfsmout:
950	return (error);
951}
952
953/*
954 * Get and process NFSv3 WCC data from an mbuf chain
955 */
956int
957nfsm_chain_get_wcc_data_f(
958	struct nfsm_chain *nmc,
959	nfsnode_t np,
960	struct timespec *premtime,
961	int *newpostattr,
962	u_int64_t *xidp)
963{
964	int error = 0;
965	uint32_t flag = 0;
966
967	nfsm_chain_get_32(error, nmc, flag);
968	if (!error && flag) {
969		nfsm_chain_adv(error, nmc, 2 * NFSX_UNSIGNED);
970		nfsm_chain_get_32(error, nmc, premtime->tv_sec);
971		nfsm_chain_get_32(error, nmc, premtime->tv_nsec);
972		nfsm_chain_adv(error, nmc, 2 * NFSX_UNSIGNED);
973	} else {
974		premtime->tv_sec = 0;
975		premtime->tv_nsec = 0;
976	}
977	nfsm_chain_postop_attr_update_flag(error, nmc, np, *newpostattr, xidp);
978
979	return (error);
980}
981
982/*
983 * Get the next RPC transaction ID (XID)
984 */
985void
986nfs_get_xid(uint64_t *xidp)
987{
988	struct timeval tv;
989
990	lck_mtx_lock(nfs_request_mutex);
991	if (!nfs_xid) {
992		/*
993		 * Derive initial xid from system time.
994		 *
995		 * Note: it's OK if this code inits nfs_xid to 0 (for example,
996		 * due to a broken clock) because we immediately increment it
997		 * and we guarantee to never use xid 0.  So, nfs_xid should only
998		 * ever be 0 the first time this function is called.
999		 */
1000		microtime(&tv);
1001		nfs_xid = tv.tv_sec << 12;
1002	}
1003	if (++nfs_xid == 0) {
1004		/* Skip zero xid if it should ever happen. */
1005		nfs_xidwrap++;
1006		nfs_xid++;
1007	}
1008	*xidp = nfs_xid + ((uint64_t)nfs_xidwrap << 32);
1009	lck_mtx_unlock(nfs_request_mutex);
1010}
1011
1012/*
1013 * Build the RPC header and fill in the authorization info.
1014 * Returns the head of the mbuf list and the xid.
1015 */
1016
1017int
1018nfsm_rpchead(
1019	struct nfsreq *req,
1020	mbuf_t mrest,
1021	u_int64_t *xidp,
1022	mbuf_t *mreqp)
1023{
1024	struct nfsmount *nmp = req->r_nmp;
1025	int nfsvers = nmp->nm_vers;
1026	int proc = ((nfsvers == NFS_VER2) ? nfsv2_procid[req->r_procnum] : (int)req->r_procnum);
1027
1028	return nfsm_rpchead2(nmp, nmp->nm_sotype, NFS_PROG, nfsvers, proc,
1029			req->r_auth, req->r_cred, req, mrest, xidp, mreqp);
1030}
1031
1032int
1033nfsm_rpchead2(struct nfsmount *nmp, int sotype, int prog, int vers, int proc, int auth_type,
1034	kauth_cred_t cred, struct nfsreq *req, mbuf_t mrest, u_int64_t *xidp, mbuf_t *mreqp)
1035{
1036	mbuf_t mreq, mb;
1037	int error, i, grpsiz, auth_len = 0, authsiz, reqlen;
1038	size_t headlen;
1039	struct nfsm_chain nmreq;
1040
1041	/* calculate expected auth length */
1042	switch (auth_type) {
1043		case RPCAUTH_NONE:
1044			auth_len = 0;
1045			break;
1046		case RPCAUTH_SYS:
1047		    {
1048			gid_t grouplist[NGROUPS];
1049			int groupcount = NGROUPS;
1050
1051			if (!cred)
1052				return (EINVAL);
1053
1054			(void)kauth_cred_getgroups(cred, grouplist, &groupcount);
1055			if (groupcount < 1)
1056				return (EINVAL);
1057
1058			auth_len = (((((uint32_t)groupcount - 1) > nmp->nm_numgrps) ?
1059				nmp->nm_numgrps : (groupcount - 1)) << 2) +
1060				5 * NFSX_UNSIGNED;
1061			break;
1062		    }
1063		case RPCAUTH_KRB5:
1064		case RPCAUTH_KRB5I:
1065		case RPCAUTH_KRB5P:
1066			if (!req || !cred)
1067				return (EINVAL);
1068			auth_len = 5 * NFSX_UNSIGNED + 0; // zero context handle for now
1069			break;
1070		default:
1071			return (EINVAL);
1072		}
1073	authsiz = nfsm_rndup(auth_len);
1074
1075	/* allocate the packet */
1076	headlen = authsiz + 10 * NFSX_UNSIGNED;
1077	if (sotype == SOCK_STREAM) /* also include room for any RPC Record Mark */
1078		headlen += NFSX_UNSIGNED;
1079	if (headlen >= nfs_mbuf_minclsize) {
1080		error = mbuf_getpacket(MBUF_WAITOK, &mreq);
1081	} else {
1082		error = mbuf_gethdr(MBUF_WAITOK, MBUF_TYPE_DATA, &mreq);
1083		if (!error) {
1084			if (headlen < nfs_mbuf_mhlen)
1085				mbuf_align_32(mreq, headlen);
1086			else
1087				mbuf_align_32(mreq, 8 * NFSX_UNSIGNED);
1088		}
1089	}
1090	if (error) {
1091		/* unable to allocate packet */
1092		/* XXX should we keep statistics for these errors? */
1093		return (error);
1094	}
1095
1096	/*
1097	 * If the caller gave us a non-zero XID then use it because
1098	 * it may be a higher-level resend with a GSSAPI credential.
1099	 * Otherwise, allocate a new one.
1100	 */
1101	if (*xidp == 0)
1102		nfs_get_xid(xidp);
1103
1104	/* build the header(s) */
1105	nfsm_chain_init(&nmreq, mreq);
1106
1107	/* First, if it's a TCP stream insert space for an RPC record mark */
1108	if (sotype == SOCK_STREAM)
1109		nfsm_chain_add_32(error, &nmreq, 0);
1110
1111	/* Then the RPC header. */
1112	nfsm_chain_add_32(error, &nmreq, (*xidp & 0xffffffff));
1113	nfsm_chain_add_32(error, &nmreq, RPC_CALL);
1114	nfsm_chain_add_32(error, &nmreq, RPC_VER2);
1115	nfsm_chain_add_32(error, &nmreq, prog);
1116	nfsm_chain_add_32(error, &nmreq, vers);
1117	nfsm_chain_add_32(error, &nmreq, proc);
1118
1119add_cred:
1120	switch (auth_type) {
1121	case RPCAUTH_NONE:
1122		nfsm_chain_add_32(error, &nmreq, RPCAUTH_NONE); /* auth */
1123		nfsm_chain_add_32(error, &nmreq, 0);		/* length */
1124		nfsm_chain_add_32(error, &nmreq, RPCAUTH_NONE);	/* verf */
1125		nfsm_chain_add_32(error, &nmreq, 0);		/* length */
1126		nfsm_chain_build_done(error, &nmreq);
1127		/* Append the args mbufs */
1128		if (!error)
1129			error = mbuf_setnext(nmreq.nmc_mcur, mrest);
1130		break;
1131	case RPCAUTH_SYS: {
1132		gid_t grouplist[NGROUPS];
1133		int groupcount;
1134
1135		nfsm_chain_add_32(error, &nmreq, RPCAUTH_SYS);
1136		nfsm_chain_add_32(error, &nmreq, authsiz);
1137		nfsm_chain_add_32(error, &nmreq, 0);	/* stamp */
1138		nfsm_chain_add_32(error, &nmreq, 0);	/* zero-length hostname */
1139		nfsm_chain_add_32(error, &nmreq, kauth_cred_getuid(cred));	/* UID */
1140		nfsm_chain_add_32(error, &nmreq, kauth_cred_getgid(cred));	/* GID */
1141		grpsiz = (auth_len >> 2) - 5;
1142		nfsm_chain_add_32(error, &nmreq, grpsiz);/* additional GIDs */
1143		memset(grouplist, 0, sizeof(grouplist));
1144		groupcount = grpsiz;
1145		(void)kauth_cred_getgroups(cred, grouplist, &groupcount);
1146		for (i = 1; i <= grpsiz; i++)
1147			nfsm_chain_add_32(error, &nmreq, grouplist[i]);
1148
1149		/* And the verifier... */
1150		nfsm_chain_add_32(error, &nmreq, RPCAUTH_NONE);	/* flavor */
1151		nfsm_chain_add_32(error, &nmreq, 0);		/* length */
1152		nfsm_chain_build_done(error, &nmreq);
1153
1154		/* Append the args mbufs */
1155		if (!error)
1156			error = mbuf_setnext(nmreq.nmc_mcur, mrest);
1157		break;
1158	}
1159	case RPCAUTH_KRB5:
1160	case RPCAUTH_KRB5I:
1161	case RPCAUTH_KRB5P:
1162		error = nfs_gss_clnt_cred_put(req, &nmreq, mrest);
1163		if (error == ENEEDAUTH) {
1164			gid_t grouplist[NGROUPS];
1165			int groupcount = NGROUPS;
1166			/*
1167			 * Use sec=sys for this user
1168			 */
1169			error = 0;
1170			req->r_auth = auth_type = RPCAUTH_SYS;
1171			(void)kauth_cred_getgroups(cred, grouplist, &groupcount);
1172			auth_len = (((((uint32_t)groupcount - 1) > nmp->nm_numgrps) ?
1173				nmp->nm_numgrps : (groupcount - 1)) << 2) +
1174				5 * NFSX_UNSIGNED;
1175			authsiz = nfsm_rndup(auth_len);
1176			goto add_cred;
1177		}
1178		break;
1179	};
1180
1181	/* finish setting up the packet */
1182	if (!error)
1183		error = mbuf_pkthdr_setrcvif(mreq, 0);
1184
1185	if (error) {
1186		mbuf_freem(mreq);
1187		return (error);
1188	}
1189
1190	/* Calculate the size of the request */
1191	reqlen = 0;
1192	for (mb = nmreq.nmc_mhead; mb; mb = mbuf_next(mb))
1193		reqlen += mbuf_len(mb);
1194
1195	mbuf_pkthdr_setlen(mreq, reqlen);
1196
1197	/*
1198	 * If the request goes on a TCP stream,
1199	 * set its size in the RPC record mark.
1200	 * The record mark count doesn't include itself
1201	 * and the last fragment bit is set.
1202	 */
1203	if (sotype == SOCK_STREAM)
1204		nfsm_chain_set_recmark(error, &nmreq,
1205			(reqlen - NFSX_UNSIGNED) | 0x80000000);
1206
1207	*mreqp = mreq;
1208	return (0);
1209}
1210
1211/*
1212 * Parse an NFS file attribute structure out of an mbuf chain.
1213 */
1214int
1215nfs_parsefattr(struct nfsm_chain *nmc, int nfsvers, struct nfs_vattr *nvap)
1216{
1217	int error = 0;
1218	enum vtype vtype;
1219	nfstype nvtype;
1220	u_short vmode;
1221	uint32_t val, val2;
1222	dev_t rdev;
1223
1224	val = val2 = 0;
1225	NVATTR_INIT(nvap);
1226
1227	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_TYPE);
1228	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_MODE);
1229	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_NUMLINKS);
1230	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_OWNER);
1231	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_OWNER_GROUP);
1232	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_SIZE);
1233	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_SPACE_USED);
1234	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_RAWDEV);
1235	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_FSID);
1236	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_FILEID);
1237	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_TIME_ACCESS);
1238	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_TIME_MODIFY);
1239	NFS_BITMAP_SET(nvap->nva_bitmap, NFS_FATTR_TIME_METADATA);
1240
1241	nfsm_chain_get_32(error, nmc, nvtype);
1242	nfsm_chain_get_32(error, nmc, vmode);
1243	nfsmout_if(error);
1244
1245	if (nfsvers == NFS_VER3) {
1246		nvap->nva_type = vtype = nfstov_type(nvtype, nfsvers);
1247	} else {
1248		/*
1249		 * The duplicate information returned in fa_type and fa_mode
1250		 * is an ambiguity in the NFS version 2 protocol.
1251		 *
1252		 * VREG should be taken literally as a regular file.  If a
1253		 * server intends to return some type information differently
1254		 * in the upper bits of the mode field (e.g. for sockets, or
1255		 * FIFOs), NFSv2 mandates fa_type to be VNON.  Anyway, we
1256		 * leave the examination of the mode bits even in the VREG
1257		 * case to avoid breakage for bogus servers, but we make sure
1258		 * that there are actually type bits set in the upper part of
1259		 * fa_mode (and failing that, trust the va_type field).
1260		 *
1261		 * NFSv3 cleared the issue, and requires fa_mode to not
1262		 * contain any type information (while also introducing
1263		 * sockets and FIFOs for fa_type).
1264		 */
1265		vtype = nfstov_type(nvtype, nfsvers);
1266		if ((vtype == VNON) || ((vtype == VREG) && ((vmode & S_IFMT) != 0)))
1267			vtype = IFTOVT(vmode);
1268		nvap->nva_type = vtype;
1269	}
1270
1271	nvap->nva_mode = (vmode & 07777);
1272
1273	nfsm_chain_get_32(error, nmc, nvap->nva_nlink);
1274	nfsm_chain_get_32(error, nmc, nvap->nva_uid);
1275	nfsm_chain_get_32(error, nmc, nvap->nva_gid);
1276
1277	if (nfsvers == NFS_VER3) {
1278		nfsm_chain_get_64(error, nmc, nvap->nva_size);
1279		nfsm_chain_get_64(error, nmc, nvap->nva_bytes);
1280		nfsm_chain_get_32(error, nmc, nvap->nva_rawdev.specdata1);
1281		nfsm_chain_get_32(error, nmc, nvap->nva_rawdev.specdata2);
1282		nfsmout_if(error);
1283		nfsm_chain_get_64(error, nmc, nvap->nva_fsid.major);
1284		nvap->nva_fsid.minor = 0;
1285		nfsm_chain_get_64(error, nmc, nvap->nva_fileid);
1286	} else {
1287		nfsm_chain_get_32(error, nmc, nvap->nva_size);
1288		nfsm_chain_adv(error, nmc, NFSX_UNSIGNED);
1289		nfsm_chain_get_32(error, nmc, rdev);
1290		nfsmout_if(error);
1291		nvap->nva_rawdev.specdata1 = major(rdev);
1292		nvap->nva_rawdev.specdata2 = minor(rdev);
1293		nfsm_chain_get_32(error, nmc, val); /* blocks */
1294		nfsmout_if(error);
1295		nvap->nva_bytes = val * NFS_FABLKSIZE;
1296		nfsm_chain_get_32(error, nmc, val);
1297		nfsmout_if(error);
1298		nvap->nva_fsid.major = (uint64_t)val;
1299		nvap->nva_fsid.minor = 0;
1300		nfsm_chain_get_32(error, nmc, val);
1301		nfsmout_if(error);
1302		nvap->nva_fileid = (uint64_t)val;
1303		/* Really ugly NFSv2 kludge. */
1304		if ((vtype == VCHR) && (rdev == (dev_t)0xffffffff))
1305			nvap->nva_type = VFIFO;
1306	}
1307	nfsm_chain_get_time(error, nmc, nfsvers,
1308		nvap->nva_timesec[NFSTIME_ACCESS],
1309		nvap->nva_timensec[NFSTIME_ACCESS]);
1310	nfsm_chain_get_time(error, nmc, nfsvers,
1311		nvap->nva_timesec[NFSTIME_MODIFY],
1312		nvap->nva_timensec[NFSTIME_MODIFY]);
1313	nfsm_chain_get_time(error, nmc, nfsvers,
1314		nvap->nva_timesec[NFSTIME_CHANGE],
1315		nvap->nva_timensec[NFSTIME_CHANGE]);
1316nfsmout:
1317	return (error);
1318}
1319
1320/*
1321 * Load the attribute cache (that lives in the nfsnode entry) with
1322 * the value pointed to by nvap, unless the file type in the attribute
1323 * cache doesn't match the file type in the nvap, in which case log a
1324 * warning and return ESTALE.
1325 *
1326 * If the dontshrink flag is set, then it's not safe to call ubc_setsize()
1327 * to shrink the size of the file.
1328 */
1329int
1330nfs_loadattrcache(
1331	nfsnode_t np,
1332	struct nfs_vattr *nvap,
1333	u_int64_t *xidp,
1334	int dontshrink)
1335{
1336	mount_t mp;
1337	vnode_t vp;
1338	struct timeval now;
1339	struct nfs_vattr *npnvap;
1340	int xattr = np->n_vattr.nva_flags & NFS_FFLAG_IS_ATTR;
1341	int referral = np->n_vattr.nva_flags & NFS_FFLAG_TRIGGER_REFERRAL;
1342	int aclbit, monitored, error = 0;
1343	kauth_acl_t acl;
1344	struct nfsmount *nmp;
1345	uint32_t events = np->n_events;
1346
1347	if (np->n_hflag & NHINIT) {
1348		vp = NULL;
1349		mp = np->n_mount;
1350	} else {
1351		vp = NFSTOV(np);
1352		mp = vnode_mount(vp);
1353	}
1354	monitored = vp ? vnode_ismonitored(vp) : 0;
1355
1356	FSDBG_TOP(527, np, vp, *xidp >> 32, *xidp);
1357
1358	if (!((nmp = VFSTONFS(mp)))) {
1359		FSDBG_BOT(527, ENXIO, 1, 0, *xidp);
1360		return (ENXIO);
1361	}
1362
1363	if (*xidp < np->n_xid) {
1364		/*
1365		 * We have already updated attributes with a response from
1366		 * a later request.  The attributes we have here are probably
1367		 * stale so we drop them (just return).  However, our
1368		 * out-of-order receipt could be correct - if the requests were
1369		 * processed out of order at the server.  Given the uncertainty
1370		 * we invalidate our cached attributes.  *xidp is zeroed here
1371		 * to indicate the attributes were dropped - only getattr
1372		 * cares - it needs to retry the rpc.
1373		 */
1374		NATTRINVALIDATE(np);
1375		FSDBG_BOT(527, 0, np, np->n_xid, *xidp);
1376		*xidp = 0;
1377		return (0);
1378	}
1379
1380	if (vp && (nvap->nva_type != vnode_vtype(vp))) {
1381		/*
1382		 * The filehandle has changed type on us.  This can be
1383		 * caused by either the server not having unique filehandles
1384		 * or because another client has removed the previous
1385		 * filehandle and a new object (of a different type)
1386		 * has been created with the same filehandle.
1387		 *
1388		 * We can't simply switch the type on the vnode because
1389		 * there may be type-specific fields that need to be
1390		 * cleaned up or set up.
1391		 *
1392		 * So, what should we do with this vnode?
1393		 *
1394		 * About the best we can do is log a warning and return
1395		 * an error.  ESTALE is about the closest error, but it
1396		 * is a little strange that we come up with this error
1397		 * internally instead of simply passing it through from
1398		 * the server.  Hopefully, the vnode will be reclaimed
1399		 * soon so the filehandle can be reincarnated as the new
1400		 * object type.
1401		 */
1402		printf("nfs loadattrcache vnode changed type, was %d now %d\n",
1403			vnode_vtype(vp), nvap->nva_type);
1404		error = ESTALE;
1405		if (monitored)
1406			events |= VNODE_EVENT_DELETE;
1407		goto out;
1408	}
1409
1410	npnvap = &np->n_vattr;
1411
1412	/*
1413	 * The ACL cache needs special handling because it is not
1414	 * always updated.  Save current ACL cache state so it can
1415	 * be restored after copying the new attributes into place.
1416	 */
1417	aclbit = NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_ACL);
1418	acl = npnvap->nva_acl;
1419
1420	if (monitored) {
1421		/*
1422		 * For monitored nodes, check for attribute changes that should generate events.
1423		 */
1424		if (NFS_BITMAP_ISSET(nvap->nva_bitmap, NFS_FATTR_NUMLINKS) &&
1425		    (nvap->nva_nlink != npnvap->nva_nlink))
1426			events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_LINK;
1427		if (events & VNODE_EVENT_PERMS)
1428			/* no need to do all the checking if it's already set */;
1429		else if (NFS_BITMAP_ISSET(nvap->nva_bitmap, NFS_FATTR_MODE) &&
1430			 (nvap->nva_mode != npnvap->nva_mode))
1431			events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_PERMS;
1432		else if (NFS_BITMAP_ISSET(nvap->nva_bitmap, NFS_FATTR_OWNER) &&
1433			 (nvap->nva_uid != npnvap->nva_uid))
1434			events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_PERMS;
1435		else if (NFS_BITMAP_ISSET(nvap->nva_bitmap, NFS_FATTR_OWNER_GROUP) &&
1436			 (nvap->nva_gid != npnvap->nva_gid))
1437			events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_PERMS;
1438		else if (nmp->nm_vers >= NFS_VER4) {
1439			if (NFS_BITMAP_ISSET(nvap->nva_bitmap, NFS_FATTR_OWNER) &&
1440			    !kauth_guid_equal(&nvap->nva_uuuid, &npnvap->nva_uuuid))
1441				events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_PERMS;
1442			else if (NFS_BITMAP_ISSET(nvap->nva_bitmap, NFS_FATTR_OWNER_GROUP) &&
1443				 !kauth_guid_equal(&nvap->nva_guuid, &npnvap->nva_guuid))
1444				events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_PERMS;
1445			else if ((NFS_BITMAP_ISSET(nvap->nva_bitmap, NFS_FATTR_ACL) &&
1446				 nvap->nva_acl && npnvap->nva_acl &&
1447			         ((nvap->nva_acl->acl_entrycount != npnvap->nva_acl->acl_entrycount) ||
1448			          bcmp(nvap->nva_acl, npnvap->nva_acl, KAUTH_ACL_COPYSIZE(nvap->nva_acl)))))
1449				events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_PERMS;
1450		}
1451		if (((nmp->nm_vers >= NFS_VER4) && (nvap->nva_change != npnvap->nva_change)) ||
1452		   (NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_TIME_MODIFY) &&
1453		    ((nvap->nva_timesec[NFSTIME_MODIFY] != npnvap->nva_timesec[NFSTIME_MODIFY]) ||
1454		     (nvap->nva_timensec[NFSTIME_MODIFY] != npnvap->nva_timensec[NFSTIME_MODIFY]))))
1455			events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_WRITE;
1456		if (!events && NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_RAWDEV) &&
1457		    ((nvap->nva_rawdev.specdata1 != npnvap->nva_rawdev.specdata1) ||
1458		     (nvap->nva_rawdev.specdata2 != npnvap->nva_rawdev.specdata2)))
1459			events |= VNODE_EVENT_ATTRIB;
1460		if (!events && NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_FILEID) &&
1461		    (nvap->nva_fileid != npnvap->nva_fileid))
1462			events |= VNODE_EVENT_ATTRIB;
1463		if (!events && NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_ARCHIVE) &&
1464		    ((nvap->nva_flags & NFS_FFLAG_ARCHIVED) != (npnvap->nva_flags & NFS_FFLAG_ARCHIVED)))
1465			events |= VNODE_EVENT_ATTRIB;
1466		if (!events && NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_HIDDEN) &&
1467		    ((nvap->nva_flags & NFS_FFLAG_HIDDEN) != (npnvap->nva_flags & NFS_FFLAG_HIDDEN)))
1468			events |= VNODE_EVENT_ATTRIB;
1469		if (!events && NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_TIME_CREATE) &&
1470		    ((nvap->nva_timesec[NFSTIME_CREATE] != npnvap->nva_timesec[NFSTIME_CREATE]) ||
1471		     (nvap->nva_timensec[NFSTIME_CREATE] != npnvap->nva_timensec[NFSTIME_CREATE])))
1472			events |= VNODE_EVENT_ATTRIB;
1473		if (!events && NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_TIME_BACKUP) &&
1474		    ((nvap->nva_timesec[NFSTIME_BACKUP] != npnvap->nva_timesec[NFSTIME_BACKUP]) ||
1475		     (nvap->nva_timensec[NFSTIME_BACKUP] != npnvap->nva_timensec[NFSTIME_BACKUP])))
1476			events |= VNODE_EVENT_ATTRIB;
1477	}
1478
1479	/* Copy the attributes to the attribute cache */
1480	bcopy((caddr_t)nvap, (caddr_t)npnvap, sizeof(*nvap));
1481
1482	microuptime(&now);
1483	np->n_attrstamp = now.tv_sec;
1484	np->n_xid = *xidp;
1485	/* NFS_FFLAG_IS_ATTR and NFS_FFLAG_TRIGGER_REFERRAL need to be sticky... */
1486	if (vp && xattr)
1487		nvap->nva_flags |= xattr;
1488	if (vp && referral)
1489		nvap->nva_flags |= referral;
1490
1491	if (NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_ACL)) {
1492		/* we're updating the ACL */
1493		if (nvap->nva_acl) {
1494			/* make a copy of the acl for the cache */
1495			npnvap->nva_acl = kauth_acl_alloc(nvap->nva_acl->acl_entrycount);
1496			if (npnvap->nva_acl) {
1497				bcopy(nvap->nva_acl, npnvap->nva_acl, KAUTH_ACL_COPYSIZE(nvap->nva_acl));
1498			} else {
1499				/* can't make a copy to cache, invalidate ACL cache */
1500				NFS_BITMAP_CLR(npnvap->nva_bitmap, NFS_FATTR_ACL);
1501				NACLINVALIDATE(np);
1502				aclbit = 0;
1503			}
1504		}
1505		if (acl) {
1506			kauth_acl_free(acl);
1507			acl = NULL;
1508		}
1509	}
1510	if (NFS_BITMAP_ISSET(npnvap->nva_bitmap, NFS_FATTR_ACL)) {
1511		/* update the ACL timestamp */
1512		np->n_aclstamp = now.tv_sec;
1513	} else {
1514		/* we aren't updating the ACL, so restore original values */
1515		if (aclbit)
1516			NFS_BITMAP_SET(npnvap->nva_bitmap, NFS_FATTR_ACL);
1517		npnvap->nva_acl = acl;
1518	}
1519
1520#if CONFIG_TRIGGERS
1521	/*
1522	 * For NFSv4, if the fsid doesn't match the fsid for the mount, then
1523	 * this node is for a different file system on the server.  So we mark
1524	 * this node as a trigger node that will trigger the mirror mount.
1525	 */
1526	if ((nmp->nm_vers >= NFS_VER4) && (nvap->nva_type == VDIR) &&
1527	    ((np->n_vattr.nva_fsid.major != nmp->nm_fsid.major) ||
1528	     (np->n_vattr.nva_fsid.minor != nmp->nm_fsid.minor)))
1529		np->n_vattr.nva_flags |= NFS_FFLAG_TRIGGER;
1530#endif
1531
1532	if (!vp || (nvap->nva_type != VREG)) {
1533		np->n_size = nvap->nva_size;
1534	} else if (nvap->nva_size != np->n_size) {
1535		FSDBG(527, np, nvap->nva_size, np->n_size, (nvap->nva_type == VREG) | (np->n_flag & NMODIFIED ? 6 : 4));
1536		if (!UBCINFOEXISTS(vp) || (dontshrink && (nvap->nva_size < np->n_size))) {
1537			/* asked not to shrink, so stick with current size */
1538			FSDBG(527, np, np->n_size, np->n_vattr.nva_size, 0xf00d0001);
1539			nvap->nva_size = np->n_size;
1540			NATTRINVALIDATE(np);
1541		} else if ((np->n_flag & NMODIFIED) && (nvap->nva_size < np->n_size)) {
1542			/* if we've modified, stick with larger size */
1543			FSDBG(527, np, np->n_size, np->n_vattr.nva_size, 0xf00d0002);
1544			nvap->nva_size = np->n_size;
1545			npnvap->nva_size = np->n_size;
1546		} else {
1547			/*
1548			 * n_size is protected by the data lock, so we need to
1549			 * defer updating it until it's safe.  We save the new size
1550			 * and set a flag and it'll get updated the next time we get/drop
1551			 * the data lock or the next time we do a getattr.
1552			 */
1553			np->n_newsize = nvap->nva_size;
1554			SET(np->n_flag, NUPDATESIZE);
1555			if (monitored)
1556				events |= VNODE_EVENT_ATTRIB | VNODE_EVENT_EXTEND;
1557		}
1558	}
1559
1560	if (np->n_flag & NCHG) {
1561		if (np->n_flag & NACC) {
1562			nvap->nva_timesec[NFSTIME_ACCESS] = np->n_atim.tv_sec;
1563			nvap->nva_timensec[NFSTIME_ACCESS] = np->n_atim.tv_nsec;
1564		}
1565		if (np->n_flag & NUPD) {
1566			nvap->nva_timesec[NFSTIME_MODIFY] = np->n_mtim.tv_sec;
1567			nvap->nva_timensec[NFSTIME_MODIFY] = np->n_mtim.tv_nsec;
1568		}
1569	}
1570
1571out:
1572	if (monitored && events)
1573		nfs_vnode_notify(np, events);
1574	FSDBG_BOT(527, error, np, np->n_size, *xidp);
1575	return (error);
1576}
1577
1578/*
1579 * Calculate the attribute timeout based on
1580 * how recently the file has been modified.
1581 */
1582int
1583nfs_attrcachetimeout(nfsnode_t np)
1584{
1585	struct nfsmount *nmp;
1586	struct timeval now;
1587	int isdir;
1588	uint32_t timeo;
1589
1590	if (!(nmp = NFSTONMP(np)))
1591		return (0);
1592
1593	isdir = vnode_isdir(NFSTOV(np));
1594
1595	if ((nmp->nm_vers >= NFS_VER4) && (np->n_openflags & N_DELEG_MASK)) {
1596		/* If we have a delegation, we always use the max timeout. */
1597		timeo = isdir ? nmp->nm_acdirmax : nmp->nm_acregmax;
1598	} else if ((np)->n_flag & NMODIFIED) {
1599		/* If we have modifications, we always use the min timeout. */
1600		timeo = isdir ? nmp->nm_acdirmin : nmp->nm_acregmin;
1601	} else {
1602		/* Otherwise, we base the timeout on how old the file seems. */
1603		/* Note that if the client and server clocks are way out of sync, */
1604		/* timeout will probably get clamped to a min or max value */
1605		microtime(&now);
1606		timeo = (now.tv_sec - (np)->n_vattr.nva_timesec[NFSTIME_MODIFY]) / 10;
1607		if (isdir) {
1608			if (timeo < nmp->nm_acdirmin)
1609				timeo = nmp->nm_acdirmin;
1610			else if (timeo > nmp->nm_acdirmax)
1611				timeo = nmp->nm_acdirmax;
1612		} else {
1613			if (timeo < nmp->nm_acregmin)
1614				timeo = nmp->nm_acregmin;
1615			else if (timeo > nmp->nm_acregmax)
1616				timeo = nmp->nm_acregmax;
1617		}
1618	}
1619
1620	return (timeo);
1621}
1622
1623/*
1624 * Check the attribute cache time stamp.
1625 * If the cache is valid, copy contents to *nvaper and return 0
1626 * otherwise return an error.
1627 * Must be called with the node locked.
1628 */
1629int
1630nfs_getattrcache(nfsnode_t np, struct nfs_vattr *nvaper, int flags)
1631{
1632	struct nfs_vattr *nvap;
1633	struct timeval nowup;
1634	int32_t timeo;
1635
1636	/* Check if the attributes are valid. */
1637	if (!NATTRVALID(np) || ((flags & NGA_ACL) && !NACLVALID(np))) {
1638		FSDBG(528, np, 0, 0xffffff01, ENOENT);
1639		OSAddAtomic64(1, &nfsstats.attrcache_misses);
1640		return (ENOENT);
1641	}
1642
1643	/* Verify the cached attributes haven't timed out. */
1644	timeo = nfs_attrcachetimeout(np);
1645	microuptime(&nowup);
1646	if ((nowup.tv_sec - np->n_attrstamp) >= timeo) {
1647		FSDBG(528, np, 0, 0xffffff02, ENOENT);
1648		OSAddAtomic64(1, &nfsstats.attrcache_misses);
1649		return (ENOENT);
1650	}
1651	if ((flags & NGA_ACL) && ((nowup.tv_sec - np->n_aclstamp) >= timeo)) {
1652		FSDBG(528, np, 0, 0xffffff02, ENOENT);
1653		OSAddAtomic64(1, &nfsstats.attrcache_misses);
1654		return (ENOENT);
1655	}
1656
1657	nvap = &np->n_vattr;
1658	FSDBG(528, np, nvap->nva_size, np->n_size, 0xcace);
1659	OSAddAtomic64(1, &nfsstats.attrcache_hits);
1660
1661	if (nvap->nva_type != VREG) {
1662		np->n_size = nvap->nva_size;
1663	} else if (nvap->nva_size != np->n_size) {
1664		FSDBG(528, np, nvap->nva_size, np->n_size, (nvap->nva_type == VREG) | (np->n_flag & NMODIFIED ? 6 : 4));
1665		if ((np->n_flag & NMODIFIED) && (nvap->nva_size < np->n_size)) {
1666			/* if we've modified, stick with larger size */
1667			nvap->nva_size = np->n_size;
1668		} else {
1669			/*
1670			 * n_size is protected by the data lock, so we need to
1671			 * defer updating it until it's safe.  We save the new size
1672			 * and set a flag and it'll get updated the next time we get/drop
1673			 * the data lock or the next time we do a getattr.
1674			 */
1675			np->n_newsize = nvap->nva_size;
1676			SET(np->n_flag, NUPDATESIZE);
1677		}
1678	}
1679
1680	bcopy((caddr_t)nvap, (caddr_t)nvaper, sizeof(struct nfs_vattr));
1681	if (np->n_flag & NCHG) {
1682		if (np->n_flag & NACC) {
1683			nvaper->nva_timesec[NFSTIME_ACCESS] = np->n_atim.tv_sec;
1684			nvaper->nva_timensec[NFSTIME_ACCESS] = np->n_atim.tv_nsec;
1685		}
1686		if (np->n_flag & NUPD) {
1687			nvaper->nva_timesec[NFSTIME_MODIFY] = np->n_mtim.tv_sec;
1688			nvaper->nva_timensec[NFSTIME_MODIFY] = np->n_mtim.tv_nsec;
1689		}
1690	}
1691	if (nvap->nva_acl) {
1692		if (flags & NGA_ACL) {
1693			nvaper->nva_acl = kauth_acl_alloc(nvap->nva_acl->acl_entrycount);
1694			if (!nvaper->nva_acl)
1695				return (ENOMEM);
1696			bcopy(nvap->nva_acl, nvaper->nva_acl, KAUTH_ACL_COPYSIZE(nvap->nva_acl));
1697		} else {
1698			nvaper->nva_acl = NULL;
1699		}
1700	}
1701	return (0);
1702}
1703
1704/*
1705 * When creating file system objects:
1706 * Don't bother setting UID if it's the same as the credential performing the create.
1707 * Don't bother setting GID if it's the same as the directory or credential.
1708 */
1709void
1710nfs_avoid_needless_id_setting_on_create(nfsnode_t dnp, struct vnode_attr *vap, vfs_context_t ctx)
1711{
1712	if (VATTR_IS_ACTIVE(vap, va_uid)) {
1713		if (kauth_cred_getuid(vfs_context_ucred(ctx)) == vap->va_uid) {
1714			VATTR_CLEAR_ACTIVE(vap, va_uid);
1715			VATTR_CLEAR_ACTIVE(vap, va_uuuid);
1716		}
1717	}
1718	if (VATTR_IS_ACTIVE(vap, va_gid)) {
1719		if ((vap->va_gid == dnp->n_vattr.nva_gid) ||
1720		    (kauth_cred_getgid(vfs_context_ucred(ctx)) == vap->va_gid)) {
1721			VATTR_CLEAR_ACTIVE(vap, va_gid);
1722			VATTR_CLEAR_ACTIVE(vap, va_guuid);
1723		}
1724	}
1725}
1726
1727/*
1728 * Convert a universal address string to a sockaddr structure.
1729 *
1730 * Universal addresses can be in the following formats:
1731 *
1732 * d = decimal (IPv4)
1733 * x = hexadecimal (IPv6)
1734 * p = port (decimal)
1735 *
1736 * d.d.d.d
1737 * d.d.d.d.p.p
1738 * x:x:x:x:x:x:x:x
1739 * x:x:x:x:x:x:x:x.p.p
1740 * x:x:x:x:x:x:d.d.d.d
1741 * x:x:x:x:x:x:d.d.d.d.p.p
1742 *
1743 * IPv6 strings can also have a series of zeroes elided
1744 * IPv6 strings can also have a %scope suffix at the end (after any port)
1745 *
1746 * rules & exceptions:
1747 * - value before : is hex
1748 * - value before . is dec
1749 * - once . hit, all values are dec
1750 * - hex+port case means value before first dot is actually hex
1751 * - . is always preceded by digits except if last hex was double-colon
1752 *
1753 * scan, converting #s to bytes
1754 * first time a . is encountered, scan the rest to count them.
1755 * 2 dots = just port
1756 * 3 dots = just IPv4 no port
1757 * 5 dots = IPv4 and port
1758 */
1759
1760#define IS_DIGIT(C) \
1761	(((C) >= '0') && ((C) <= '9'))
1762
1763#define IS_XDIGIT(C) \
1764	(IS_DIGIT(C) || \
1765	 (((C) >= 'A') && ((C) <= 'F')) || \
1766	 (((C) >= 'a') && ((C) <= 'f')))
1767
1768int
1769nfs_uaddr2sockaddr(const char *uaddr, struct sockaddr *addr)
1770{
1771	const char *p, *pd;	/* pointers to current character in scan */
1772	const char *pnum;	/* pointer to current number to decode */
1773	const char *pscope;	/* pointer to IPv6 scope ID */
1774	uint8_t a[18];		/* octet array to store address bytes */
1775	int i;			/* index of next octet to decode */
1776	int dci;		/* index of octet to insert double-colon zeroes */
1777	int dcount, xdcount;	/* count of digits in current number */
1778	int needmore;		/* set when we know we need more input (e.g. after colon, period) */
1779	int dots;		/* # of dots */
1780	int hex;		/* contains hex values */
1781	unsigned long val;	/* decoded value */
1782	int s;			/* index used for sliding array to insert elided zeroes */
1783
1784#define HEXVALUE	0
1785#define DECIMALVALUE	1
1786#define GET(TYPE) \
1787	do { \
1788		if ((dcount <= 0) || (dcount > (((TYPE) == DECIMALVALUE) ? 3 : 4))) \
1789			return (0); \
1790		if (((TYPE) == DECIMALVALUE) && xdcount) \
1791			return (0); \
1792		val = strtoul(pnum, NULL, ((TYPE) == DECIMALVALUE) ? 10 : 16); \
1793		if (((TYPE) == DECIMALVALUE) && (val >= 256)) \
1794			return (0); \
1795		/* check if there is room left in the array */ \
1796		if (i > (int)(sizeof(a) - (((TYPE) == HEXVALUE) ? 2 : 1) - ((dci != -1) ? 2 : 0))) \
1797			return (0); \
1798		if ((TYPE) == HEXVALUE) \
1799			a[i++] = ((val >> 8) & 0xff); \
1800		a[i++] = (val & 0xff); \
1801	} while (0)
1802
1803	hex = 0;
1804	dots = 0;
1805	dci = -1;
1806	i = dcount = xdcount = 0;
1807	pnum = p = uaddr;
1808	pscope = NULL;
1809	needmore = 1;
1810	if ((*p == ':') && (*++p != ':')) /* if it starts with colon, gotta be a double */
1811		return (0);
1812
1813	while (*p) {
1814		if (IS_XDIGIT(*p)) {
1815			dcount++;
1816			if (!IS_DIGIT(*p))
1817				xdcount++;
1818			needmore = 0;
1819			p++;
1820		} else if (*p == '.') {
1821			/* rest is decimal IPv4 dotted quad and/or port */
1822			if (!dots) {
1823				/* this is the first, so count them */
1824				for (pd = p; *pd; pd++) {
1825					if (*pd == '.') {
1826						if (++dots > 5)
1827							return (0);
1828					} else if (hex && (*pd == '%')) {
1829						break;
1830					} else if ((*pd < '0') || (*pd > '9')) {
1831						return (0);
1832					}
1833				}
1834				if ((dots != 2) && (dots != 3) && (dots != 5))
1835					return (0);
1836				if (hex && (dots == 2)) { /* hex+port */
1837					if (!dcount && needmore)
1838						return (0);
1839					if (dcount) /* last hex may be elided zero */
1840						GET(HEXVALUE);
1841				} else {
1842					GET(DECIMALVALUE);
1843				}
1844			} else {
1845				GET(DECIMALVALUE);
1846			}
1847			dcount = xdcount = 0;
1848			needmore = 1;
1849			pnum = ++p;
1850		} else if (*p == ':') {
1851			hex = 1;
1852			if (dots)
1853				return (0);
1854			if (!dcount) { /* missing number, probably double colon */
1855				if (dci >= 0) /* can only have one double colon */
1856					return (0);
1857				dci = i;
1858				needmore = 0;
1859			} else {
1860				GET(HEXVALUE);
1861				dcount = xdcount = 0;
1862				needmore = 1;
1863			}
1864			pnum = ++p;
1865		} else if (*p == '%') { /* scope ID delimiter */
1866			if (!hex)
1867				return (0);
1868			p++;
1869			pscope = p;
1870			break;
1871		} else { /* unexpected character */
1872			return (0);
1873		}
1874	}
1875	if (needmore && !dcount)
1876		return (0);
1877	if (dcount) /* decode trailing number */
1878		GET(dots ? DECIMALVALUE : HEXVALUE);
1879	if (dci >= 0) {  /* got a double-colon at i, need to insert a range of zeroes */
1880		/* if we got a port, slide to end of array */
1881		/* otherwise, slide to end of address (non-port) values */
1882		int end = ((dots == 2) || (dots == 5)) ? sizeof(a) : (sizeof(a) - 2);
1883		if (i % 2) /* length of zero range must be multiple of 2 */
1884			return (0);
1885		if (i >= end) /* no room? */
1886			return (0);
1887		/* slide (i-dci) numbers up from index dci */
1888		for (s=0; s < (i - dci); s++)
1889			a[end-1-s] = a[i-1-s];
1890		/* zero (end-i) numbers at index dci */
1891		for (s=0; s < (end - i); s++)
1892			a[dci+s] = 0;
1893		i = end;
1894	}
1895
1896	/* copy out resulting socket address */
1897	if (hex) {
1898		struct sockaddr_in6 *sin6 = (struct sockaddr_in6*)addr;
1899		if ((((dots == 0) || (dots == 3)) && (i != (sizeof(a)-2))))
1900			return (0);
1901		if ((((dots == 2) || (dots == 5)) && (i != sizeof(a))))
1902			return (0);
1903		bzero(sin6, sizeof(struct sockaddr_in6));
1904		sin6->sin6_len = sizeof(struct sockaddr_in6);
1905		sin6->sin6_family = AF_INET6;
1906		bcopy(a, &sin6->sin6_addr.s6_addr, sizeof(struct in6_addr));
1907		if ((dots == 5) || (dots == 2))
1908			sin6->sin6_port = htons((a[16] << 8) | a[17]);
1909		if (pscope) {
1910			for (p=pscope; IS_DIGIT(*p); p++)
1911				;
1912			if (*p && !IS_DIGIT(*p)) { /* name */
1913				ifnet_t interface = NULL;
1914				if (ifnet_find_by_name(pscope, &interface) == 0)
1915					sin6->sin6_scope_id = ifnet_index(interface);
1916				if (interface)
1917					ifnet_release(interface);
1918			} else { /* decimal number */
1919				sin6->sin6_scope_id = strtoul(pscope, NULL, 10);
1920			}
1921			/* XXX should we also embed scope id for linklocal? */
1922		}
1923	} else {
1924		struct sockaddr_in *sin = (struct sockaddr_in*)addr;
1925		if ((dots != 3) && (dots != 5))
1926			return (0);
1927		if ((dots == 3) && (i != 4))
1928			return (0);
1929		if ((dots == 5) && (i != 6))
1930			return (0);
1931		bzero(sin, sizeof(struct sockaddr_in));
1932		sin->sin_len = sizeof(struct sockaddr_in);
1933		sin->sin_family = AF_INET;
1934		bcopy(a, &sin->sin_addr.s_addr, sizeof(struct in_addr));
1935		if (dots == 5)
1936			sin->sin_port = htons((a[4] << 8) | a[5]);
1937	}
1938	return (1);
1939}
1940
1941
1942#endif /* NFSCLIENT */
1943
1944/*
1945 * Schedule a callout thread to run an NFS timer function
1946 * interval milliseconds in the future.
1947 */
1948void
1949nfs_interval_timer_start(thread_call_t call, int interval)
1950{
1951	uint64_t deadline;
1952
1953	clock_interval_to_deadline(interval, 1000 * 1000, &deadline);
1954	thread_call_enter_delayed(call, deadline);
1955}
1956
1957
1958#if NFSSERVER
1959
1960int nfsrv_cmp_secflavs(struct nfs_sec *, struct nfs_sec *);
1961int nfsrv_hang_addrlist(struct nfs_export *, struct user_nfs_export_args *);
1962int nfsrv_free_netopt(struct radix_node *, void *);
1963int nfsrv_free_addrlist(struct nfs_export *, struct user_nfs_export_args *);
1964struct nfs_export_options *nfsrv_export_lookup(struct nfs_export *, mbuf_t);
1965struct nfs_export *nfsrv_fhtoexport(struct nfs_filehandle *);
1966struct nfs_user_stat_node *nfsrv_get_user_stat_node(struct nfs_active_user_list *, struct sockaddr *, uid_t);
1967void nfsrv_init_user_list(struct nfs_active_user_list *);
1968void nfsrv_free_user_list(struct nfs_active_user_list *);
1969
1970/*
1971 * add NFSv3 WCC data to an mbuf chain
1972 */
1973int
1974nfsm_chain_add_wcc_data_f(
1975	struct nfsrv_descript *nd,
1976	struct nfsm_chain *nmc,
1977	int preattrerr,
1978	struct vnode_attr *prevap,
1979	int postattrerr,
1980	struct vnode_attr *postvap)
1981{
1982	int error = 0;
1983
1984	if (preattrerr) {
1985		nfsm_chain_add_32(error, nmc, FALSE);
1986	} else {
1987		nfsm_chain_add_32(error, nmc, TRUE);
1988		nfsm_chain_add_64(error, nmc, prevap->va_data_size);
1989		nfsm_chain_add_time(error, nmc, NFS_VER3, &prevap->va_modify_time);
1990		nfsm_chain_add_time(error, nmc, NFS_VER3, &prevap->va_change_time);
1991	}
1992	nfsm_chain_add_postop_attr(error, nd, nmc, postattrerr, postvap);
1993
1994	return (error);
1995}
1996
1997/*
1998 * Extract a lookup path from the given mbufs and store it in
1999 * a newly allocated buffer saved in the given nameidata structure.
2000 */
2001int
2002nfsm_chain_get_path_namei(
2003	struct nfsm_chain *nmc,
2004	uint32_t len,
2005	struct nameidata *nip)
2006{
2007	struct componentname *cnp = &nip->ni_cnd;
2008	int error = 0;
2009	char *cp;
2010
2011	if (len > (MAXPATHLEN - 1))
2012		return (ENAMETOOLONG);
2013
2014	/*
2015	 * Get a buffer for the name to be translated, and copy the
2016	 * name into the buffer.
2017	 */
2018	MALLOC_ZONE(cnp->cn_pnbuf, caddr_t, MAXPATHLEN, M_NAMEI, M_WAITOK);
2019	if (!cnp->cn_pnbuf)
2020		return (ENOMEM);
2021	cnp->cn_pnlen = MAXPATHLEN;
2022	cnp->cn_flags |= HASBUF;
2023
2024	/* Copy the name from the mbuf list to the string */
2025	cp = cnp->cn_pnbuf;
2026	nfsm_chain_get_opaque(error, nmc, len, cp);
2027	if (error)
2028		goto out;
2029	cnp->cn_pnbuf[len] = '\0';
2030
2031	/* sanity check the string */
2032	if ((strlen(cp) != len) || strchr(cp, '/'))
2033		error = EACCES;
2034out:
2035	if (error) {
2036		if (cnp->cn_pnbuf)
2037			FREE_ZONE(cnp->cn_pnbuf, MAXPATHLEN, M_NAMEI);
2038		cnp->cn_flags &= ~HASBUF;
2039	} else {
2040		nip->ni_pathlen = len;
2041	}
2042	return (error);
2043}
2044
2045/*
2046 * Set up nameidata for a lookup() call and do it.
2047 */
2048int
2049nfsrv_namei(
2050	struct nfsrv_descript *nd,
2051	vfs_context_t ctx,
2052	struct nameidata *nip,
2053	struct nfs_filehandle *nfhp,
2054	vnode_t *retdirp,
2055	struct nfs_export **nxp,
2056	struct nfs_export_options **nxop)
2057{
2058	vnode_t dp;
2059	int error;
2060	struct componentname *cnp = &nip->ni_cnd;
2061	uint32_t cnflags;
2062	char *tmppn;
2063
2064	*retdirp = NULL;
2065
2066	/*
2067	 * Extract and set starting directory.
2068	 */
2069	error = nfsrv_fhtovp(nfhp, nd, &dp, nxp, nxop);
2070	if (error)
2071		goto out;
2072	error = nfsrv_credcheck(nd, ctx, *nxp, *nxop);
2073	if (error || (vnode_vtype(dp) != VDIR)) {
2074		vnode_put(dp);
2075		error = ENOTDIR;
2076		goto out;
2077	}
2078	*retdirp = dp;
2079
2080	nip->ni_cnd.cn_context = ctx;
2081
2082	if (*nxop && ((*nxop)->nxo_flags & NX_READONLY))
2083		cnp->cn_flags |= RDONLY;
2084
2085	cnp->cn_flags |= NOCROSSMOUNT;
2086	cnp->cn_nameptr = cnp->cn_pnbuf;
2087	nip->ni_usedvp = nip->ni_startdir = dp;
2088
2089	/*
2090	 * And call lookup() to do the real work
2091	 */
2092	cnflags = nip->ni_cnd.cn_flags; /* store in case we have to restore */
2093	while ((error = lookup(nip)) == ERECYCLE) {
2094		nip->ni_cnd.cn_flags = cnflags;
2095		cnp->cn_nameptr = cnp->cn_pnbuf;
2096		nip->ni_usedvp = nip->ni_dvp = nip->ni_startdir = dp;
2097	}
2098	if (error)
2099		goto out;
2100
2101	/* Check for encountering a symbolic link */
2102	if (cnp->cn_flags & ISSYMLINK) {
2103#if CONFIG_VFS_FUNNEL
2104	        if ((cnp->cn_flags & FSNODELOCKHELD)) {
2105		        cnp->cn_flags &= ~FSNODELOCKHELD;
2106			unlock_fsnode(nip->ni_dvp, NULL);
2107		}
2108#endif /* CONFIG_VFS_FUNNEL */
2109		if (cnp->cn_flags & (LOCKPARENT | WANTPARENT))
2110			vnode_put(nip->ni_dvp);
2111		if (nip->ni_vp) {
2112			vnode_put(nip->ni_vp);
2113			nip->ni_vp = NULL;
2114		}
2115		error = EINVAL;
2116	}
2117out:
2118	if (error) {
2119		tmppn = cnp->cn_pnbuf;
2120		cnp->cn_pnbuf = NULL;
2121		cnp->cn_flags &= ~HASBUF;
2122		FREE_ZONE(tmppn, cnp->cn_pnlen, M_NAMEI);
2123	}
2124	return (error);
2125}
2126
2127/*
2128 * A fiddled version of m_adj() that ensures null fill to a 4-byte
2129 * boundary and only trims off the back end
2130 */
2131void
2132nfsm_adj(mbuf_t mp, int len, int nul)
2133{
2134	mbuf_t m, mnext;
2135	int count, i, mlen;
2136	char *cp;
2137
2138	/*
2139	 * Trim from tail.  Scan the mbuf chain,
2140	 * calculating its length and finding the last mbuf.
2141	 * If the adjustment only affects this mbuf, then just
2142	 * adjust and return.  Otherwise, rescan and truncate
2143	 * after the remaining size.
2144	 */
2145	count = 0;
2146	m = mp;
2147	for (;;) {
2148		mlen = mbuf_len(m);
2149		count += mlen;
2150		mnext = mbuf_next(m);
2151		if (mnext == NULL)
2152			break;
2153		m = mnext;
2154	}
2155	if (mlen > len) {
2156		mlen -= len;
2157		mbuf_setlen(m, mlen);
2158		if (nul > 0) {
2159			cp = (caddr_t)mbuf_data(m) + mlen - nul;
2160			for (i = 0; i < nul; i++)
2161				*cp++ = '\0';
2162		}
2163		return;
2164	}
2165	count -= len;
2166	if (count < 0)
2167		count = 0;
2168	/*
2169	 * Correct length for chain is "count".
2170	 * Find the mbuf with last data, adjust its length,
2171	 * and toss data from remaining mbufs on chain.
2172	 */
2173	for (m = mp; m; m = mbuf_next(m)) {
2174		mlen = mbuf_len(m);
2175		if (mlen >= count) {
2176			mlen = count;
2177			mbuf_setlen(m, count);
2178			if (nul > 0) {
2179				cp = (caddr_t)mbuf_data(m) + mlen - nul;
2180				for (i = 0; i < nul; i++)
2181					*cp++ = '\0';
2182			}
2183			break;
2184		}
2185		count -= mlen;
2186	}
2187	for (m = mbuf_next(m); m; m = mbuf_next(m))
2188		mbuf_setlen(m, 0);
2189}
2190
2191/*
2192 * Trim the header out of the mbuf list and trim off any trailing
2193 * junk so that the mbuf list has only the write data.
2194 */
2195int
2196nfsm_chain_trim_data(struct nfsm_chain *nmc, int len, int *mlen)
2197{
2198	int cnt = 0, dlen, adjust;
2199	caddr_t data;
2200	mbuf_t m;
2201
2202	if (mlen)
2203		*mlen = 0;
2204
2205	/* trim header */
2206	for (m = nmc->nmc_mhead; m && (m != nmc->nmc_mcur); m = mbuf_next(m))
2207		mbuf_setlen(m, 0);
2208	if (!m)
2209		return (EIO);
2210
2211	/* trim current mbuf */
2212	data = mbuf_data(m);
2213	dlen = mbuf_len(m);
2214	adjust = nmc->nmc_ptr - data;
2215	dlen -= adjust;
2216	if ((dlen > 0) && (adjust > 0)) {
2217		if (mbuf_setdata(m, nmc->nmc_ptr, dlen))
2218			return(EIO);
2219	} else
2220		mbuf_setlen(m, dlen);
2221
2222	/* skip next len bytes  */
2223	for (; m && (cnt < len); m = mbuf_next(m)) {
2224		dlen = mbuf_len(m);
2225		cnt += dlen;
2226		if (cnt > len) {
2227			/* truncate to end of data */
2228			mbuf_setlen(m, dlen - (cnt - len));
2229			if (m == nmc->nmc_mcur)
2230				nmc->nmc_left -= (cnt - len);
2231			cnt = len;
2232		}
2233	}
2234	if (mlen)
2235		*mlen = cnt;
2236
2237	/* trim any trailing data */
2238	if (m == nmc->nmc_mcur)
2239		nmc->nmc_left = 0;
2240	for (; m; m = mbuf_next(m))
2241		mbuf_setlen(m, 0);
2242
2243	return (0);
2244}
2245
2246int
2247nfsm_chain_add_fattr(
2248	struct nfsrv_descript *nd,
2249	struct nfsm_chain *nmc,
2250	struct vnode_attr *vap)
2251{
2252	int error = 0;
2253
2254	// XXX Should we assert here that all fields are supported?
2255
2256	nfsm_chain_add_32(error, nmc, vtonfs_type(vap->va_type, nd->nd_vers));
2257	if (nd->nd_vers == NFS_VER3) {
2258		nfsm_chain_add_32(error, nmc, vap->va_mode & 07777);
2259	} else {
2260		nfsm_chain_add_32(error, nmc, vtonfsv2_mode(vap->va_type, vap->va_mode));
2261	}
2262	nfsm_chain_add_32(error, nmc, vap->va_nlink);
2263	nfsm_chain_add_32(error, nmc, vap->va_uid);
2264	nfsm_chain_add_32(error, nmc, vap->va_gid);
2265	if (nd->nd_vers == NFS_VER3) {
2266		nfsm_chain_add_64(error, nmc, vap->va_data_size);
2267		nfsm_chain_add_64(error, nmc, vap->va_data_alloc);
2268		nfsm_chain_add_32(error, nmc, major(vap->va_rdev));
2269		nfsm_chain_add_32(error, nmc, minor(vap->va_rdev));
2270		nfsm_chain_add_64(error, nmc, vap->va_fsid);
2271		nfsm_chain_add_64(error, nmc, vap->va_fileid);
2272	} else {
2273		nfsm_chain_add_32(error, nmc, vap->va_data_size);
2274		nfsm_chain_add_32(error, nmc, NFS_FABLKSIZE);
2275		if (vap->va_type == VFIFO)
2276			nfsm_chain_add_32(error, nmc, 0xffffffff);
2277		else
2278			nfsm_chain_add_32(error, nmc, vap->va_rdev);
2279		nfsm_chain_add_32(error, nmc, vap->va_data_alloc / NFS_FABLKSIZE);
2280		nfsm_chain_add_32(error, nmc, vap->va_fsid);
2281		nfsm_chain_add_32(error, nmc, vap->va_fileid);
2282	}
2283	nfsm_chain_add_time(error, nmc, nd->nd_vers, &vap->va_access_time);
2284	nfsm_chain_add_time(error, nmc, nd->nd_vers, &vap->va_modify_time);
2285	nfsm_chain_add_time(error, nmc, nd->nd_vers, &vap->va_change_time);
2286
2287	return (error);
2288}
2289
2290int
2291nfsm_chain_get_sattr(
2292	struct nfsrv_descript *nd,
2293	struct nfsm_chain *nmc,
2294	struct vnode_attr *vap)
2295{
2296	int error = 0;
2297	uint32_t val = 0;
2298	uint64_t val64;
2299	struct timespec now;
2300
2301	if (nd->nd_vers == NFS_VER2) {
2302		/*
2303		 * There is/was a bug in the Sun client that puts 0xffff in the mode
2304		 * field of sattr when it should put in 0xffffffff.  The u_short
2305		 * doesn't sign extend.  So check the low order 2 bytes for 0xffff.
2306		 */
2307		nfsm_chain_get_32(error, nmc, val);
2308		if ((val & 0xffff) != 0xffff) {
2309			VATTR_SET(vap, va_mode, val & 07777);
2310			/* save the "type" bits for NFSv2 create */
2311			VATTR_SET(vap, va_type, IFTOVT(val));
2312			VATTR_CLEAR_ACTIVE(vap, va_type);
2313		}
2314		nfsm_chain_get_32(error, nmc, val);
2315		if (val != (uint32_t)-1)
2316			VATTR_SET(vap, va_uid, val);
2317		nfsm_chain_get_32(error, nmc, val);
2318		if (val != (uint32_t)-1)
2319			VATTR_SET(vap, va_gid, val);
2320		/* save the "size" bits for NFSv2 create (even if they appear unset) */
2321		nfsm_chain_get_32(error, nmc, val);
2322		VATTR_SET(vap, va_data_size, val);
2323		if (val == (uint32_t)-1)
2324			VATTR_CLEAR_ACTIVE(vap, va_data_size);
2325		nfsm_chain_get_time(error, nmc, NFS_VER2,
2326			vap->va_access_time.tv_sec,
2327			vap->va_access_time.tv_nsec);
2328		if (vap->va_access_time.tv_sec != -1)
2329			VATTR_SET_ACTIVE(vap, va_access_time);
2330		nfsm_chain_get_time(error, nmc, NFS_VER2,
2331			vap->va_modify_time.tv_sec,
2332			vap->va_modify_time.tv_nsec);
2333		if (vap->va_modify_time.tv_sec != -1)
2334			VATTR_SET_ACTIVE(vap, va_modify_time);
2335		return (error);
2336	}
2337
2338	/* NFSv3 */
2339	nfsm_chain_get_32(error, nmc, val);
2340	if (val) {
2341		nfsm_chain_get_32(error, nmc, val);
2342		VATTR_SET(vap, va_mode, val & 07777);
2343	}
2344	nfsm_chain_get_32(error, nmc, val);
2345	if (val) {
2346		nfsm_chain_get_32(error, nmc, val);
2347		VATTR_SET(vap, va_uid, val);
2348	}
2349	nfsm_chain_get_32(error, nmc, val);
2350	if (val) {
2351		nfsm_chain_get_32(error, nmc, val);
2352		VATTR_SET(vap, va_gid, val);
2353	}
2354	nfsm_chain_get_32(error, nmc, val);
2355	if (val) {
2356		nfsm_chain_get_64(error, nmc, val64);
2357		VATTR_SET(vap, va_data_size, val64);
2358	}
2359	nanotime(&now);
2360	nfsm_chain_get_32(error, nmc, val);
2361	switch (val) {
2362	case NFS_TIME_SET_TO_CLIENT:
2363		nfsm_chain_get_time(error, nmc, nd->nd_vers,
2364			vap->va_access_time.tv_sec,
2365			vap->va_access_time.tv_nsec);
2366		VATTR_SET_ACTIVE(vap, va_access_time);
2367		vap->va_vaflags &= ~VA_UTIMES_NULL;
2368		break;
2369	case NFS_TIME_SET_TO_SERVER:
2370		VATTR_SET(vap, va_access_time, now);
2371		vap->va_vaflags |= VA_UTIMES_NULL;
2372		break;
2373	}
2374	nfsm_chain_get_32(error, nmc, val);
2375	switch (val) {
2376	case NFS_TIME_SET_TO_CLIENT:
2377		nfsm_chain_get_time(error, nmc, nd->nd_vers,
2378			vap->va_modify_time.tv_sec,
2379			vap->va_modify_time.tv_nsec);
2380		VATTR_SET_ACTIVE(vap, va_modify_time);
2381		vap->va_vaflags &= ~VA_UTIMES_NULL;
2382		break;
2383	case NFS_TIME_SET_TO_SERVER:
2384		VATTR_SET(vap, va_modify_time, now);
2385		if (!VATTR_IS_ACTIVE(vap, va_access_time))
2386			vap->va_vaflags |= VA_UTIMES_NULL;
2387		break;
2388	}
2389
2390	return (error);
2391}
2392
2393/*
2394 * Compare two security flavor structs
2395 */
2396int
2397nfsrv_cmp_secflavs(struct nfs_sec *sf1, struct nfs_sec *sf2)
2398{
2399	int i;
2400
2401	if (sf1->count != sf2->count)
2402		return 1;
2403	for (i = 0; i < sf1->count; i++)
2404		if (sf1->flavors[i] != sf2->flavors[i])
2405			return 1;
2406	return 0;
2407}
2408
2409/*
2410 * Build hash lists of net addresses and hang them off the NFS export.
2411 * Called by nfsrv_export() to set up the lists of export addresses.
2412 */
2413int
2414nfsrv_hang_addrlist(struct nfs_export *nx, struct user_nfs_export_args *unxa)
2415{
2416	struct nfs_export_net_args nxna;
2417	struct nfs_netopt *no, *rn_no;
2418	struct radix_node_head *rnh;
2419	struct radix_node *rn;
2420	struct sockaddr *saddr, *smask;
2421	struct domain *dom;
2422	int i, error;
2423	unsigned int net;
2424	user_addr_t uaddr;
2425	kauth_cred_t cred;
2426
2427	uaddr = unxa->nxa_nets;
2428	for (net = 0; net < unxa->nxa_netcount; net++, uaddr += sizeof(nxna)) {
2429		error = copyin(uaddr, &nxna, sizeof(nxna));
2430		if (error)
2431			return (error);
2432
2433		if (nxna.nxna_flags & (NX_MAPROOT|NX_MAPALL)) {
2434			struct posix_cred temp_pcred;
2435		        bzero(&temp_pcred, sizeof(temp_pcred));
2436			temp_pcred.cr_uid = nxna.nxna_cred.cr_uid;
2437			temp_pcred.cr_ngroups = nxna.nxna_cred.cr_ngroups;
2438			for (i=0; i < nxna.nxna_cred.cr_ngroups && i < NGROUPS; i++)
2439				temp_pcred.cr_groups[i] = nxna.nxna_cred.cr_groups[i];
2440			cred = posix_cred_create(&temp_pcred);
2441			if (!IS_VALID_CRED(cred))
2442				return (ENOMEM);
2443		} else {
2444			cred = NOCRED;
2445		}
2446
2447		if (nxna.nxna_addr.ss_len == 0) {
2448			/* No address means this is a default/world export */
2449			if (nx->nx_flags & NX_DEFAULTEXPORT) {
2450			        if (IS_VALID_CRED(cred))
2451				        kauth_cred_unref(&cred);
2452				return (EEXIST);
2453			}
2454			nx->nx_flags |= NX_DEFAULTEXPORT;
2455			nx->nx_defopt.nxo_flags = nxna.nxna_flags;
2456			nx->nx_defopt.nxo_cred = cred;
2457			bcopy(&nxna.nxna_sec, &nx->nx_defopt.nxo_sec, sizeof(struct nfs_sec));
2458			nx->nx_expcnt++;
2459			continue;
2460		}
2461
2462		i = sizeof(struct nfs_netopt);
2463		i += nxna.nxna_addr.ss_len + nxna.nxna_mask.ss_len;
2464		MALLOC(no, struct nfs_netopt *, i, M_NETADDR, M_WAITOK);
2465		if (!no) {
2466			if (IS_VALID_CRED(cred))
2467				kauth_cred_unref(&cred);
2468			return (ENOMEM);
2469		}
2470		bzero(no, sizeof(struct nfs_netopt));
2471		no->no_opt.nxo_flags = nxna.nxna_flags;
2472		no->no_opt.nxo_cred = cred;
2473		bcopy(&nxna.nxna_sec, &no->no_opt.nxo_sec, sizeof(struct nfs_sec));
2474
2475		saddr = (struct sockaddr *)(no + 1);
2476		bcopy(&nxna.nxna_addr, saddr, nxna.nxna_addr.ss_len);
2477		if (nxna.nxna_mask.ss_len) {
2478			smask = (struct sockaddr *)((caddr_t)saddr + nxna.nxna_addr.ss_len);
2479			bcopy(&nxna.nxna_mask, smask, nxna.nxna_mask.ss_len);
2480		} else {
2481			smask = NULL;
2482		}
2483		i = saddr->sa_family;
2484		if ((rnh = nx->nx_rtable[i]) == 0) {
2485			/*
2486			 * Seems silly to initialize every AF when most are not
2487			 * used, do so on demand here
2488			 */
2489			for (dom = domains; dom; dom = dom->dom_next)
2490				if (dom->dom_family == i && dom->dom_rtattach) {
2491					dom->dom_rtattach((void **)&nx->nx_rtable[i],
2492						dom->dom_rtoffset);
2493					break;
2494				}
2495			if ((rnh = nx->nx_rtable[i]) == 0) {
2496			        if (IS_VALID_CRED(cred))
2497				        kauth_cred_unref(&cred);
2498				_FREE(no, M_NETADDR);
2499				return (ENOBUFS);
2500			}
2501		}
2502		rn = (*rnh->rnh_addaddr)((caddr_t)saddr, (caddr_t)smask, rnh, no->no_rnodes);
2503		if (rn == 0) {
2504			/*
2505			 * One of the reasons that rnh_addaddr may fail is that
2506			 * the entry already exists. To check for this case, we
2507			 * look up the entry to see if it is there. If so, we
2508			 * do not need to make a new entry but do continue.
2509			 *
2510			 * XXX should this be rnh_lookup() instead?
2511			 */
2512			int matched = 0;
2513			rn = (*rnh->rnh_matchaddr)((caddr_t)saddr, rnh);
2514			rn_no = (struct nfs_netopt *)rn;
2515			if (rn != 0 && (rn->rn_flags & RNF_ROOT) == 0 &&
2516			    (rn_no->no_opt.nxo_flags == nxna.nxna_flags) &&
2517			    (!nfsrv_cmp_secflavs(&rn_no->no_opt.nxo_sec, &nxna.nxna_sec))) {
2518				kauth_cred_t cred2 = rn_no->no_opt.nxo_cred;
2519				if (cred == cred2) {
2520					/* creds are same (or both NULL) */
2521					matched = 1;
2522				} else if (cred && cred2 && (kauth_cred_getuid(cred) == kauth_cred_getuid(cred2))) {
2523				    /*
2524				     * Now compare the effective and
2525				     * supplementary groups...
2526				     *
2527				     * Note: This comparison, as written,
2528				     * does not correctly indicate that
2529				     * the groups are equivalent, since
2530				     * other than the first supplementary
2531				     * group, which is also the effective
2532				     * group, order on the remaining groups
2533				     * doesn't matter, and this is an
2534				     * ordered compare.
2535				     */
2536				    gid_t groups[NGROUPS];
2537				    gid_t groups2[NGROUPS];
2538				    int groupcount = NGROUPS;
2539				    int group2count = NGROUPS;
2540
2541				    if (!kauth_cred_getgroups(cred, groups, &groupcount) &&
2542					!kauth_cred_getgroups(cred2, groups2, &group2count) &&
2543					groupcount == group2count) {
2544					    for (i=0; i < group2count; i++)
2545						    if (groups[i] != groups2[i])
2546							    break;
2547					    if (i >= group2count || i >= NGROUPS)
2548					    matched = 1;
2549				    }
2550				}
2551			}
2552			if (IS_VALID_CRED(cred))
2553			        kauth_cred_unref(&cred);
2554			_FREE(no, M_NETADDR);
2555			if (matched)
2556				continue;
2557			return (EPERM);
2558		}
2559		nx->nx_expcnt++;
2560	}
2561
2562	return (0);
2563}
2564
2565/*
2566 * In order to properly track an export's netopt count, we need to pass
2567 * an additional argument to nfsrv_free_netopt() so that it can decrement
2568 * the export's netopt count.
2569 */
2570struct nfsrv_free_netopt_arg {
2571	uint32_t *cnt;
2572	struct radix_node_head *rnh;
2573};
2574
2575int
2576nfsrv_free_netopt(struct radix_node *rn, void *w)
2577{
2578	struct nfsrv_free_netopt_arg *fna = (struct nfsrv_free_netopt_arg *)w;
2579	struct radix_node_head *rnh = fna->rnh;
2580	uint32_t *cnt = fna->cnt;
2581	struct nfs_netopt *nno = (struct nfs_netopt *)rn;
2582
2583	(*rnh->rnh_deladdr)(rn->rn_key, rn->rn_mask, rnh);
2584	if (IS_VALID_CRED(nno->no_opt.nxo_cred))
2585		kauth_cred_unref(&nno->no_opt.nxo_cred);
2586	_FREE((caddr_t)rn, M_NETADDR);
2587	*cnt -= 1;
2588	return (0);
2589}
2590
2591/*
2592 * Free the net address hash lists that are hanging off the mount points.
2593 */
2594int
2595nfsrv_free_addrlist(struct nfs_export *nx, struct user_nfs_export_args *unxa)
2596{
2597	struct nfs_export_net_args nxna;
2598	struct radix_node_head *rnh;
2599	struct radix_node *rn;
2600	struct nfsrv_free_netopt_arg fna;
2601	struct nfs_netopt *nno;
2602	user_addr_t uaddr;
2603	unsigned int net;
2604	int i, error;
2605
2606	if (!unxa || !unxa->nxa_netcount) {
2607		/* delete everything */
2608		for (i = 0; i <= AF_MAX; i++)
2609			if ( (rnh = nx->nx_rtable[i]) ) {
2610				fna.rnh = rnh;
2611				fna.cnt = &nx->nx_expcnt;
2612				(*rnh->rnh_walktree)(rnh, nfsrv_free_netopt, (caddr_t)&fna);
2613				_FREE((caddr_t)rnh, M_RTABLE);
2614				nx->nx_rtable[i] = 0;
2615			}
2616		return (0);
2617	}
2618
2619	/* delete only the exports specified */
2620	uaddr = unxa->nxa_nets;
2621	for (net = 0; net < unxa->nxa_netcount; net++, uaddr += sizeof(nxna)) {
2622		error = copyin(uaddr, &nxna, sizeof(nxna));
2623		if (error)
2624			return (error);
2625
2626		if (nxna.nxna_addr.ss_len == 0) {
2627			/* No address means this is a default/world export */
2628			if (nx->nx_flags & NX_DEFAULTEXPORT) {
2629				nx->nx_flags &= ~NX_DEFAULTEXPORT;
2630				if (IS_VALID_CRED(nx->nx_defopt.nxo_cred)) {
2631					kauth_cred_unref(&nx->nx_defopt.nxo_cred);
2632				}
2633				nx->nx_expcnt--;
2634			}
2635			continue;
2636		}
2637
2638		if ((rnh = nx->nx_rtable[nxna.nxna_addr.ss_family]) == 0) {
2639			/* AF not initialized? */
2640			if (!(unxa->nxa_flags & NXA_ADD))
2641				printf("nfsrv_free_addrlist: address not found (0)\n");
2642			continue;
2643		}
2644
2645		rn = (*rnh->rnh_lookup)(&nxna.nxna_addr,
2646			nxna.nxna_mask.ss_len ? &nxna.nxna_mask : NULL, rnh);
2647		if (!rn || (rn->rn_flags & RNF_ROOT)) {
2648			if (!(unxa->nxa_flags & NXA_ADD))
2649				printf("nfsrv_free_addrlist: address not found (1)\n");
2650			continue;
2651		}
2652
2653		(*rnh->rnh_deladdr)(rn->rn_key, rn->rn_mask, rnh);
2654		nno = (struct nfs_netopt *)rn;
2655		if (IS_VALID_CRED(nno->no_opt.nxo_cred))
2656			kauth_cred_unref(&nno->no_opt.nxo_cred);
2657		_FREE((caddr_t)rn, M_NETADDR);
2658
2659		nx->nx_expcnt--;
2660		if (nx->nx_expcnt == ((nx->nx_flags & NX_DEFAULTEXPORT) ? 1 : 0)) {
2661			/* no more entries in rnh, so free it up */
2662			_FREE((caddr_t)rnh, M_RTABLE);
2663			nx->nx_rtable[nxna.nxna_addr.ss_family] = 0;
2664		}
2665	}
2666
2667	return (0);
2668}
2669
2670void enablequotas(struct mount *mp, vfs_context_t ctx); // XXX
2671
2672int
2673nfsrv_export(struct user_nfs_export_args *unxa, vfs_context_t ctx)
2674{
2675	int error = 0;
2676	size_t pathlen;
2677	struct nfs_exportfs *nxfs, *nxfs2, *nxfs3;
2678	struct nfs_export *nx, *nx2, *nx3;
2679	struct nfs_filehandle nfh;
2680	struct nameidata mnd, xnd;
2681	vnode_t mvp = NULL, xvp = NULL;
2682	mount_t mp = NULL;
2683	char path[MAXPATHLEN];
2684	int expisroot;
2685
2686	if (unxa->nxa_flags == NXA_CHECK) {
2687		/* just check if the path is an NFS-exportable file system */
2688		error = copyinstr(unxa->nxa_fspath, path, MAXPATHLEN, &pathlen);
2689		if (error)
2690			return (error);
2691		NDINIT(&mnd, LOOKUP, OP_LOOKUP, FOLLOW | LOCKLEAF | AUDITVNPATH1,
2692			UIO_SYSSPACE, CAST_USER_ADDR_T(path), ctx);
2693		error = namei(&mnd);
2694		if (error)
2695			return (error);
2696		mvp = mnd.ni_vp;
2697		mp = vnode_mount(mvp);
2698		/* make sure it's the root of a file system */
2699		if (!vnode_isvroot(mvp))
2700			error = EINVAL;
2701		/* make sure the file system is NFS-exportable */
2702		if (!error) {
2703			nfh.nfh_len = NFSV3_MAX_FID_SIZE;
2704			error = VFS_VPTOFH(mvp, (int*)&nfh.nfh_len, &nfh.nfh_fid[0], NULL);
2705		}
2706		if (!error && (nfh.nfh_len > (int)NFSV3_MAX_FID_SIZE))
2707			error = EIO;
2708		if (!error && !(mp->mnt_vtable->vfc_vfsflags & VFC_VFSREADDIR_EXTENDED))
2709			error = EISDIR;
2710		vnode_put(mvp);
2711		nameidone(&mnd);
2712		return (error);
2713	}
2714
2715	/* all other operations: must be super user */
2716	if ((error = vfs_context_suser(ctx)))
2717		return (error);
2718
2719	if (unxa->nxa_flags & NXA_DELETE_ALL) {
2720		/* delete all exports on all file systems */
2721		lck_rw_lock_exclusive(&nfsrv_export_rwlock);
2722		while ((nxfs = LIST_FIRST(&nfsrv_exports))) {
2723			mp = vfs_getvfs_by_mntonname(nxfs->nxfs_path);
2724			if (mp) {
2725				vfs_clearflags(mp, MNT_EXPORTED);
2726				mount_iterdrop(mp);
2727				mp = NULL;
2728			}
2729			/* delete all exports on this file system */
2730			while ((nx = LIST_FIRST(&nxfs->nxfs_exports))) {
2731				LIST_REMOVE(nx, nx_next);
2732				LIST_REMOVE(nx, nx_hash);
2733				/* delete all netopts for this export */
2734				nfsrv_free_addrlist(nx, NULL);
2735				nx->nx_flags &= ~NX_DEFAULTEXPORT;
2736				if (IS_VALID_CRED(nx->nx_defopt.nxo_cred)) {
2737					kauth_cred_unref(&nx->nx_defopt.nxo_cred);
2738				}
2739				/* free active user list for this export */
2740				nfsrv_free_user_list(&nx->nx_user_list);
2741				FREE(nx->nx_path, M_TEMP);
2742				FREE(nx, M_TEMP);
2743			}
2744			LIST_REMOVE(nxfs, nxfs_next);
2745			FREE(nxfs->nxfs_path, M_TEMP);
2746			FREE(nxfs, M_TEMP);
2747		}
2748		if (nfsrv_export_hashtbl) {
2749			/* all exports deleted, clean up export hash table */
2750			FREE(nfsrv_export_hashtbl, M_TEMP);
2751			nfsrv_export_hashtbl = NULL;
2752		}
2753		lck_rw_done(&nfsrv_export_rwlock);
2754		return (0);
2755	}
2756
2757	error = copyinstr(unxa->nxa_fspath, path, MAXPATHLEN, &pathlen);
2758	if (error)
2759		return (error);
2760
2761	lck_rw_lock_exclusive(&nfsrv_export_rwlock);
2762
2763	/* init export hash table if not already */
2764	if (!nfsrv_export_hashtbl) {
2765		if (nfsrv_export_hash_size <= 0)
2766			nfsrv_export_hash_size = NFSRVEXPHASHSZ;
2767		nfsrv_export_hashtbl = hashinit(nfsrv_export_hash_size, M_TEMP, &nfsrv_export_hash);
2768	}
2769
2770	// first check if we've already got an exportfs with the given ID
2771	LIST_FOREACH(nxfs, &nfsrv_exports, nxfs_next) {
2772		if (nxfs->nxfs_id == unxa->nxa_fsid)
2773			break;
2774	}
2775	if (nxfs) {
2776		/* verify exported FS path matches given path */
2777		if (strncmp(path, nxfs->nxfs_path, MAXPATHLEN)) {
2778			error = EEXIST;
2779			goto unlock_out;
2780		}
2781		if ((unxa->nxa_flags & (NXA_ADD|NXA_OFFLINE)) == NXA_ADD) {
2782			/* if adding, verify that the mount is still what we expect */
2783			mp = vfs_getvfs_by_mntonname(nxfs->nxfs_path);
2784			if (mp) {
2785				mount_ref(mp, 0);
2786				mount_iterdrop(mp);
2787			}
2788			/* find exported FS root vnode */
2789			NDINIT(&mnd, LOOKUP, OP_LOOKUP, FOLLOW | LOCKLEAF | AUDITVNPATH1,
2790				UIO_SYSSPACE, CAST_USER_ADDR_T(nxfs->nxfs_path), ctx);
2791			error = namei(&mnd);
2792			if (error)
2793				goto unlock_out;
2794			mvp = mnd.ni_vp;
2795			/* make sure it's (still) the root of a file system */
2796			if (!vnode_isvroot(mvp)) {
2797				error = EINVAL;
2798				goto out;
2799			}
2800			/* sanity check: this should be same mount */
2801			if (mp != vnode_mount(mvp)) {
2802				error = EINVAL;
2803				goto out;
2804			}
2805		}
2806	} else {
2807		/* no current exported file system with that ID */
2808		if (!(unxa->nxa_flags & NXA_ADD)) {
2809			error = ENOENT;
2810			goto unlock_out;
2811		}
2812
2813		/* find exported FS root vnode */
2814		NDINIT(&mnd, LOOKUP, OP_LOOKUP, FOLLOW | LOCKLEAF | AUDITVNPATH1,
2815			UIO_SYSSPACE, CAST_USER_ADDR_T(path), ctx);
2816		error = namei(&mnd);
2817		if (error) {
2818			if (!(unxa->nxa_flags & NXA_OFFLINE))
2819				goto unlock_out;
2820		} else {
2821			mvp = mnd.ni_vp;
2822			/* make sure it's the root of a file system */
2823			if (!vnode_isvroot(mvp)) {
2824				/* bail if not marked offline */
2825				if (!(unxa->nxa_flags & NXA_OFFLINE)) {
2826					error = EINVAL;
2827					goto out;
2828				}
2829				vnode_put(mvp);
2830				nameidone(&mnd);
2831				mvp = NULL;
2832			} else {
2833				mp = vnode_mount(mvp);
2834				mount_ref(mp, 0);
2835
2836				/* make sure the file system is NFS-exportable */
2837				nfh.nfh_len = NFSV3_MAX_FID_SIZE;
2838				error = VFS_VPTOFH(mvp, (int*)&nfh.nfh_len, &nfh.nfh_fid[0], NULL);
2839				if (!error && (nfh.nfh_len > (int)NFSV3_MAX_FID_SIZE))
2840					error = EIO;
2841				if (!error && !(mp->mnt_vtable->vfc_vfsflags & VFC_VFSREADDIR_EXTENDED))
2842					error = EISDIR;
2843				if (error)
2844					goto out;
2845			}
2846		}
2847
2848		/* add an exportfs for it */
2849		MALLOC(nxfs, struct nfs_exportfs *, sizeof(struct nfs_exportfs), M_TEMP, M_WAITOK);
2850		if (!nxfs) {
2851			error = ENOMEM;
2852			goto out;
2853		}
2854		bzero(nxfs, sizeof(struct nfs_exportfs));
2855		nxfs->nxfs_id = unxa->nxa_fsid;
2856		MALLOC(nxfs->nxfs_path, char*, pathlen, M_TEMP, M_WAITOK);
2857		if (!nxfs->nxfs_path) {
2858			FREE(nxfs, M_TEMP);
2859			error = ENOMEM;
2860			goto out;
2861		}
2862		bcopy(path, nxfs->nxfs_path, pathlen);
2863		/* insert into list in reverse-sorted order */
2864		nxfs3 = NULL;
2865		LIST_FOREACH(nxfs2, &nfsrv_exports, nxfs_next) {
2866			if (strncmp(nxfs->nxfs_path, nxfs2->nxfs_path, MAXPATHLEN) > 0)
2867				break;
2868			nxfs3 = nxfs2;
2869		}
2870		if (nxfs2)
2871			LIST_INSERT_BEFORE(nxfs2, nxfs, nxfs_next);
2872		else if (nxfs3)
2873			LIST_INSERT_AFTER(nxfs3, nxfs, nxfs_next);
2874		else
2875			LIST_INSERT_HEAD(&nfsrv_exports, nxfs, nxfs_next);
2876
2877		/* make sure any quotas are enabled before we export the file system */
2878		if (mp)
2879			enablequotas(mp, ctx);
2880	}
2881
2882	if (unxa->nxa_exppath) {
2883		error = copyinstr(unxa->nxa_exppath, path, MAXPATHLEN, &pathlen);
2884		if (error)
2885			goto out;
2886		LIST_FOREACH(nx, &nxfs->nxfs_exports, nx_next) {
2887			if (nx->nx_id == unxa->nxa_expid)
2888				break;
2889		}
2890		if (nx) {
2891			/* verify exported FS path matches given path */
2892			if (strncmp(path, nx->nx_path, MAXPATHLEN)) {
2893				error = EEXIST;
2894				goto out;
2895			}
2896		} else {
2897			/* no current export with that ID */
2898			if (!(unxa->nxa_flags & NXA_ADD)) {
2899				error = ENOENT;
2900				goto out;
2901			}
2902			/* add an export for it */
2903			MALLOC(nx, struct nfs_export *, sizeof(struct nfs_export), M_TEMP, M_WAITOK);
2904			if (!nx) {
2905				error = ENOMEM;
2906				goto out1;
2907			}
2908			bzero(nx, sizeof(struct nfs_export));
2909			nx->nx_id = unxa->nxa_expid;
2910			nx->nx_fs = nxfs;
2911			microtime(&nx->nx_exptime);
2912			MALLOC(nx->nx_path, char*, pathlen, M_TEMP, M_WAITOK);
2913			if (!nx->nx_path) {
2914				error = ENOMEM;
2915				FREE(nx, M_TEMP);
2916				nx = NULL;
2917				goto out1;
2918			}
2919			bcopy(path, nx->nx_path, pathlen);
2920			/* initialize the active user list */
2921			nfsrv_init_user_list(&nx->nx_user_list);
2922			/* insert into list in reverse-sorted order */
2923			nx3 = NULL;
2924			LIST_FOREACH(nx2, &nxfs->nxfs_exports, nx_next) {
2925				if (strncmp(nx->nx_path, nx2->nx_path, MAXPATHLEN) > 0)
2926					break;
2927				nx3 = nx2;
2928			}
2929			if (nx2)
2930				LIST_INSERT_BEFORE(nx2, nx, nx_next);
2931			else if (nx3)
2932				LIST_INSERT_AFTER(nx3, nx, nx_next);
2933			else
2934				LIST_INSERT_HEAD(&nxfs->nxfs_exports, nx, nx_next);
2935			/* insert into hash */
2936			LIST_INSERT_HEAD(NFSRVEXPHASH(nxfs->nxfs_id, nx->nx_id), nx, nx_hash);
2937
2938			/*
2939			 * We don't allow/support nested exports.  Check if the new entry
2940			 * nests with the entries before and after or if there's an
2941			 * entry for the file system root and subdirs.
2942			 */
2943			error = 0;
2944			if ((nx3 && !strncmp(nx3->nx_path, nx->nx_path, pathlen - 1) &&
2945				    (nx3->nx_path[pathlen-1] == '/')) ||
2946			    (nx2 && !strncmp(nx2->nx_path, nx->nx_path, strlen(nx2->nx_path)) &&
2947			    	    (nx->nx_path[strlen(nx2->nx_path)] == '/')))
2948				error = EINVAL;
2949			if (!error) {
2950				/* check export conflict with fs root export and vice versa */
2951				expisroot = !nx->nx_path[0] ||
2952					    ((nx->nx_path[0] == '.') && !nx->nx_path[1]);
2953				LIST_FOREACH(nx2, &nxfs->nxfs_exports, nx_next) {
2954					if (expisroot) {
2955						if (nx2 != nx)
2956							break;
2957					} else if (!nx2->nx_path[0])
2958						break;
2959					else if ((nx2->nx_path[0] == '.') && !nx2->nx_path[1])
2960						break;
2961				}
2962				if (nx2)
2963					error = EINVAL;
2964			}
2965			if (error) {
2966				/*
2967				 * Don't actually return an error because mountd is
2968				 * probably about to delete the conflicting export.
2969				 * This can happen when a new export momentarily conflicts
2970				 * with an old export while the transition is being made.
2971				 * Theoretically, mountd could be written to avoid this
2972				 * transient situation - but it would greatly increase the
2973				 * complexity of mountd for very little overall benefit.
2974				 */
2975				printf("nfsrv_export: warning: nested exports: %s/%s\n",
2976					nxfs->nxfs_path, nx->nx_path);
2977				error = 0;
2978			}
2979			nx->nx_fh.nfh_xh.nxh_flags = NXHF_INVALIDFH;
2980		}
2981		/* make sure file handle is set up */
2982		if ((nx->nx_fh.nfh_xh.nxh_version != htonl(NFS_FH_VERSION)) ||
2983		    (nx->nx_fh.nfh_xh.nxh_flags & NXHF_INVALIDFH)) {
2984			/* try to set up export root file handle */
2985			nx->nx_fh.nfh_xh.nxh_version = htonl(NFS_FH_VERSION);
2986			nx->nx_fh.nfh_xh.nxh_fsid = htonl(nx->nx_fs->nxfs_id);
2987			nx->nx_fh.nfh_xh.nxh_expid = htonl(nx->nx_id);
2988			nx->nx_fh.nfh_xh.nxh_flags = 0;
2989			nx->nx_fh.nfh_xh.nxh_reserved = 0;
2990			nx->nx_fh.nfh_fhp = (u_char*)&nx->nx_fh.nfh_xh;
2991			bzero(&nx->nx_fh.nfh_fid[0], NFSV2_MAX_FID_SIZE);
2992			if (mvp) {
2993				/* find export root vnode */
2994				if (!nx->nx_path[0] || ((nx->nx_path[0] == '.') && !nx->nx_path[1])) {
2995					/* exporting file system's root directory */
2996					xvp = mvp;
2997					vnode_get(xvp);
2998				} else {
2999					xnd.ni_cnd.cn_nameiop = LOOKUP;
3000#if CONFIG_TRIGGERS
3001					xnd.ni_op = OP_LOOKUP;
3002#endif
3003					xnd.ni_cnd.cn_flags = LOCKLEAF;
3004					xnd.ni_pathlen = pathlen - 1;
3005					xnd.ni_cnd.cn_nameptr = xnd.ni_cnd.cn_pnbuf = path;
3006					xnd.ni_startdir = mvp;
3007					xnd.ni_usedvp   = mvp;
3008					xnd.ni_cnd.cn_context = ctx;
3009					while ((error = lookup(&xnd)) == ERECYCLE) {
3010						xnd.ni_cnd.cn_flags = LOCKLEAF;
3011						xnd.ni_cnd.cn_nameptr = xnd.ni_cnd.cn_pnbuf;
3012						xnd.ni_usedvp = xnd.ni_dvp = xnd.ni_startdir = mvp;
3013					}
3014					if (error)
3015						goto out1;
3016					xvp = xnd.ni_vp;
3017				}
3018
3019				if (vnode_vtype(xvp) != VDIR) {
3020					error = EINVAL;
3021					vnode_put(xvp);
3022					goto out1;
3023				}
3024
3025				/* grab file handle */
3026				nx->nx_fh.nfh_len = NFSV3_MAX_FID_SIZE;
3027				error = VFS_VPTOFH(xvp, (int*)&nx->nx_fh.nfh_len, &nx->nx_fh.nfh_fid[0], NULL);
3028				if (!error && (nx->nx_fh.nfh_len > (int)NFSV3_MAX_FID_SIZE)) {
3029					error = EIO;
3030				} else {
3031					nx->nx_fh.nfh_xh.nxh_fidlen = nx->nx_fh.nfh_len;
3032					nx->nx_fh.nfh_len += sizeof(nx->nx_fh.nfh_xh);
3033				}
3034
3035				vnode_put(xvp);
3036				if (error)
3037					goto out1;
3038			} else {
3039				nx->nx_fh.nfh_xh.nxh_flags = NXHF_INVALIDFH;
3040				nx->nx_fh.nfh_xh.nxh_fidlen = 0;
3041				nx->nx_fh.nfh_len = sizeof(nx->nx_fh.nfh_xh);
3042			}
3043		}
3044	} else {
3045		nx = NULL;
3046	}
3047
3048	/* perform the export changes */
3049	if (unxa->nxa_flags & NXA_DELETE) {
3050		if (!nx) {
3051			/* delete all exports on this file system */
3052			while ((nx = LIST_FIRST(&nxfs->nxfs_exports))) {
3053				LIST_REMOVE(nx, nx_next);
3054				LIST_REMOVE(nx, nx_hash);
3055				/* delete all netopts for this export */
3056				nfsrv_free_addrlist(nx, NULL);
3057				nx->nx_flags &= ~NX_DEFAULTEXPORT;
3058				if (IS_VALID_CRED(nx->nx_defopt.nxo_cred)) {
3059					kauth_cred_unref(&nx->nx_defopt.nxo_cred);
3060				}
3061				/* delete active user list for this export */
3062				nfsrv_free_user_list(&nx->nx_user_list);
3063				FREE(nx->nx_path, M_TEMP);
3064				FREE(nx, M_TEMP);
3065			}
3066			goto out1;
3067		} else if (!unxa->nxa_netcount) {
3068			/* delete all netopts for this export */
3069			nfsrv_free_addrlist(nx, NULL);
3070			nx->nx_flags &= ~NX_DEFAULTEXPORT;
3071			if (IS_VALID_CRED(nx->nx_defopt.nxo_cred)) {
3072				kauth_cred_unref(&nx->nx_defopt.nxo_cred);
3073			}
3074		} else {
3075			/* delete only the netopts for the given addresses */
3076			error = nfsrv_free_addrlist(nx, unxa);
3077			if (error)
3078				goto out1;
3079		}
3080	}
3081	if (unxa->nxa_flags & NXA_ADD) {
3082		/*
3083		 * If going offline set the export time so that when
3084		 * coming back on line we will present a new write verifier
3085		 * to the client.
3086		 */
3087		if (unxa->nxa_flags & NXA_OFFLINE)
3088			microtime(&nx->nx_exptime);
3089
3090		error = nfsrv_hang_addrlist(nx, unxa);
3091		if (!error && mp)
3092			vfs_setflags(mp, MNT_EXPORTED);
3093	}
3094
3095out1:
3096	if (nx && !nx->nx_expcnt) {
3097		/* export has no export options */
3098		LIST_REMOVE(nx, nx_next);
3099		LIST_REMOVE(nx, nx_hash);
3100		/* delete active user list for this export */
3101		nfsrv_free_user_list(&nx->nx_user_list);
3102		FREE(nx->nx_path, M_TEMP);
3103		FREE(nx, M_TEMP);
3104	}
3105	if (LIST_EMPTY(&nxfs->nxfs_exports)) {
3106		/* exported file system has no more exports */
3107		LIST_REMOVE(nxfs, nxfs_next);
3108		FREE(nxfs->nxfs_path, M_TEMP);
3109		FREE(nxfs, M_TEMP);
3110		if (mp)
3111			vfs_clearflags(mp, MNT_EXPORTED);
3112	}
3113
3114out:
3115	if (mvp) {
3116		vnode_put(mvp);
3117		nameidone(&mnd);
3118	}
3119unlock_out:
3120	if (mp)
3121		mount_drop(mp, 0);
3122	lck_rw_done(&nfsrv_export_rwlock);
3123	return (error);
3124}
3125
3126struct nfs_export_options *
3127nfsrv_export_lookup(struct nfs_export *nx, mbuf_t nam)
3128{
3129	struct nfs_export_options *nxo = NULL;
3130	struct nfs_netopt *no = NULL;
3131	struct radix_node_head *rnh;
3132	struct sockaddr *saddr;
3133
3134	/* Lookup in the export list first. */
3135	if (nam != NULL) {
3136		saddr = mbuf_data(nam);
3137		rnh = nx->nx_rtable[saddr->sa_family];
3138		if (rnh != NULL) {
3139			no = (struct nfs_netopt *)
3140				(*rnh->rnh_matchaddr)((caddr_t)saddr, rnh);
3141			if (no && no->no_rnodes->rn_flags & RNF_ROOT)
3142				no = NULL;
3143			if (no)
3144				nxo = &no->no_opt;
3145		}
3146	}
3147	/* If no address match, use the default if it exists. */
3148	if ((nxo == NULL) && (nx->nx_flags & NX_DEFAULTEXPORT))
3149		nxo = &nx->nx_defopt;
3150	return (nxo);
3151}
3152
3153/* find an export for the given handle */
3154struct nfs_export *
3155nfsrv_fhtoexport(struct nfs_filehandle *nfhp)
3156{
3157	struct nfs_exphandle *nxh = (struct nfs_exphandle*)nfhp->nfh_fhp;
3158	struct nfs_export *nx;
3159	uint32_t fsid, expid;
3160
3161	if (!nfsrv_export_hashtbl)
3162		return (NULL);
3163	fsid = ntohl(nxh->nxh_fsid);
3164	expid = ntohl(nxh->nxh_expid);
3165	nx = NFSRVEXPHASH(fsid, expid)->lh_first;
3166	for (; nx; nx = LIST_NEXT(nx, nx_hash)) {
3167		if (nx->nx_fs->nxfs_id != fsid)
3168			continue;
3169		if (nx->nx_id != expid)
3170			continue;
3171		break;
3172	}
3173	return (nx);
3174}
3175
3176/*
3177 * nfsrv_fhtovp() - convert FH to vnode and export info
3178 */
3179int
3180nfsrv_fhtovp(
3181	struct nfs_filehandle *nfhp,
3182	struct nfsrv_descript *nd,
3183	vnode_t *vpp,
3184	struct nfs_export **nxp,
3185	struct nfs_export_options **nxop)
3186{
3187	struct nfs_exphandle *nxh = (struct nfs_exphandle*)nfhp->nfh_fhp;
3188	struct nfs_export_options *nxo;
3189	u_char *fidp;
3190	int error;
3191	struct mount *mp;
3192	mbuf_t nam = NULL;
3193	uint32_t v;
3194	int i, valid;
3195
3196	*vpp = NULL;
3197	*nxp = NULL;
3198	*nxop = NULL;
3199
3200	if (nd != NULL)
3201		nam = nd->nd_nam;
3202
3203	v = ntohl(nxh->nxh_version);
3204	if (v != NFS_FH_VERSION) {
3205		/* file handle format not supported */
3206		return (ESTALE);
3207	}
3208	if (nfhp->nfh_len > NFSV3_MAX_FH_SIZE)
3209		return (EBADRPC);
3210	if (nfhp->nfh_len < (int)sizeof(struct nfs_exphandle))
3211		return (ESTALE);
3212	v = ntohs(nxh->nxh_flags);
3213	if (v & NXHF_INVALIDFH)
3214		return (ESTALE);
3215
3216	*nxp = nfsrv_fhtoexport(nfhp);
3217	if (!*nxp)
3218		return (ESTALE);
3219
3220	/* Get the export option structure for this <export, client> tuple. */
3221	*nxop = nxo = nfsrv_export_lookup(*nxp, nam);
3222	if (nam && (*nxop == NULL))
3223		return (EACCES);
3224
3225	if (nd != NULL) {
3226		/* Validate the security flavor of the request */
3227		for (i = 0, valid = 0; i < nxo->nxo_sec.count; i++) {
3228			if (nd->nd_sec == nxo->nxo_sec.flavors[i]) {
3229				valid = 1;
3230				break;
3231			}
3232		}
3233		if (!valid) {
3234			/*
3235			 * RFC 2623 section 2.3.2 recommends no authentication
3236			 * requirement for certain NFS procedures used for mounting.
3237			 * This allows an unauthenticated superuser on the client
3238			 * to do mounts for the benefit of authenticated users.
3239			 */
3240			if (nd->nd_vers == NFS_VER2)
3241				if (nd->nd_procnum == NFSV2PROC_GETATTR ||
3242				    nd->nd_procnum == NFSV2PROC_STATFS)
3243					valid = 1;
3244			if (nd->nd_vers == NFS_VER3)
3245				if (nd->nd_procnum == NFSPROC_FSINFO)
3246					valid = 1;
3247
3248			if (!valid)
3249				return (NFSERR_AUTHERR | AUTH_REJECTCRED);
3250		}
3251	}
3252
3253	if (nxo && (nxo->nxo_flags & NX_OFFLINE))
3254		return ((nd == NULL || nd->nd_vers == NFS_VER2) ? ESTALE : NFSERR_TRYLATER);
3255
3256	/* find mount structure */
3257	mp = vfs_getvfs_by_mntonname((*nxp)->nx_fs->nxfs_path);
3258	if (mp) {
3259		error = vfs_busy(mp, LK_NOWAIT);
3260		mount_iterdrop(mp);
3261		if (error)
3262			mp = NULL;
3263	}
3264	if (!mp) {
3265		/*
3266		 * We have an export, but no mount?
3267		 * Perhaps the export just hasn't been marked offline yet.
3268		 */
3269		return ((nd == NULL || nd->nd_vers == NFS_VER2) ? ESTALE : NFSERR_TRYLATER);
3270	}
3271
3272	fidp = nfhp->nfh_fhp + sizeof(*nxh);
3273	error = VFS_FHTOVP(mp, nxh->nxh_fidlen, fidp, vpp, NULL);
3274	vfs_unbusy(mp);
3275	if (error)
3276		return (error);
3277	/* vnode pointer should be good at this point or ... */
3278	if (*vpp == NULL)
3279		return (ESTALE);
3280	return (0);
3281}
3282
3283/*
3284 * nfsrv_credcheck() - check/map credentials according
3285 * to given export options.
3286 */
3287int
3288nfsrv_credcheck(
3289	struct nfsrv_descript *nd,
3290	vfs_context_t ctx,
3291	__unused struct nfs_export *nx,
3292	struct nfs_export_options *nxo)
3293{
3294	if (nxo && nxo->nxo_cred) {
3295		if ((nxo->nxo_flags & NX_MAPALL) ||
3296		    ((nxo->nxo_flags & NX_MAPROOT) && !suser(nd->nd_cr, NULL))) {
3297			kauth_cred_ref(nxo->nxo_cred);
3298			kauth_cred_unref(&nd->nd_cr);
3299			nd->nd_cr = nxo->nxo_cred;
3300		}
3301	}
3302	ctx->vc_ucred = nd->nd_cr;
3303	return (0);
3304}
3305
3306/*
3307 * nfsrv_vptofh() - convert vnode to file handle for given export
3308 *
3309 * If the caller is passing in a vnode for a ".." directory entry,
3310 * they can pass a directory NFS file handle (dnfhp) which will be
3311 * checked against the root export file handle.  If it matches, we
3312 * refuse to provide the file handle for the out-of-export directory.
3313 */
3314int
3315nfsrv_vptofh(
3316	struct nfs_export *nx,
3317	int nfsvers,
3318	struct nfs_filehandle *dnfhp,
3319	vnode_t vp,
3320	vfs_context_t ctx,
3321	struct nfs_filehandle *nfhp)
3322{
3323	int error;
3324	uint32_t maxfidsize;
3325
3326	nfhp->nfh_fhp = (u_char*)&nfhp->nfh_xh;
3327	nfhp->nfh_xh.nxh_version = htonl(NFS_FH_VERSION);
3328	nfhp->nfh_xh.nxh_fsid = htonl(nx->nx_fs->nxfs_id);
3329	nfhp->nfh_xh.nxh_expid = htonl(nx->nx_id);
3330	nfhp->nfh_xh.nxh_flags = 0;
3331	nfhp->nfh_xh.nxh_reserved = 0;
3332
3333	if (nfsvers == NFS_VER2)
3334		bzero(&nfhp->nfh_fid[0], NFSV2_MAX_FID_SIZE);
3335
3336	/* if directory FH matches export root, return invalid FH */
3337	if (dnfhp && nfsrv_fhmatch(dnfhp, &nx->nx_fh)) {
3338		if (nfsvers == NFS_VER2)
3339			nfhp->nfh_len = NFSX_V2FH;
3340		else
3341			nfhp->nfh_len = sizeof(nfhp->nfh_xh);
3342		nfhp->nfh_xh.nxh_fidlen = 0;
3343		nfhp->nfh_xh.nxh_flags = htons(NXHF_INVALIDFH);
3344		return (0);
3345	}
3346
3347	if (nfsvers == NFS_VER2)
3348		maxfidsize = NFSV2_MAX_FID_SIZE;
3349	else
3350		maxfidsize = NFSV3_MAX_FID_SIZE;
3351	nfhp->nfh_len = maxfidsize;
3352
3353	error = VFS_VPTOFH(vp, (int*)&nfhp->nfh_len, &nfhp->nfh_fid[0], ctx);
3354	if (error)
3355		return (error);
3356	if (nfhp->nfh_len > maxfidsize)
3357		return (EOVERFLOW);
3358	nfhp->nfh_xh.nxh_fidlen = nfhp->nfh_len;
3359	nfhp->nfh_len += sizeof(nfhp->nfh_xh);
3360	if ((nfsvers == NFS_VER2) && (nfhp->nfh_len < NFSX_V2FH))
3361		nfhp->nfh_len = NFSX_V2FH;
3362
3363	return (0);
3364}
3365
3366/*
3367 * Compare two file handles to see it they're the same.
3368 * Note that we don't use nfh_len because that may include
3369 * padding in an NFSv2 file handle.
3370 */
3371int
3372nfsrv_fhmatch(struct nfs_filehandle *fh1, struct nfs_filehandle *fh2)
3373{
3374	struct nfs_exphandle *nxh1, *nxh2;
3375	int len1, len2;
3376
3377	nxh1 = (struct nfs_exphandle *)fh1->nfh_fhp;
3378	nxh2 = (struct nfs_exphandle *)fh2->nfh_fhp;
3379	len1 = sizeof(fh1->nfh_xh) + nxh1->nxh_fidlen;
3380	len2 = sizeof(fh2->nfh_xh) + nxh2->nxh_fidlen;
3381	if (len1 != len2)
3382		return (0);
3383	if (bcmp(nxh1, nxh2, len1))
3384		return (0);
3385	return (1);
3386}
3387
3388/*
3389 * Functions for dealing with active user lists
3390 */
3391
3392/*
3393 * Search the hash table for a user node with a matching IP address and uid field.
3394 * If found, the node's tm_last timestamp is updated and the node is returned.
3395 *
3396 * If not found, a new node is allocated (or reclaimed via LRU), initialized, and returned.
3397 * Returns NULL if a new node could not be allcoated.
3398 *
3399 * The list's user_mutex lock MUST be held.
3400 */
3401struct nfs_user_stat_node *
3402nfsrv_get_user_stat_node(struct nfs_active_user_list *list, struct sockaddr *saddr, uid_t uid)
3403{
3404	struct nfs_user_stat_node		*unode;
3405	struct timeval				now;
3406	struct nfs_user_stat_hashtbl_head	*head;
3407
3408	/* seach the hash table */
3409	head = NFS_USER_STAT_HASH(list->user_hashtbl, uid);
3410	LIST_FOREACH(unode, head, hash_link) {
3411		if ((uid == unode->uid) && (nfs_sockaddr_cmp(saddr, (struct sockaddr*)&unode->sock) == 0)) {
3412			/* found matching node */
3413			break;
3414		}
3415	}
3416
3417	if (unode) {
3418		/* found node in the hash table, now update lru position */
3419		TAILQ_REMOVE(&list->user_lru, unode, lru_link);
3420		TAILQ_INSERT_TAIL(&list->user_lru, unode, lru_link);
3421
3422		/* update time stamp */
3423		microtime(&now);
3424		unode->tm_last = (uint32_t)now.tv_sec;
3425		return unode;
3426	}
3427
3428	if (list->node_count < nfsrv_user_stat_max_nodes) {
3429		/* Allocate a new node */
3430		MALLOC(unode, struct nfs_user_stat_node *, sizeof(struct nfs_user_stat_node),
3431			M_TEMP, M_WAITOK | M_ZERO);
3432
3433		if (!unode)
3434			return NULL;
3435
3436		/* increment node count */
3437		OSAddAtomic(1, &nfsrv_user_stat_node_count);
3438		list->node_count++;
3439	} else {
3440		/* reuse the oldest node in the lru list */
3441		unode = TAILQ_FIRST(&list->user_lru);
3442
3443		if (!unode)
3444			return NULL;
3445
3446		/* Remove the node */
3447		TAILQ_REMOVE(&list->user_lru, unode, lru_link);
3448		LIST_REMOVE(unode, hash_link);
3449	}
3450
3451	/* Initialize the node */
3452	unode->uid = uid;
3453	bcopy(saddr, &unode->sock, saddr->sa_len);
3454	microtime(&now);
3455	unode->ops = 0;
3456	unode->bytes_read = 0;
3457	unode->bytes_written = 0;
3458	unode->tm_start = (uint32_t)now.tv_sec;
3459	unode->tm_last = (uint32_t)now.tv_sec;
3460
3461	/* insert the node  */
3462	TAILQ_INSERT_TAIL(&list->user_lru, unode, lru_link);
3463	LIST_INSERT_HEAD(head, unode, hash_link);
3464
3465	return unode;
3466}
3467
3468void
3469nfsrv_update_user_stat(struct nfs_export *nx, struct nfsrv_descript *nd, uid_t uid, u_int ops, u_int rd_bytes, u_int wr_bytes)
3470{
3471	struct nfs_user_stat_node	*unode;
3472	struct nfs_active_user_list	*ulist;
3473	struct sockaddr			*saddr;
3474
3475	if ((!nfsrv_user_stat_enabled) || (!nx) || (!nd) || (!nd->nd_nam))
3476		return;
3477
3478	saddr = (struct sockaddr *)mbuf_data(nd->nd_nam);
3479
3480	/* check address family before going any further */
3481	if ((saddr->sa_family != AF_INET) && (saddr->sa_family != AF_INET6))
3482		return;
3483
3484	ulist = &nx->nx_user_list;
3485
3486	/* lock the active user list */
3487	lck_mtx_lock(&ulist->user_mutex);
3488
3489	/* get the user node */
3490	unode = nfsrv_get_user_stat_node(ulist, saddr, uid);
3491
3492	if (!unode) {
3493		lck_mtx_unlock(&ulist->user_mutex);
3494		return;
3495	}
3496
3497	/* update counters */
3498	unode->ops += ops;
3499	unode->bytes_read += rd_bytes;
3500	unode->bytes_written += wr_bytes;
3501
3502	/* done */
3503	lck_mtx_unlock(&ulist->user_mutex);
3504}
3505
3506/* initialize an active user list */
3507void
3508nfsrv_init_user_list(struct nfs_active_user_list *ulist)
3509{
3510	uint i;
3511
3512	/* initialize the lru */
3513	TAILQ_INIT(&ulist->user_lru);
3514
3515	/* initialize the hash table */
3516	for(i = 0; i < NFS_USER_STAT_HASH_SIZE; i++)
3517		LIST_INIT(&ulist->user_hashtbl[i]);
3518	ulist->node_count = 0;
3519
3520	lck_mtx_init(&ulist->user_mutex, nfsrv_active_user_mutex_group, LCK_ATTR_NULL);
3521}
3522
3523/* Free all nodes in an active user list */
3524void
3525nfsrv_free_user_list(struct nfs_active_user_list *ulist)
3526{
3527	struct nfs_user_stat_node *unode;
3528
3529	if (!ulist)
3530		return;
3531
3532	while ((unode = TAILQ_FIRST(&ulist->user_lru))) {
3533		/* Remove node and free */
3534		TAILQ_REMOVE(&ulist->user_lru, unode, lru_link);
3535		LIST_REMOVE(unode, hash_link);
3536		FREE(unode, M_TEMP);
3537
3538		/* decrement node count */
3539		OSAddAtomic(-1, &nfsrv_user_stat_node_count);
3540	}
3541	ulist->node_count = 0;
3542
3543	lck_mtx_destroy(&ulist->user_mutex, nfsrv_active_user_mutex_group);
3544}
3545
3546/* Reclaim old expired user nodes from active user lists. */
3547void
3548nfsrv_active_user_list_reclaim(void)
3549{
3550	struct nfs_exportfs			*nxfs;
3551	struct nfs_export			*nx;
3552	struct nfs_active_user_list		*ulist;
3553	struct nfs_user_stat_hashtbl_head	oldlist;
3554	struct nfs_user_stat_node		*unode, *unode_next;
3555	struct timeval				now;
3556	uint32_t				tstale;
3557
3558	LIST_INIT(&oldlist);
3559
3560	lck_rw_lock_shared(&nfsrv_export_rwlock);
3561	microtime(&now);
3562	tstale = now.tv_sec - nfsrv_user_stat_max_idle_sec;
3563	LIST_FOREACH(nxfs, &nfsrv_exports, nxfs_next) {
3564		LIST_FOREACH(nx, &nxfs->nxfs_exports, nx_next) {
3565			/* Scan through all user nodes of this export */
3566			ulist = &nx->nx_user_list;
3567			lck_mtx_lock(&ulist->user_mutex);
3568			for (unode = TAILQ_FIRST(&ulist->user_lru); unode; unode = unode_next) {
3569				unode_next = TAILQ_NEXT(unode, lru_link);
3570
3571				/* check if this node has expired */
3572				if (unode->tm_last >= tstale)
3573					break;
3574
3575				/* Remove node from the active user list */
3576				TAILQ_REMOVE(&ulist->user_lru, unode, lru_link);
3577				LIST_REMOVE(unode, hash_link);
3578
3579				/* Add node to temp list */
3580				LIST_INSERT_HEAD(&oldlist, unode, hash_link);
3581
3582				/* decrement node count */
3583				OSAddAtomic(-1, &nfsrv_user_stat_node_count);
3584				ulist->node_count--;
3585			}
3586			/* can unlock this export's list now */
3587			lck_mtx_unlock(&ulist->user_mutex);
3588		}
3589	}
3590        lck_rw_done(&nfsrv_export_rwlock);
3591
3592	/* Free expired nodes */
3593        while ((unode = LIST_FIRST(&oldlist))) {
3594		LIST_REMOVE(unode, hash_link);
3595		FREE(unode, M_TEMP);
3596	}
3597}
3598
3599/*
3600 * Maps errno values to nfs error numbers.
3601 * Use NFSERR_IO as the catch all for ones not specifically defined in
3602 * RFC 1094.
3603 */
3604static u_char nfsrv_v2errmap[] = {
3605  NFSERR_PERM,	NFSERR_NOENT,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3606  NFSERR_NXIO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3607  NFSERR_IO,	NFSERR_IO,	NFSERR_ACCES,	NFSERR_IO,	NFSERR_IO,
3608  NFSERR_IO,	NFSERR_EXIST,	NFSERR_IO,	NFSERR_NODEV,	NFSERR_NOTDIR,
3609  NFSERR_ISDIR,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3610  NFSERR_IO,	NFSERR_FBIG,	NFSERR_NOSPC,	NFSERR_IO,	NFSERR_ROFS,
3611  NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3612  NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3613  NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3614  NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3615  NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3616  NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,	NFSERR_IO,
3617  NFSERR_IO,	NFSERR_IO,	NFSERR_NAMETOL,	NFSERR_IO,	NFSERR_IO,
3618  NFSERR_NOTEMPTY, NFSERR_IO,	NFSERR_IO,	NFSERR_DQUOT,	NFSERR_STALE,
3619};
3620
3621/*
3622 * Maps errno values to nfs error numbers.
3623 * Although it is not obvious whether or not NFS clients really care if
3624 * a returned error value is in the specified list for the procedure, the
3625 * safest thing to do is filter them appropriately. For Version 2, the
3626 * X/Open XNFS document is the only specification that defines error values
3627 * for each RPC (The RFC simply lists all possible error values for all RPCs),
3628 * so I have decided to not do this for Version 2.
3629 * The first entry is the default error return and the rest are the valid
3630 * errors for that RPC in increasing numeric order.
3631 */
3632static short nfsv3err_null[] = {
3633	0,
3634	0,
3635};
3636
3637static short nfsv3err_getattr[] = {
3638	NFSERR_IO,
3639	NFSERR_IO,
3640	NFSERR_STALE,
3641	NFSERR_BADHANDLE,
3642	NFSERR_SERVERFAULT,
3643	NFSERR_TRYLATER,
3644	0,
3645};
3646
3647static short nfsv3err_setattr[] = {
3648	NFSERR_IO,
3649	NFSERR_PERM,
3650	NFSERR_IO,
3651	NFSERR_ACCES,
3652	NFSERR_INVAL,
3653	NFSERR_NOSPC,
3654	NFSERR_ROFS,
3655	NFSERR_DQUOT,
3656	NFSERR_STALE,
3657	NFSERR_BADHANDLE,
3658	NFSERR_NOT_SYNC,
3659	NFSERR_SERVERFAULT,
3660	NFSERR_TRYLATER,
3661	0,
3662};
3663
3664static short nfsv3err_lookup[] = {
3665	NFSERR_IO,
3666	NFSERR_NOENT,
3667	NFSERR_IO,
3668	NFSERR_ACCES,
3669	NFSERR_NOTDIR,
3670	NFSERR_NAMETOL,
3671	NFSERR_STALE,
3672	NFSERR_BADHANDLE,
3673	NFSERR_SERVERFAULT,
3674	NFSERR_TRYLATER,
3675	0,
3676};
3677
3678static short nfsv3err_access[] = {
3679	NFSERR_IO,
3680	NFSERR_IO,
3681	NFSERR_STALE,
3682	NFSERR_BADHANDLE,
3683	NFSERR_SERVERFAULT,
3684	NFSERR_TRYLATER,
3685	0,
3686};
3687
3688static short nfsv3err_readlink[] = {
3689	NFSERR_IO,
3690	NFSERR_IO,
3691	NFSERR_ACCES,
3692	NFSERR_INVAL,
3693	NFSERR_STALE,
3694	NFSERR_BADHANDLE,
3695	NFSERR_NOTSUPP,
3696	NFSERR_SERVERFAULT,
3697	NFSERR_TRYLATER,
3698	0,
3699};
3700
3701static short nfsv3err_read[] = {
3702	NFSERR_IO,
3703	NFSERR_IO,
3704	NFSERR_NXIO,
3705	NFSERR_ACCES,
3706	NFSERR_INVAL,
3707	NFSERR_STALE,
3708	NFSERR_BADHANDLE,
3709	NFSERR_SERVERFAULT,
3710	NFSERR_TRYLATER,
3711	0,
3712};
3713
3714static short nfsv3err_write[] = {
3715	NFSERR_IO,
3716	NFSERR_IO,
3717	NFSERR_ACCES,
3718	NFSERR_INVAL,
3719	NFSERR_FBIG,
3720	NFSERR_NOSPC,
3721	NFSERR_ROFS,
3722	NFSERR_DQUOT,
3723	NFSERR_STALE,
3724	NFSERR_BADHANDLE,
3725	NFSERR_SERVERFAULT,
3726	NFSERR_TRYLATER,
3727	0,
3728};
3729
3730static short nfsv3err_create[] = {
3731	NFSERR_IO,
3732	NFSERR_IO,
3733	NFSERR_ACCES,
3734	NFSERR_EXIST,
3735	NFSERR_NOTDIR,
3736	NFSERR_NOSPC,
3737	NFSERR_ROFS,
3738	NFSERR_NAMETOL,
3739	NFSERR_DQUOT,
3740	NFSERR_STALE,
3741	NFSERR_BADHANDLE,
3742	NFSERR_NOTSUPP,
3743	NFSERR_SERVERFAULT,
3744	NFSERR_TRYLATER,
3745	0,
3746};
3747
3748static short nfsv3err_mkdir[] = {
3749	NFSERR_IO,
3750	NFSERR_IO,
3751	NFSERR_ACCES,
3752	NFSERR_EXIST,
3753	NFSERR_NOTDIR,
3754	NFSERR_NOSPC,
3755	NFSERR_ROFS,
3756	NFSERR_NAMETOL,
3757	NFSERR_DQUOT,
3758	NFSERR_STALE,
3759	NFSERR_BADHANDLE,
3760	NFSERR_NOTSUPP,
3761	NFSERR_SERVERFAULT,
3762	NFSERR_TRYLATER,
3763	0,
3764};
3765
3766static short nfsv3err_symlink[] = {
3767	NFSERR_IO,
3768	NFSERR_IO,
3769	NFSERR_ACCES,
3770	NFSERR_EXIST,
3771	NFSERR_NOTDIR,
3772	NFSERR_NOSPC,
3773	NFSERR_ROFS,
3774	NFSERR_NAMETOL,
3775	NFSERR_DQUOT,
3776	NFSERR_STALE,
3777	NFSERR_BADHANDLE,
3778	NFSERR_NOTSUPP,
3779	NFSERR_SERVERFAULT,
3780	NFSERR_TRYLATER,
3781	0,
3782};
3783
3784static short nfsv3err_mknod[] = {
3785	NFSERR_IO,
3786	NFSERR_IO,
3787	NFSERR_ACCES,
3788	NFSERR_EXIST,
3789	NFSERR_NOTDIR,
3790	NFSERR_NOSPC,
3791	NFSERR_ROFS,
3792	NFSERR_NAMETOL,
3793	NFSERR_DQUOT,
3794	NFSERR_STALE,
3795	NFSERR_BADHANDLE,
3796	NFSERR_NOTSUPP,
3797	NFSERR_SERVERFAULT,
3798	NFSERR_BADTYPE,
3799	NFSERR_TRYLATER,
3800	0,
3801};
3802
3803static short nfsv3err_remove[] = {
3804	NFSERR_IO,
3805	NFSERR_NOENT,
3806	NFSERR_IO,
3807	NFSERR_ACCES,
3808	NFSERR_NOTDIR,
3809	NFSERR_ROFS,
3810	NFSERR_NAMETOL,
3811	NFSERR_STALE,
3812	NFSERR_BADHANDLE,
3813	NFSERR_SERVERFAULT,
3814	NFSERR_TRYLATER,
3815	0,
3816};
3817
3818static short nfsv3err_rmdir[] = {
3819	NFSERR_IO,
3820	NFSERR_NOENT,
3821	NFSERR_IO,
3822	NFSERR_ACCES,
3823	NFSERR_EXIST,
3824	NFSERR_NOTDIR,
3825	NFSERR_INVAL,
3826	NFSERR_ROFS,
3827	NFSERR_NAMETOL,
3828	NFSERR_NOTEMPTY,
3829	NFSERR_STALE,
3830	NFSERR_BADHANDLE,
3831	NFSERR_NOTSUPP,
3832	NFSERR_SERVERFAULT,
3833	NFSERR_TRYLATER,
3834	0,
3835};
3836
3837static short nfsv3err_rename[] = {
3838	NFSERR_IO,
3839	NFSERR_NOENT,
3840	NFSERR_IO,
3841	NFSERR_ACCES,
3842	NFSERR_EXIST,
3843	NFSERR_XDEV,
3844	NFSERR_NOTDIR,
3845	NFSERR_ISDIR,
3846	NFSERR_INVAL,
3847	NFSERR_NOSPC,
3848	NFSERR_ROFS,
3849	NFSERR_MLINK,
3850	NFSERR_NAMETOL,
3851	NFSERR_NOTEMPTY,
3852	NFSERR_DQUOT,
3853	NFSERR_STALE,
3854	NFSERR_BADHANDLE,
3855	NFSERR_NOTSUPP,
3856	NFSERR_SERVERFAULT,
3857	NFSERR_TRYLATER,
3858	0,
3859};
3860
3861static short nfsv3err_link[] = {
3862	NFSERR_IO,
3863	NFSERR_IO,
3864	NFSERR_ACCES,
3865	NFSERR_EXIST,
3866	NFSERR_XDEV,
3867	NFSERR_NOTDIR,
3868	NFSERR_INVAL,
3869	NFSERR_NOSPC,
3870	NFSERR_ROFS,
3871	NFSERR_MLINK,
3872	NFSERR_NAMETOL,
3873	NFSERR_DQUOT,
3874	NFSERR_STALE,
3875	NFSERR_BADHANDLE,
3876	NFSERR_NOTSUPP,
3877	NFSERR_SERVERFAULT,
3878	NFSERR_TRYLATER,
3879	0,
3880};
3881
3882static short nfsv3err_readdir[] = {
3883	NFSERR_IO,
3884	NFSERR_IO,
3885	NFSERR_ACCES,
3886	NFSERR_NOTDIR,
3887	NFSERR_STALE,
3888	NFSERR_BADHANDLE,
3889	NFSERR_BAD_COOKIE,
3890	NFSERR_TOOSMALL,
3891	NFSERR_SERVERFAULT,
3892	NFSERR_TRYLATER,
3893	0,
3894};
3895
3896static short nfsv3err_readdirplus[] = {
3897	NFSERR_IO,
3898	NFSERR_IO,
3899	NFSERR_ACCES,
3900	NFSERR_NOTDIR,
3901	NFSERR_STALE,
3902	NFSERR_BADHANDLE,
3903	NFSERR_BAD_COOKIE,
3904	NFSERR_NOTSUPP,
3905	NFSERR_TOOSMALL,
3906	NFSERR_SERVERFAULT,
3907	NFSERR_TRYLATER,
3908	0,
3909};
3910
3911static short nfsv3err_fsstat[] = {
3912	NFSERR_IO,
3913	NFSERR_IO,
3914	NFSERR_STALE,
3915	NFSERR_BADHANDLE,
3916	NFSERR_SERVERFAULT,
3917	NFSERR_TRYLATER,
3918	0,
3919};
3920
3921static short nfsv3err_fsinfo[] = {
3922	NFSERR_STALE,
3923	NFSERR_STALE,
3924	NFSERR_BADHANDLE,
3925	NFSERR_SERVERFAULT,
3926	NFSERR_TRYLATER,
3927	0,
3928};
3929
3930static short nfsv3err_pathconf[] = {
3931	NFSERR_STALE,
3932	NFSERR_STALE,
3933	NFSERR_BADHANDLE,
3934	NFSERR_SERVERFAULT,
3935	NFSERR_TRYLATER,
3936	0,
3937};
3938
3939static short nfsv3err_commit[] = {
3940	NFSERR_IO,
3941	NFSERR_IO,
3942	NFSERR_STALE,
3943	NFSERR_BADHANDLE,
3944	NFSERR_SERVERFAULT,
3945	NFSERR_TRYLATER,
3946	0,
3947};
3948
3949static short *nfsrv_v3errmap[] = {
3950	nfsv3err_null,
3951	nfsv3err_getattr,
3952	nfsv3err_setattr,
3953	nfsv3err_lookup,
3954	nfsv3err_access,
3955	nfsv3err_readlink,
3956	nfsv3err_read,
3957	nfsv3err_write,
3958	nfsv3err_create,
3959	nfsv3err_mkdir,
3960	nfsv3err_symlink,
3961	nfsv3err_mknod,
3962	nfsv3err_remove,
3963	nfsv3err_rmdir,
3964	nfsv3err_rename,
3965	nfsv3err_link,
3966	nfsv3err_readdir,
3967	nfsv3err_readdirplus,
3968	nfsv3err_fsstat,
3969	nfsv3err_fsinfo,
3970	nfsv3err_pathconf,
3971	nfsv3err_commit,
3972};
3973
3974/*
3975 * Map errnos to NFS error numbers. For Version 3 also filter out error
3976 * numbers not specified for the associated procedure.
3977 */
3978int
3979nfsrv_errmap(struct nfsrv_descript *nd, int err)
3980{
3981	short *defaulterrp, *errp;
3982
3983	if (nd->nd_vers == NFS_VER2) {
3984		if (err <= (int)sizeof(nfsrv_v2errmap))
3985			return ((int)nfsrv_v2errmap[err - 1]);
3986		return (NFSERR_IO);
3987	}
3988	/* NFSv3 */
3989	if (nd->nd_procnum > NFSPROC_COMMIT)
3990		return (err & 0xffff);
3991	errp = defaulterrp = nfsrv_v3errmap[nd->nd_procnum];
3992	while (*++errp) {
3993		if (*errp == err)
3994			return (err);
3995		else if (*errp > err)
3996			break;
3997	}
3998	return ((int)*defaulterrp);
3999}
4000
4001#endif /* NFSSERVER */
4002
4003