autofs_vnops.c revision 296937
1/*-
2 * Copyright (c) 2014 The FreeBSD Foundation
3 * All rights reserved.
4 *
5 * This software was developed by Edward Tomasz Napierala under sponsorship
6 * from the FreeBSD Foundation.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 *    notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 *    notice, this list of conditions and the following disclaimer in the
15 *    documentation and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 *
29 */
30
31#include <sys/cdefs.h>
32__FBSDID("$FreeBSD: head/sys/fs/autofs/autofs_vnops.c 296937 2016-03-16 14:00:45Z trasz $");
33
34#include <sys/param.h>
35#include <sys/kernel.h>
36#include <sys/condvar.h>
37#include <sys/dirent.h>
38#include <sys/fcntl.h>
39#include <sys/lock.h>
40#include <sys/mount.h>
41#include <sys/mutex.h>
42#include <sys/namei.h>
43#include <sys/signalvar.h>
44#include <sys/stat.h>
45#include <sys/systm.h>
46#include <sys/taskqueue.h>
47#include <sys/vnode.h>
48#include <machine/atomic.h>
49#include <vm/uma.h>
50
51#include <fs/autofs/autofs.h>
52
53static int	autofs_trigger_vn(struct vnode *vp, const char *path,
54		    int pathlen, struct vnode **newvp);
55
56extern struct autofs_softc	*autofs_softc;
57
58static int
59autofs_access(struct vop_access_args *ap)
60{
61
62	/*
63	 * Nothing to do here; the only kind of access control
64	 * needed is in autofs_mkdir().
65	 */
66
67	return (0);
68}
69
70static int
71autofs_getattr(struct vop_getattr_args *ap)
72{
73	struct vnode *vp, *newvp;
74	struct autofs_node *anp;
75	struct mount *mp;
76	struct vattr *vap;
77	int error;
78
79	vp = ap->a_vp;
80	anp = vp->v_data;
81	mp = vp->v_mount;
82	vap = ap->a_vap;
83
84	KASSERT(ap->a_vp->v_type == VDIR, ("!VDIR"));
85
86	/*
87	 * The reason we must do this is that some tree-walking software,
88	 * namely fts(3), assumes that stat(".") results will not change
89	 * between chdir("subdir") and chdir(".."), and fails with ENOENT
90	 * otherwise.
91	 */
92	if (autofs_mount_on_stat && autofs_cached(anp, NULL, 0) == false &&
93	    autofs_ignore_thread(curthread) == false) {
94		error = autofs_trigger_vn(vp, "", 0, &newvp);
95		if (error != 0)
96			return (error);
97
98		if (newvp != NULL) {
99			error = VOP_GETATTR(newvp, ap->a_vap,
100			    ap->a_cred);
101			vput(newvp);
102			return (error);
103		}
104	}
105
106	vap->va_type = VDIR;
107	vap->va_mode = 0755;
108	vap->va_nlink = 3; /* XXX */
109	vap->va_uid = 0;
110	vap->va_gid = 0;
111	vap->va_rdev = NODEV;
112	vap->va_fsid = mp->mnt_stat.f_fsid.val[0];
113	vap->va_fileid = anp->an_fileno;
114	vap->va_size = S_BLKSIZE;
115	vap->va_blocksize = S_BLKSIZE;
116	vap->va_mtime = anp->an_ctime;
117	vap->va_atime = anp->an_ctime;
118	vap->va_ctime = anp->an_ctime;
119	vap->va_birthtime = anp->an_ctime;
120	vap->va_gen = 0;
121	vap->va_flags = 0;
122	vap->va_rdev = 0;
123	vap->va_bytes = S_BLKSIZE;
124	vap->va_filerev = 0;
125	vap->va_spare = 0;
126
127	return (0);
128}
129
130/*
131 * Unlock the vnode, request automountd(8) action, and then lock it back.
132 * If anything got mounted on top of the vnode, return the new filesystem's
133 * root vnode in 'newvp', locked.
134 */
135static int
136autofs_trigger_vn(struct vnode *vp, const char *path, int pathlen,
137    struct vnode **newvp)
138{
139	struct autofs_node *anp;
140	struct autofs_mount *amp;
141	int error, lock_flags;
142
143	anp = vp->v_data;
144	amp = VFSTOAUTOFS(vp->v_mount);
145
146	/*
147	 * Release the vnode lock, so that other operations, in partcular
148	 * mounting a filesystem on top of it, can proceed.  Increase use
149	 * count, to prevent the vnode from being deallocated and to prevent
150	 * filesystem from being unmounted.
151	 */
152	lock_flags = VOP_ISLOCKED(vp);
153	vref(vp);
154	VOP_UNLOCK(vp, 0);
155
156	sx_xlock(&autofs_softc->sc_lock);
157
158	/*
159	 * XXX: Workaround for mounting the same thing multiple times; revisit.
160	 */
161	if (vp->v_mountedhere != NULL) {
162		error = 0;
163		goto mounted;
164	}
165
166	error = autofs_trigger(anp, path, pathlen);
167mounted:
168	sx_xunlock(&autofs_softc->sc_lock);
169	vn_lock(vp, lock_flags | LK_RETRY);
170	vunref(vp);
171	if ((vp->v_iflag & VI_DOOMED) != 0) {
172		AUTOFS_DEBUG("VI_DOOMED");
173		return (ENOENT);
174	}
175
176	if (error != 0)
177		return (error);
178
179	if (vp->v_mountedhere == NULL) {
180		*newvp = NULL;
181		return (0);
182	} else {
183		/*
184		 * If the operation that succeeded was mount, then mark
185		 * the node as non-cached.  Otherwise, if someone unmounts
186		 * the filesystem before the cache times out, we will fail
187		 * to trigger.
188		 */
189		anp->an_cached = false;
190	}
191
192	error = VFS_ROOT(vp->v_mountedhere, lock_flags, newvp);
193	if (error != 0) {
194		AUTOFS_WARN("VFS_ROOT() failed with error %d", error);
195		return (error);
196	}
197
198	return (0);
199}
200
201static int
202autofs_vget_callback(struct mount *mp, void *arg, int flags,
203    struct vnode **vpp)
204{
205
206
207	return (autofs_node_vn(arg, mp, flags, vpp));
208}
209
210static int
211autofs_lookup(struct vop_lookup_args *ap)
212{
213	struct vnode *dvp, *newvp, **vpp;
214	struct mount *mp;
215	struct autofs_mount *amp;
216	struct autofs_node *anp, *child;
217	struct componentname *cnp;
218	int error;
219
220	dvp = ap->a_dvp;
221	vpp = ap->a_vpp;
222	mp = dvp->v_mount;
223	amp = VFSTOAUTOFS(mp);
224	anp = dvp->v_data;
225	cnp = ap->a_cnp;
226
227	if (cnp->cn_flags & ISDOTDOT) {
228		KASSERT(anp->an_parent != NULL, ("NULL parent"));
229		/*
230		 * Note that in this case, dvp is the child vnode, and we
231		 * are looking up the parent vnode - exactly reverse from
232		 * normal operation.  Unlocking dvp requires some rather
233		 * tricky unlock/relock dance to prevent mp from being freed;
234		 * use vn_vget_ino_gen() which takes care of all that.
235		 */
236		error = vn_vget_ino_gen(dvp, autofs_vget_callback,
237		    anp->an_parent, cnp->cn_lkflags, vpp);
238		if (error != 0) {
239			AUTOFS_WARN("vn_vget_ino_gen() failed with error %d",
240			    error);
241			return (error);
242		}
243		return (error);
244	}
245
246	if (cnp->cn_namelen == 1 && cnp->cn_nameptr[0] == '.') {
247		vref(dvp);
248		*vpp = dvp;
249
250		return (0);
251	}
252
253	if (autofs_cached(anp, cnp->cn_nameptr, cnp->cn_namelen) == false &&
254	    autofs_ignore_thread(cnp->cn_thread) == false) {
255		error = autofs_trigger_vn(dvp,
256		    cnp->cn_nameptr, cnp->cn_namelen, &newvp);
257		if (error != 0)
258			return (error);
259
260		if (newvp != NULL) {
261			/*
262			 * The target filesystem got automounted.
263			 * Let the lookup(9) go around with the same
264			 * path component.
265			 */
266			vput(newvp);
267			return (ERELOOKUP);
268		}
269	}
270
271	AUTOFS_SLOCK(amp);
272	error = autofs_node_find(anp, cnp->cn_nameptr, cnp->cn_namelen, &child);
273	if (error != 0) {
274		if ((cnp->cn_flags & ISLASTCN) && cnp->cn_nameiop == CREATE) {
275			AUTOFS_SUNLOCK(amp);
276			return (EJUSTRETURN);
277		}
278
279		AUTOFS_SUNLOCK(amp);
280		return (ENOENT);
281	}
282
283	/*
284	 * XXX: Dropping the node here is ok, because we never remove nodes.
285	 */
286	AUTOFS_SUNLOCK(amp);
287
288	error = autofs_node_vn(child, mp, cnp->cn_lkflags, vpp);
289	if (error != 0) {
290		if ((cnp->cn_flags & ISLASTCN) && cnp->cn_nameiop == CREATE)
291			return (EJUSTRETURN);
292
293		return (error);
294	}
295
296	return (0);
297}
298
299static int
300autofs_mkdir(struct vop_mkdir_args *ap)
301{
302	struct vnode *vp;
303	struct autofs_node *anp;
304	struct autofs_mount *amp;
305	struct autofs_node *child;
306	int error;
307
308	vp = ap->a_dvp;
309	anp = vp->v_data;
310	amp = VFSTOAUTOFS(vp->v_mount);
311
312	/*
313	 * Do not allow mkdir() if the calling thread is not
314	 * automountd(8) descendant.
315	 */
316	if (autofs_ignore_thread(curthread) == false)
317		return (EPERM);
318
319	AUTOFS_XLOCK(amp);
320	error = autofs_node_new(anp, amp, ap->a_cnp->cn_nameptr,
321	    ap->a_cnp->cn_namelen, &child);
322	if (error != 0) {
323		AUTOFS_XUNLOCK(amp);
324		return (error);
325	}
326	AUTOFS_XUNLOCK(amp);
327
328	error = autofs_node_vn(child, vp->v_mount, LK_EXCLUSIVE, ap->a_vpp);
329
330	return (error);
331}
332
333/*
334 * Write out a single 'struct dirent', based on 'name' and 'fileno' arguments.
335 */
336static int
337autofs_readdir_one(struct uio *uio, const char *name, int fileno,
338    size_t *reclenp)
339{
340	struct dirent dirent;
341	size_t namlen, padded_namlen, reclen;
342	int error;
343
344	namlen = strlen(name);
345	padded_namlen = roundup2(namlen + 1, __alignof(struct dirent));
346	KASSERT(padded_namlen <= MAXNAMLEN, ("%zd > MAXNAMLEN", padded_namlen));
347	reclen = offsetof(struct dirent, d_name) + padded_namlen;
348
349	if (reclenp != NULL)
350		*reclenp = reclen;
351
352	if (uio == NULL)
353		return (0);
354
355	if (uio->uio_resid < reclen)
356		return (EINVAL);
357
358	dirent.d_fileno = fileno;
359	dirent.d_reclen = reclen;
360	dirent.d_type = DT_DIR;
361	dirent.d_namlen = namlen;
362	memcpy(dirent.d_name, name, namlen);
363	memset(dirent.d_name + namlen, 0, padded_namlen - namlen);
364	error = uiomove(&dirent, reclen, uio);
365
366	return (error);
367}
368
369static size_t
370autofs_dirent_reclen(const char *name)
371{
372	size_t reclen;
373
374	(void)autofs_readdir_one(NULL, name, -1, &reclen);
375
376	return (reclen);
377}
378
379static int
380autofs_readdir(struct vop_readdir_args *ap)
381{
382	struct vnode *vp, *newvp;
383	struct autofs_mount *amp;
384	struct autofs_node *anp, *child;
385	struct uio *uio;
386	size_t reclen, reclens;
387	ssize_t initial_resid;
388	int error;
389
390	vp = ap->a_vp;
391	amp = VFSTOAUTOFS(vp->v_mount);
392	anp = vp->v_data;
393	uio = ap->a_uio;
394	initial_resid = ap->a_uio->uio_resid;
395
396	KASSERT(vp->v_type == VDIR, ("!VDIR"));
397
398	if (autofs_cached(anp, NULL, 0) == false &&
399	    autofs_ignore_thread(curthread) == false) {
400		error = autofs_trigger_vn(vp, "", 0, &newvp);
401		if (error != 0)
402			return (error);
403
404		if (newvp != NULL) {
405			error = VOP_READDIR(newvp, ap->a_uio, ap->a_cred,
406			    ap->a_eofflag, ap->a_ncookies, ap->a_cookies);
407			vput(newvp);
408			return (error);
409		}
410	}
411
412	if (uio->uio_offset < 0)
413		return (EINVAL);
414
415	if (ap->a_eofflag != NULL)
416		*ap->a_eofflag = FALSE;
417
418	/*
419	 * Write out the directory entry for ".".  This is conditional
420	 * on the current offset into the directory; same applies to the
421	 * other two cases below.
422	 */
423	if (uio->uio_offset == 0) {
424		error = autofs_readdir_one(uio, ".", anp->an_fileno, &reclen);
425		if (error != 0)
426			goto out;
427	}
428	reclens = autofs_dirent_reclen(".");
429
430	/*
431	 * Write out the directory entry for "..".
432	 */
433	if (uio->uio_offset <= reclens) {
434		if (uio->uio_offset != reclens)
435			return (EINVAL);
436		if (anp->an_parent == NULL) {
437			error = autofs_readdir_one(uio, "..",
438			    anp->an_fileno, &reclen);
439		} else {
440			error = autofs_readdir_one(uio, "..",
441			    anp->an_parent->an_fileno, &reclen);
442		}
443		if (error != 0)
444			goto out;
445	}
446
447	reclens += autofs_dirent_reclen("..");
448
449	/*
450	 * Write out the directory entries for subdirectories.
451	 */
452	AUTOFS_SLOCK(amp);
453	TAILQ_FOREACH(child, &anp->an_children, an_next) {
454		/*
455		 * Check the offset to skip entries returned by previous
456		 * calls to getdents().
457		 */
458		if (uio->uio_offset > reclens) {
459			reclens += autofs_dirent_reclen(child->an_name);
460			continue;
461		}
462
463		/*
464		 * Prevent seeking into the middle of dirent.
465		 */
466		if (uio->uio_offset != reclens) {
467			AUTOFS_SUNLOCK(amp);
468			return (EINVAL);
469		}
470
471		error = autofs_readdir_one(uio, child->an_name,
472		    child->an_fileno, &reclen);
473		reclens += reclen;
474		if (error != 0) {
475			AUTOFS_SUNLOCK(amp);
476			goto out;
477		}
478	}
479	AUTOFS_SUNLOCK(amp);
480
481	if (ap->a_eofflag != NULL)
482		*ap->a_eofflag = TRUE;
483
484	return (0);
485
486out:
487	/*
488	 * Return error if the initial buffer was too small to do anything.
489	 */
490	if (uio->uio_resid == initial_resid)
491		return (error);
492
493	/*
494	 * Don't return an error if we managed to copy out some entries.
495	 */
496	if (uio->uio_resid < reclen)
497		return (0);
498
499	return (error);
500}
501
502static int
503autofs_reclaim(struct vop_reclaim_args *ap)
504{
505	struct vnode *vp;
506	struct autofs_node *anp;
507
508	vp = ap->a_vp;
509	anp = vp->v_data;
510
511	/*
512	 * We do not free autofs_node here; instead we are
513	 * destroying them in autofs_node_delete().
514	 */
515	sx_xlock(&anp->an_vnode_lock);
516	anp->an_vnode = NULL;
517	vp->v_data = NULL;
518	sx_xunlock(&anp->an_vnode_lock);
519
520	return (0);
521}
522
523struct vop_vector autofs_vnodeops = {
524	.vop_default =		&default_vnodeops,
525
526	.vop_access =		autofs_access,
527	.vop_lookup =		autofs_lookup,
528	.vop_create =		VOP_EOPNOTSUPP,
529	.vop_getattr =		autofs_getattr,
530	.vop_link =		VOP_EOPNOTSUPP,
531	.vop_mkdir =		autofs_mkdir,
532	.vop_mknod =		VOP_EOPNOTSUPP,
533	.vop_read =		VOP_EOPNOTSUPP,
534	.vop_readdir =		autofs_readdir,
535	.vop_remove =		VOP_EOPNOTSUPP,
536	.vop_rename =		VOP_EOPNOTSUPP,
537	.vop_rmdir =		VOP_EOPNOTSUPP,
538	.vop_setattr =		VOP_EOPNOTSUPP,
539	.vop_symlink =		VOP_EOPNOTSUPP,
540	.vop_write =		VOP_EOPNOTSUPP,
541	.vop_reclaim =		autofs_reclaim,
542};
543
544int
545autofs_node_new(struct autofs_node *parent, struct autofs_mount *amp,
546    const char *name, int namelen, struct autofs_node **anpp)
547{
548	struct autofs_node *anp;
549
550	if (parent != NULL) {
551		AUTOFS_ASSERT_XLOCKED(parent->an_mount);
552
553		KASSERT(autofs_node_find(parent, name, namelen, NULL) == ENOENT,
554		    ("node \"%s\" already exists", name));
555	}
556
557	anp = uma_zalloc(autofs_node_zone, M_WAITOK | M_ZERO);
558	if (namelen >= 0)
559		anp->an_name = strndup(name, namelen, M_AUTOFS);
560	else
561		anp->an_name = strdup(name, M_AUTOFS);
562	anp->an_fileno = atomic_fetchadd_int(&amp->am_last_fileno, 1);
563	callout_init(&anp->an_callout, 1);
564	/*
565	 * The reason for SX_NOWITNESS here is that witness(4)
566	 * cannot tell vnodes apart, so the following perfectly
567	 * valid lock order...
568	 *
569	 * vnode lock A -> autofsvlk B -> vnode lock B
570	 *
571	 * ... gets reported as a LOR.
572	 */
573	sx_init_flags(&anp->an_vnode_lock, "autofsvlk", SX_NOWITNESS);
574	getnanotime(&anp->an_ctime);
575	anp->an_parent = parent;
576	anp->an_mount = amp;
577	if (parent != NULL)
578		TAILQ_INSERT_TAIL(&parent->an_children, anp, an_next);
579	TAILQ_INIT(&anp->an_children);
580
581	*anpp = anp;
582	return (0);
583}
584
585int
586autofs_node_find(struct autofs_node *parent, const char *name,
587    int namelen, struct autofs_node **anpp)
588{
589	struct autofs_node *anp;
590
591	AUTOFS_ASSERT_LOCKED(parent->an_mount);
592
593	TAILQ_FOREACH(anp, &parent->an_children, an_next) {
594		if (namelen >= 0) {
595			if (strlen(anp->an_name) != namelen)
596				continue;
597			if (strncmp(anp->an_name, name, namelen) != 0)
598				continue;
599		} else {
600			if (strcmp(anp->an_name, name) != 0)
601				continue;
602		}
603
604		if (anpp != NULL)
605			*anpp = anp;
606		return (0);
607	}
608
609	return (ENOENT);
610}
611
612void
613autofs_node_delete(struct autofs_node *anp)
614{
615	struct autofs_node *parent;
616
617	AUTOFS_ASSERT_XLOCKED(anp->an_mount);
618	KASSERT(TAILQ_EMPTY(&anp->an_children), ("have children"));
619
620	callout_drain(&anp->an_callout);
621
622	parent = anp->an_parent;
623	if (parent != NULL)
624		TAILQ_REMOVE(&parent->an_children, anp, an_next);
625	sx_destroy(&anp->an_vnode_lock);
626	free(anp->an_name, M_AUTOFS);
627	uma_zfree(autofs_node_zone, anp);
628}
629
630int
631autofs_node_vn(struct autofs_node *anp, struct mount *mp, int flags,
632    struct vnode **vpp)
633{
634	struct vnode *vp;
635	int error;
636
637	AUTOFS_ASSERT_UNLOCKED(anp->an_mount);
638
639	sx_xlock(&anp->an_vnode_lock);
640
641	vp = anp->an_vnode;
642	if (vp != NULL) {
643		error = vget(vp, flags | LK_RETRY, curthread);
644		if (error != 0) {
645			AUTOFS_WARN("vget failed with error %d", error);
646			sx_xunlock(&anp->an_vnode_lock);
647			return (error);
648		}
649		if (vp->v_iflag & VI_DOOMED) {
650			/*
651			 * We got forcibly unmounted.
652			 */
653			AUTOFS_DEBUG("doomed vnode");
654			sx_xunlock(&anp->an_vnode_lock);
655			vput(vp);
656
657			return (ENOENT);
658		}
659
660		*vpp = vp;
661		sx_xunlock(&anp->an_vnode_lock);
662		return (0);
663	}
664
665	error = getnewvnode("autofs", mp, &autofs_vnodeops, &vp);
666	if (error != 0) {
667		sx_xunlock(&anp->an_vnode_lock);
668		return (error);
669	}
670
671	error = vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
672	if (error != 0) {
673		sx_xunlock(&anp->an_vnode_lock);
674		vdrop(vp);
675		return (error);
676	}
677
678	vp->v_type = VDIR;
679	if (anp->an_parent == NULL)
680		vp->v_vflag |= VV_ROOT;
681	vp->v_data = anp;
682
683	VN_LOCK_ASHARE(vp);
684
685	error = insmntque(vp, mp);
686	if (error != 0) {
687		AUTOFS_WARN("insmntque() failed with error %d", error);
688		sx_xunlock(&anp->an_vnode_lock);
689		return (error);
690	}
691
692	KASSERT(anp->an_vnode == NULL, ("lost race"));
693	anp->an_vnode = vp;
694
695	sx_xunlock(&anp->an_vnode_lock);
696
697	*vpp = vp;
698	return (0);
699}
700