zfs_ioctl.c revision 249319
1168404Spjd/*
2168404Spjd * CDDL HEADER START
3168404Spjd *
4168404Spjd * The contents of this file are subject to the terms of the
5168404Spjd * Common Development and Distribution License (the "License").
6168404Spjd * You may not use this file except in compliance with the License.
7168404Spjd *
8168404Spjd * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9168404Spjd * or http://www.opensolaris.org/os/licensing.
10168404Spjd * See the License for the specific language governing permissions
11168404Spjd * and limitations under the License.
12168404Spjd *
13168404Spjd * When distributing Covered Code, include this CDDL HEADER in each
14168404Spjd * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15168404Spjd * If applicable, add the following below this CDDL HEADER, with the
16168404Spjd * fields enclosed by brackets "[]" replaced with your own identifying
17168404Spjd * information: Portions Copyright [yyyy] [name of copyright owner]
18168404Spjd *
19168404Spjd * CDDL HEADER END
20168404Spjd */
21236884Smm
22168404Spjd/*
23219089Spjd * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
24230438Spjd * Copyright (c) 2011-2012 Pawel Jakub Dawidek <pawel@dawidek.net>.
25226707Spjd * All rights reserved.
26247540Smm * Copyright 2013 Martin Matuska <mm@FreeBSD.org>. All rights reserved.
27228103Smm * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
28248571Smm * Copyright (c) 2012, Joyent, Inc. All rights reserved.
29249195Smm * Copyright (c) 2013 by Delphix. All rights reserved.
30246586Sdelphij * Copyright (c) 2013 by Saso Kiselkov. All rights reserved.
31168404Spjd */
32168404Spjd
33248571Smm/*
34248571Smm * ZFS ioctls.
35248571Smm *
36248571Smm * This file handles the ioctls to /dev/zfs, used for configuring ZFS storage
37248571Smm * pools and filesystems, e.g. with /sbin/zfs and /sbin/zpool.
38248571Smm *
39248571Smm * There are two ways that we handle ioctls: the legacy way where almost
40248571Smm * all of the logic is in the ioctl callback, and the new way where most
41248571Smm * of the marshalling is handled in the common entry point, zfsdev_ioctl().
42248571Smm *
43248571Smm * Non-legacy ioctls should be registered by calling
44248571Smm * zfs_ioctl_register() from zfs_ioctl_init().  The ioctl is invoked
45248571Smm * from userland by lzc_ioctl().
46248571Smm *
47248571Smm * The registration arguments are as follows:
48248571Smm *
49248571Smm * const char *name
50248571Smm *   The name of the ioctl.  This is used for history logging.  If the
51248571Smm *   ioctl returns successfully (the callback returns 0), and allow_log
52248571Smm *   is true, then a history log entry will be recorded with the input &
53248571Smm *   output nvlists.  The log entry can be printed with "zpool history -i".
54248571Smm *
55248571Smm * zfs_ioc_t ioc
56248571Smm *   The ioctl request number, which userland will pass to ioctl(2).
57248571Smm *   The ioctl numbers can change from release to release, because
58248571Smm *   the caller (libzfs) must be matched to the kernel.
59248571Smm *
60248571Smm * zfs_secpolicy_func_t *secpolicy
61248571Smm *   This function will be called before the zfs_ioc_func_t, to
62248571Smm *   determine if this operation is permitted.  It should return EPERM
63248571Smm *   on failure, and 0 on success.  Checks include determining if the
64248571Smm *   dataset is visible in this zone, and if the user has either all
65248571Smm *   zfs privileges in the zone (SYS_MOUNT), or has been granted permission
66248571Smm *   to do this operation on this dataset with "zfs allow".
67248571Smm *
68248571Smm * zfs_ioc_namecheck_t namecheck
69248571Smm *   This specifies what to expect in the zfs_cmd_t:zc_name -- a pool
70248571Smm *   name, a dataset name, or nothing.  If the name is not well-formed,
71248571Smm *   the ioctl will fail and the callback will not be called.
72248571Smm *   Therefore, the callback can assume that the name is well-formed
73248571Smm *   (e.g. is null-terminated, doesn't have more than one '@' character,
74248571Smm *   doesn't have invalid characters).
75248571Smm *
76248571Smm * zfs_ioc_poolcheck_t pool_check
77248571Smm *   This specifies requirements on the pool state.  If the pool does
78248571Smm *   not meet them (is suspended or is readonly), the ioctl will fail
79248571Smm *   and the callback will not be called.  If any checks are specified
80248571Smm *   (i.e. it is not POOL_CHECK_NONE), namecheck must not be NO_NAME.
81248571Smm *   Multiple checks can be or-ed together (e.g. POOL_CHECK_SUSPENDED |
82248571Smm *   POOL_CHECK_READONLY).
83248571Smm *
84248571Smm * boolean_t smush_outnvlist
85248571Smm *   If smush_outnvlist is true, then the output is presumed to be a
86248571Smm *   list of errors, and it will be "smushed" down to fit into the
87248571Smm *   caller's buffer, by removing some entries and replacing them with a
88248571Smm *   single "N_MORE_ERRORS" entry indicating how many were removed.  See
89248571Smm *   nvlist_smush() for details.  If smush_outnvlist is false, and the
90248571Smm *   outnvlist does not fit into the userland-provided buffer, then the
91248571Smm *   ioctl will fail with ENOMEM.
92248571Smm *
93248571Smm * zfs_ioc_func_t *func
94248571Smm *   The callback function that will perform the operation.
95248571Smm *
96248571Smm *   The callback should return 0 on success, or an error number on
97248571Smm *   failure.  If the function fails, the userland ioctl will return -1,
98248571Smm *   and errno will be set to the callback's return value.  The callback
99248571Smm *   will be called with the following arguments:
100248571Smm *
101248571Smm *   const char *name
102248571Smm *     The name of the pool or dataset to operate on, from
103248571Smm *     zfs_cmd_t:zc_name.  The 'namecheck' argument specifies the
104248571Smm *     expected type (pool, dataset, or none).
105248571Smm *
106248571Smm *   nvlist_t *innvl
107248571Smm *     The input nvlist, deserialized from zfs_cmd_t:zc_nvlist_src.  Or
108248571Smm *     NULL if no input nvlist was provided.  Changes to this nvlist are
109248571Smm *     ignored.  If the input nvlist could not be deserialized, the
110248571Smm *     ioctl will fail and the callback will not be called.
111248571Smm *
112248571Smm *   nvlist_t *outnvl
113248571Smm *     The output nvlist, initially empty.  The callback can fill it in,
114248571Smm *     and it will be returned to userland by serializing it into
115248571Smm *     zfs_cmd_t:zc_nvlist_dst.  If it is non-empty, and serialization
116248571Smm *     fails (e.g. because the caller didn't supply a large enough
117248571Smm *     buffer), then the overall ioctl will fail.  See the
 *     'smush_outnvlist' argument above for additional behaviors.
119248571Smm *
120248571Smm *     There are two typical uses of the output nvlist:
121248571Smm *       - To return state, e.g. property values.  In this case,
122248571Smm *         smush_outnvlist should be false.  If the buffer was not large
123248571Smm *         enough, the caller will reallocate a larger buffer and try
124248571Smm *         the ioctl again.
125248571Smm *
126248571Smm *       - To return multiple errors from an ioctl which makes on-disk
127248571Smm *         changes.  In this case, smush_outnvlist should be true.
128248571Smm *         Ioctls which make on-disk modifications should generally not
129248571Smm *         use the outnvl if they succeed, because the caller can not
130248571Smm *         distinguish between the operation failing, and
131248571Smm *         deserialization failing.
132248571Smm */
133248571Smm
134168962Spjd#include <sys/types.h>
135168404Spjd#include <sys/param.h>
136168404Spjd#include <sys/systm.h>
137168404Spjd#include <sys/conf.h>
138168404Spjd#include <sys/kernel.h>
139168404Spjd#include <sys/lock.h>
140168404Spjd#include <sys/malloc.h>
141168404Spjd#include <sys/mutex.h>
142168404Spjd#include <sys/proc.h>
143168404Spjd#include <sys/errno.h>
144168404Spjd#include <sys/uio.h>
145168962Spjd#include <sys/buf.h>
146168404Spjd#include <sys/file.h>
147168404Spjd#include <sys/kmem.h>
148168404Spjd#include <sys/conf.h>
149168404Spjd#include <sys/cmn_err.h>
150168404Spjd#include <sys/stat.h>
151168404Spjd#include <sys/zfs_ioctl.h>
152209962Smm#include <sys/zfs_vfsops.h>
153185029Spjd#include <sys/zfs_znode.h>
154168404Spjd#include <sys/zap.h>
155168404Spjd#include <sys/spa.h>
156168404Spjd#include <sys/spa_impl.h>
157168404Spjd#include <sys/vdev.h>
158168404Spjd#include <sys/dmu.h>
159168404Spjd#include <sys/dsl_dir.h>
160168404Spjd#include <sys/dsl_dataset.h>
161168404Spjd#include <sys/dsl_prop.h>
162185029Spjd#include <sys/dsl_deleg.h>
163185029Spjd#include <sys/dmu_objset.h>
164235222Smm#include <sys/dmu_impl.h>
165248571Smm#include <sys/dmu_tx.h>
166168962Spjd#include <sys/sunddi.h>
167168962Spjd#include <sys/policy.h>
168168962Spjd#include <sys/zone.h>
169168404Spjd#include <sys/nvpair.h>
170168404Spjd#include <sys/mount.h>
171168404Spjd#include <sys/taskqueue.h>
172168404Spjd#include <sys/sdt.h>
173168404Spjd#include <sys/varargs.h>
174168404Spjd#include <sys/fs/zfs.h>
175168404Spjd#include <sys/zfs_ctldir.h>
176185029Spjd#include <sys/zfs_dir.h>
177219089Spjd#include <sys/zfs_onexit.h>
178168404Spjd#include <sys/zvol.h>
179219089Spjd#include <sys/dsl_scan.h>
180185029Spjd#include <sys/dmu_objset.h>
181248571Smm#include <sys/dmu_send.h>
182248571Smm#include <sys/dsl_destroy.h>
183248571Smm#include <sys/dsl_userhold.h>
184246586Sdelphij#include <sys/zfeature.h>
185168404Spjd
186168404Spjd#include "zfs_namecheck.h"
187168404Spjd#include "zfs_prop.h"
188185029Spjd#include "zfs_deleg.h"
189219089Spjd#include "zfs_comutil.h"
190219089Spjd#include "zfs_ioctl_compat.h"
191168404Spjd
192219089SpjdCTASSERT(sizeof(zfs_cmd_t) < IOCPARM_MAX);
193168404Spjd
194230397Spjdstatic int snapshot_list_prefetch;
195230397SpjdSYSCTL_DECL(_vfs_zfs);
196230397SpjdTUNABLE_INT("vfs.zfs.snapshot_list_prefetch", &snapshot_list_prefetch);
197230397SpjdSYSCTL_INT(_vfs_zfs, OID_AUTO, snapshot_list_prefetch, CTLFLAG_RW,
198230397Spjd    &snapshot_list_prefetch, 0, "Prefetch data when listing snapshots");
199230397Spjd
200168404Spjdstatic struct cdev *zfsdev;
201168404Spjd
202168404Spjdextern void zfs_init(void);
203168404Spjdextern void zfs_fini(void);
204168404Spjd
205248571Smmuint_t zfs_fsyncer_key;
206248571Smmextern uint_t rrw_tsd_key;
207248571Smmstatic uint_t zfs_allow_log_key;
208168404Spjd
209248571Smmtypedef int zfs_ioc_legacy_func_t(zfs_cmd_t *);
210248571Smmtypedef int zfs_ioc_func_t(const char *, nvlist_t *, nvlist_t *);
211248571Smmtypedef int zfs_secpolicy_func_t(zfs_cmd_t *, nvlist_t *, cred_t *);
212248571Smm
/* What zfs_cmd_t:zc_name is expected to contain for a given ioctl. */
typedef enum {
	NO_NAME = 0,		/* nothing */
	POOL_NAME = 1,		/* a pool name */
	DATASET_NAME = 2	/* a dataset name */
} zfs_ioc_namecheck_t;
218209962Smm
/*
 * Requirements on the pool state for a given ioctl.  These are bit flags
 * and may be or-ed together.
 */
typedef enum {
	POOL_CHECK_NONE		= 1 << 0,
	POOL_CHECK_SUSPENDED	= 1 << 1,
	POOL_CHECK_READONLY	= 1 << 2
} zfs_ioc_poolcheck_t;
224246688Smm
225168404Spjdtypedef struct zfs_ioc_vec {
226248571Smm	zfs_ioc_legacy_func_t	*zvec_legacy_func;
227168404Spjd	zfs_ioc_func_t		*zvec_func;
228168404Spjd	zfs_secpolicy_func_t	*zvec_secpolicy;
229209962Smm	zfs_ioc_namecheck_t	zvec_namecheck;
230248571Smm	boolean_t		zvec_allow_log;
231246688Smm	zfs_ioc_poolcheck_t	zvec_pool_check;
232248571Smm	boolean_t		zvec_smush_outnvlist;
233248571Smm	const char		*zvec_name;
234168404Spjd} zfs_ioc_vec_t;
235168404Spjd
236209962Smm/* This array is indexed by zfs_userquota_prop_t */
237209962Smmstatic const char *userquota_perms[] = {
238209962Smm	ZFS_DELEG_PERM_USERUSED,
239209962Smm	ZFS_DELEG_PERM_USERQUOTA,
240209962Smm	ZFS_DELEG_PERM_GROUPUSED,
241209962Smm	ZFS_DELEG_PERM_GROUPQUOTA,
242209962Smm};
243209962Smm
244209962Smmstatic int zfs_ioc_userspace_upgrade(zfs_cmd_t *zc);
245219089Spjdstatic int zfs_check_settable(const char *name, nvpair_t *property,
246219089Spjd    cred_t *cr);
247219089Spjdstatic int zfs_check_clearable(char *dataset, nvlist_t *props,
248219089Spjd    nvlist_t **errors);
249185029Spjdstatic int zfs_fill_zplprops_root(uint64_t, nvlist_t *, nvlist_t *,
250185029Spjd    boolean_t *);
251248571Smmint zfs_set_prop_nvlist(const char *, zprop_source_t, nvlist_t *, nvlist_t *);
252248571Smmstatic int get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp);
253219089Spjd
254219089Spjdstatic void zfsdev_close(void *data);
255185029Spjd
256248571Smmstatic int zfs_prop_activate_feature(spa_t *spa, zfeature_info_t *feature);
257246586Sdelphij
258168404Spjd/* _NOTE(PRINTFLIKE(4)) - this is printf-like, but lint is too whiney */
259168404Spjdvoid
260168404Spjd__dprintf(const char *file, const char *func, int line, const char *fmt, ...)
261168404Spjd{
262168404Spjd	const char *newfile;
263219089Spjd	char buf[512];
264168404Spjd	va_list adx;
265168404Spjd
266168404Spjd	/*
267168404Spjd	 * Get rid of annoying "../common/" prefix to filename.
268168404Spjd	 */
269168404Spjd	newfile = strrchr(file, '/');
270168404Spjd	if (newfile != NULL) {
271168404Spjd		newfile = newfile + 1; /* Get rid of leading / */
272168404Spjd	} else {
273168404Spjd		newfile = file;
274168404Spjd	}
275168404Spjd
276168404Spjd	va_start(adx, fmt);
277168404Spjd	(void) vsnprintf(buf, sizeof (buf), fmt, adx);
278168404Spjd	va_end(adx);
279168404Spjd
280168404Spjd	/*
281168404Spjd	 * To get this data, use the zfs-dprintf probe as so:
282168404Spjd	 * dtrace -q -n 'zfs-dprintf \
283168404Spjd	 *	/stringof(arg0) == "dbuf.c"/ \
284168404Spjd	 *	{printf("%s: %s", stringof(arg1), stringof(arg3))}'
285168404Spjd	 * arg0 = file name
286168404Spjd	 * arg1 = function name
287168404Spjd	 * arg2 = line number
288168404Spjd	 * arg3 = message
289168404Spjd	 */
290168404Spjd	DTRACE_PROBE4(zfs__dprintf,
291168404Spjd	    char *, newfile, char *, func, int, line, char *, buf);
292168404Spjd}
293168404Spjd
294185029Spjdstatic void
295185029Spjdhistory_str_free(char *buf)
296185029Spjd{
297185029Spjd	kmem_free(buf, HIS_MAX_RECORD_LEN);
298185029Spjd}
299185029Spjd
300185029Spjdstatic char *
301185029Spjdhistory_str_get(zfs_cmd_t *zc)
302185029Spjd{
303185029Spjd	char *buf;
304185029Spjd
305185029Spjd	if (zc->zc_history == 0)
306185029Spjd		return (NULL);
307185029Spjd
308185029Spjd	buf = kmem_alloc(HIS_MAX_RECORD_LEN, KM_SLEEP);
309185029Spjd	if (copyinstr((void *)(uintptr_t)zc->zc_history,
310185029Spjd	    buf, HIS_MAX_RECORD_LEN, NULL) != 0) {
311185029Spjd		history_str_free(buf);
312185029Spjd		return (NULL);
313185029Spjd	}
314185029Spjd
315185029Spjd	buf[HIS_MAX_RECORD_LEN -1] = '\0';
316185029Spjd
317185029Spjd	return (buf);
318185029Spjd}
319185029Spjd
320168404Spjd/*
321185029Spjd * Check to see if the named dataset is currently defined as bootable
322185029Spjd */
323185029Spjdstatic boolean_t
324185029Spjdzfs_is_bootfs(const char *name)
325185029Spjd{
326219089Spjd	objset_t *os;
327185029Spjd
328219089Spjd	if (dmu_objset_hold(name, FTAG, &os) == 0) {
329219089Spjd		boolean_t ret;
330219089Spjd		ret = (dmu_objset_id(os) == spa_bootfs(dmu_objset_spa(os)));
331219089Spjd		dmu_objset_rele(os, FTAG);
332219089Spjd		return (ret);
333185029Spjd	}
334219089Spjd	return (B_FALSE);
335185029Spjd}
336185029Spjd
337185029Spjd/*
338185029Spjd * zfs_earlier_version
339185029Spjd *
340185029Spjd *	Return non-zero if the spa version is less than requested version.
341185029Spjd */
342185029Spjdstatic int
343185029Spjdzfs_earlier_version(const char *name, int version)
344185029Spjd{
345185029Spjd	spa_t *spa;
346185029Spjd
347185029Spjd	if (spa_open(name, &spa, FTAG) == 0) {
348185029Spjd		if (spa_version(spa) < version) {
349185029Spjd			spa_close(spa, FTAG);
350185029Spjd			return (1);
351185029Spjd		}
352185029Spjd		spa_close(spa, FTAG);
353185029Spjd	}
354185029Spjd	return (0);
355185029Spjd}
356185029Spjd
357185029Spjd/*
358185029Spjd * zpl_earlier_version
359185029Spjd *
360185029Spjd * Return TRUE if the ZPL version is less than requested version.
361185029Spjd */
362185029Spjdstatic boolean_t
363185029Spjdzpl_earlier_version(const char *name, int version)
364185029Spjd{
365185029Spjd	objset_t *os;
366185029Spjd	boolean_t rc = B_TRUE;
367185029Spjd
368219089Spjd	if (dmu_objset_hold(name, FTAG, &os) == 0) {
369185029Spjd		uint64_t zplversion;
370185029Spjd
371219089Spjd		if (dmu_objset_type(os) != DMU_OST_ZFS) {
372219089Spjd			dmu_objset_rele(os, FTAG);
373219089Spjd			return (B_TRUE);
374219089Spjd		}
375219089Spjd		/* XXX reading from non-owned objset */
376185029Spjd		if (zfs_get_zplprop(os, ZFS_PROP_VERSION, &zplversion) == 0)
377185029Spjd			rc = zplversion < version;
378219089Spjd		dmu_objset_rele(os, FTAG);
379185029Spjd	}
380185029Spjd	return (rc);
381185029Spjd}
382185029Spjd
383185029Spjdstatic void
384185029Spjdzfs_log_history(zfs_cmd_t *zc)
385185029Spjd{
386185029Spjd	spa_t *spa;
387185029Spjd	char *buf;
388185029Spjd
389185029Spjd	if ((buf = history_str_get(zc)) == NULL)
390185029Spjd		return;
391185029Spjd
392185029Spjd	if (spa_open(zc->zc_name, &spa, FTAG) == 0) {
393185029Spjd		if (spa_version(spa) >= SPA_VERSION_ZPOOL_HISTORY)
394248571Smm			(void) spa_history_log(spa, buf);
395185029Spjd		spa_close(spa, FTAG);
396185029Spjd	}
397185029Spjd	history_str_free(buf);
398185029Spjd}
399185029Spjd
400185029Spjd/*
401168404Spjd * Policy for top-level read operations (list pools).  Requires no privileges,
402168404Spjd * and can be used in the local zone, as there is no associated dataset.
403168404Spjd */
404168404Spjd/* ARGSUSED */
405168404Spjdstatic int
406248571Smmzfs_secpolicy_none(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
407168404Spjd{
408168404Spjd	return (0);
409168404Spjd}
410168404Spjd
411168404Spjd/*
412168404Spjd * Policy for dataset read operations (list children, get statistics).  Requires
413168404Spjd * no privileges, but must be visible in the local zone.
414168404Spjd */
415168404Spjd/* ARGSUSED */
416168404Spjdstatic int
417248571Smmzfs_secpolicy_read(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
418168404Spjd{
419185029Spjd	if (INGLOBALZONE(curthread) ||
420185029Spjd	    zone_dataset_visible(zc->zc_name, NULL))
421168404Spjd		return (0);
422168404Spjd
423249195Smm	return (SET_ERROR(ENOENT));
424168404Spjd}
425168404Spjd
426168404Spjdstatic int
427219089Spjdzfs_dozonecheck_impl(const char *dataset, uint64_t zoned, cred_t *cr)
428168404Spjd{
429168404Spjd	int writable = 1;
430168404Spjd
431168404Spjd	/*
432168404Spjd	 * The dataset must be visible by this zone -- check this first
433168404Spjd	 * so they don't see EPERM on something they shouldn't know about.
434168404Spjd	 */
435185029Spjd	if (!INGLOBALZONE(curthread) &&
436168404Spjd	    !zone_dataset_visible(dataset, &writable))
437249195Smm		return (SET_ERROR(ENOENT));
438168404Spjd
439185029Spjd	if (INGLOBALZONE(curthread)) {
440168404Spjd		/*
441168404Spjd		 * If the fs is zoned, only root can access it from the
442168404Spjd		 * global zone.
443168404Spjd		 */
444168404Spjd		if (secpolicy_zfs(cr) && zoned)
445249195Smm			return (SET_ERROR(EPERM));
446168404Spjd	} else {
447168404Spjd		/*
448168404Spjd		 * If we are in a local zone, the 'zoned' property must be set.
449168404Spjd		 */
450168404Spjd		if (!zoned)
451249195Smm			return (SET_ERROR(EPERM));
452168404Spjd
453168404Spjd		/* must be writable by this zone */
454168404Spjd		if (!writable)
455249195Smm			return (SET_ERROR(EPERM));
456168404Spjd	}
457168404Spjd	return (0);
458168404Spjd}
459168404Spjd
460219089Spjdstatic int
461219089Spjdzfs_dozonecheck(const char *dataset, cred_t *cr)
462219089Spjd{
463219089Spjd	uint64_t zoned;
464219089Spjd
465219089Spjd	if (dsl_prop_get_integer(dataset, "jailed", &zoned, NULL))
466249195Smm		return (SET_ERROR(ENOENT));
467219089Spjd
468219089Spjd	return (zfs_dozonecheck_impl(dataset, zoned, cr));
469219089Spjd}
470219089Spjd
471219089Spjdstatic int
472219089Spjdzfs_dozonecheck_ds(const char *dataset, dsl_dataset_t *ds, cred_t *cr)
473219089Spjd{
474219089Spjd	uint64_t zoned;
475219089Spjd
476248571Smm	if (dsl_prop_get_int_ds(ds, "jailed", &zoned))
477249195Smm		return (SET_ERROR(ENOENT));
478219089Spjd
479219089Spjd	return (zfs_dozonecheck_impl(dataset, zoned, cr));
480219089Spjd}
481219089Spjd
482248571Smmstatic int
483248571Smmzfs_secpolicy_write_perms_ds(const char *name, dsl_dataset_t *ds,
484248571Smm    const char *perm, cred_t *cr)
485168404Spjd{
486168404Spjd	int error;
487168404Spjd
488228103Smm	error = zfs_dozonecheck_ds(name, ds, cr);
489185029Spjd	if (error == 0) {
490185029Spjd		error = secpolicy_zfs(cr);
491248571Smm		if (error != 0)
492248571Smm			error = dsl_deleg_access_impl(ds, perm, cr);
493185029Spjd	}
494185029Spjd	return (error);
495185029Spjd}
496185029Spjd
497248571Smmstatic int
498248571Smmzfs_secpolicy_write_perms(const char *name, const char *perm, cred_t *cr)
499219089Spjd{
500219089Spjd	int error;
501248571Smm	dsl_dataset_t *ds;
502248571Smm	dsl_pool_t *dp;
503219089Spjd
504248571Smm	error = dsl_pool_hold(name, FTAG, &dp);
505248571Smm	if (error != 0)
506248571Smm		return (error);
507248571Smm
508248571Smm	error = dsl_dataset_hold(dp, name, FTAG, &ds);
509248571Smm	if (error != 0) {
510248571Smm		dsl_pool_rele(dp, FTAG);
511248571Smm		return (error);
512219089Spjd	}
513248571Smm
514248571Smm	error = zfs_secpolicy_write_perms_ds(name, ds, perm, cr);
515248571Smm
516248571Smm	dsl_dataset_rele(ds, FTAG);
517248571Smm	dsl_pool_rele(dp, FTAG);
518219089Spjd	return (error);
519219089Spjd}
520219089Spjd
#ifdef SECLABEL
/*
 * Policy for setting the security label property.
 *
 * name   - dataset whose label is being changed.
 * strval - requested label: ZFS_MLSLABEL_DEFAULT or a hex label string.
 * cr     - credentials checked for the upgrade/downgrade privilege.
 *
 * Returns 0 for success, non-zero for access and other errors.
 */
static int
zfs_set_slabel_policy(const char *name, char *strval, cred_t *cr)
{
	char		ds_hexsl[MAXNAMELEN];
	bslabel_t	ds_sl, new_sl;
	boolean_t	new_default = FALSE;
	uint64_t	zoned;
	int		needed_priv = -1;
	int		error;

	/* First get the existing dataset label. */
	error = dsl_prop_get(name, zfs_prop_to_name(ZFS_PROP_MLSLABEL),
	    1, sizeof (ds_hexsl), &ds_hexsl, NULL);
	if (error != 0)
		return (SET_ERROR(EPERM));

	if (strcasecmp(strval, ZFS_MLSLABEL_DEFAULT) == 0)
		new_default = TRUE;

	/* The label must be translatable */
	if (!new_default && (hexstr_to_label(strval, &new_sl) != 0))
		return (SET_ERROR(EINVAL));

	/*
	 * In a non-global zone, disallow attempts to set a label that
	 * doesn't match that of the zone; otherwise no other checks
	 * are needed.
	 */
	if (!INGLOBALZONE(curproc)) {
		if (new_default || !blequal(&new_sl, CR_SL(CRED())))
			return (SET_ERROR(EPERM));
		return (0);
	}

	/*
	 * For global-zone datasets (i.e., those whose zoned property is
	 * "off"), verify that the specified new label is valid for the
	 * global zone.
	 */
	if (dsl_prop_get_integer(name,
	    zfs_prop_to_name(ZFS_PROP_ZONED), &zoned, NULL))
		return (SET_ERROR(EPERM));
	if (!zoned) {
		if (zfs_check_global_label(name, strval) != 0)
			return (SET_ERROR(EPERM));
	}

	/*
	 * If the existing dataset label is nondefault, check if the
	 * dataset is mounted (label cannot be changed while mounted).
	 * Get the zfsvfs; if there isn't one, then the dataset isn't
	 * mounted (or isn't a dataset, doesn't exist, ...).
	 */
	if (strcasecmp(ds_hexsl, ZFS_MLSLABEL_DEFAULT) != 0) {
		objset_t *os;
		static char *setsl_tag = "setsl_tag";

		/*
		 * Try to own the dataset; abort if there is any error,
		 * (e.g., already mounted, in use, or other error).
		 */
		error = dmu_objset_own(name, DMU_OST_ZFS, B_TRUE,
		    setsl_tag, &os);
		if (error != 0)
			return (SET_ERROR(EPERM));

		dmu_objset_disown(os, setsl_tag);

		if (new_default) {
			needed_priv = PRIV_FILE_DOWNGRADE_SL;
			goto out_check;
		}

		if (hexstr_to_label(strval, &new_sl) != 0)
			return (SET_ERROR(EPERM));

		/*
		 * Translate the existing label as well: the dominance
		 * checks below compare binary labels, and ds_sl would
		 * otherwise be read uninitialized.
		 */
		if (hexstr_to_label(ds_hexsl, &ds_sl) != 0)
			return (SET_ERROR(EPERM));

		if (blstrictdom(&ds_sl, &new_sl))
			needed_priv = PRIV_FILE_DOWNGRADE_SL;
		else if (blstrictdom(&new_sl, &ds_sl))
			needed_priv = PRIV_FILE_UPGRADE_SL;
	} else {
		/* dataset currently has a default label */
		if (!new_default)
			needed_priv = PRIV_FILE_UPGRADE_SL;
	}

out_check:
	if (needed_priv != -1)
		return (PRIV_POLICY(cr, needed_priv, B_FALSE, EPERM, NULL));
	return (0);
}
#endif	/* SECLABEL */
619219089Spjd
620219089Spjdstatic int
621219089Spjdzfs_secpolicy_setprop(const char *dsname, zfs_prop_t prop, nvpair_t *propval,
622219089Spjd    cred_t *cr)
623219089Spjd{
624219089Spjd	char *strval;
625219089Spjd
626219089Spjd	/*
627185029Spjd	 * Check permissions for special properties.
628185029Spjd	 */
629185029Spjd	switch (prop) {
630185029Spjd	case ZFS_PROP_ZONED:
631185029Spjd		/*
632185029Spjd		 * Disallow setting of 'zoned' from within a local zone.
633185029Spjd		 */
634185029Spjd		if (!INGLOBALZONE(curthread))
635249195Smm			return (SET_ERROR(EPERM));
636185029Spjd		break;
637185029Spjd
638185029Spjd	case ZFS_PROP_QUOTA:
639185029Spjd		if (!INGLOBALZONE(curthread)) {
640185029Spjd			uint64_t zoned;
641185029Spjd			char setpoint[MAXNAMELEN];
642185029Spjd			/*
643185029Spjd			 * Unprivileged users are allowed to modify the
644185029Spjd			 * quota on things *under* (ie. contained by)
645185029Spjd			 * the thing they own.
646185029Spjd			 */
647219089Spjd			if (dsl_prop_get_integer(dsname, "jailed", &zoned,
648185029Spjd			    setpoint))
649249195Smm				return (SET_ERROR(EPERM));
650219089Spjd			if (!zoned || strlen(dsname) <= strlen(setpoint))
651249195Smm				return (SET_ERROR(EPERM));
652185029Spjd		}
653185029Spjd		break;
654219089Spjd
655219089Spjd	case ZFS_PROP_MLSLABEL:
656219089Spjd#ifdef SECLABEL
657219089Spjd		if (!is_system_labeled())
658249195Smm			return (SET_ERROR(EPERM));
659219089Spjd
660219089Spjd		if (nvpair_value_string(propval, &strval) == 0) {
661219089Spjd			int err;
662219089Spjd
663219089Spjd			err = zfs_set_slabel_policy(dsname, strval, CRED());
664219089Spjd			if (err != 0)
665219089Spjd				return (err);
666219089Spjd		}
667219089Spjd#else
668219089Spjd		return (EOPNOTSUPP);
669219089Spjd#endif
670219089Spjd		break;
671185029Spjd	}
672185029Spjd
673219089Spjd	return (zfs_secpolicy_write_perms(dsname, zfs_prop_to_name(prop), cr));
674185029Spjd}
675185029Spjd
676248571Smm/* ARGSUSED */
677248571Smmstatic int
678248571Smmzfs_secpolicy_set_fsacl(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
679185029Spjd{
680185029Spjd	int error;
681185029Spjd
682185029Spjd	error = zfs_dozonecheck(zc->zc_name, cr);
683248571Smm	if (error != 0)
684168404Spjd		return (error);
685168404Spjd
686185029Spjd	/*
687185029Spjd	 * permission to set permissions will be evaluated later in
688185029Spjd	 * dsl_deleg_can_allow()
689185029Spjd	 */
690185029Spjd	return (0);
691168404Spjd}
692168404Spjd
693248571Smm/* ARGSUSED */
694248571Smmstatic int
695248571Smmzfs_secpolicy_rollback(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
696185029Spjd{
697219089Spjd	return (zfs_secpolicy_write_perms(zc->zc_name,
698219089Spjd	    ZFS_DELEG_PERM_ROLLBACK, cr));
699185029Spjd}
700185029Spjd
701248571Smm/* ARGSUSED */
702248571Smmstatic int
703248571Smmzfs_secpolicy_send(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
704185029Spjd{
705219089Spjd	dsl_pool_t *dp;
706219089Spjd	dsl_dataset_t *ds;
707219089Spjd	char *cp;
708219089Spjd	int error;
709219089Spjd
710219089Spjd	/*
711219089Spjd	 * Generate the current snapshot name from the given objsetid, then
712219089Spjd	 * use that name for the secpolicy/zone checks.
713219089Spjd	 */
714219089Spjd	cp = strchr(zc->zc_name, '@');
715219089Spjd	if (cp == NULL)
716249195Smm		return (SET_ERROR(EINVAL));
717248571Smm	error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
718248571Smm	if (error != 0)
719219089Spjd		return (error);
720219089Spjd
721219089Spjd	error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &ds);
722248571Smm	if (error != 0) {
723248571Smm		dsl_pool_rele(dp, FTAG);
724219089Spjd		return (error);
725248571Smm	}
726219089Spjd
727219089Spjd	dsl_dataset_name(ds, zc->zc_name);
728219089Spjd
729219089Spjd	error = zfs_secpolicy_write_perms_ds(zc->zc_name, ds,
730219089Spjd	    ZFS_DELEG_PERM_SEND, cr);
731219089Spjd	dsl_dataset_rele(ds, FTAG);
732248571Smm	dsl_pool_rele(dp, FTAG);
733219089Spjd
734219089Spjd	return (error);
735185029Spjd}
736185029Spjd
737248571Smm/* ARGSUSED */
738209962Smmstatic int
739248571Smmzfs_secpolicy_send_new(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
740209962Smm{
741248571Smm	return (zfs_secpolicy_write_perms(zc->zc_name,
742248571Smm	    ZFS_DELEG_PERM_SEND, cr));
743248571Smm}
744248571Smm
745248571Smm/* ARGSUSED */
746248571Smmstatic int
747248571Smmzfs_secpolicy_deleg_share(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
748248571Smm{
749209962Smm	vnode_t *vp;
750209962Smm	int error;
751209962Smm
752209962Smm	if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
753209962Smm	    NO_FOLLOW, NULL, &vp)) != 0)
754209962Smm		return (error);
755209962Smm
756209962Smm	/* Now make sure mntpnt and dataset are ZFS */
757209962Smm
758209962Smm	if (strcmp(vp->v_vfsp->mnt_stat.f_fstypename, "zfs") != 0 ||
759209962Smm	    (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
760209962Smm	    zc->zc_name) != 0)) {
761209962Smm		VN_RELE(vp);
762249195Smm		return (SET_ERROR(EPERM));
763209962Smm	}
764209962Smm
765209962Smm	VN_RELE(vp);
766209962Smm	return (dsl_deleg_access(zc->zc_name,
767209962Smm	    ZFS_DELEG_PERM_SHARE, cr));
768209962Smm}
769209962Smm
770185029Spjdint
771248571Smmzfs_secpolicy_share(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
772185029Spjd{
773185029Spjd	if (!INGLOBALZONE(curthread))
774249195Smm		return (SET_ERROR(EPERM));
775185029Spjd
776185029Spjd	if (secpolicy_nfs(cr) == 0) {
777185029Spjd		return (0);
778185029Spjd	} else {
779248571Smm		return (zfs_secpolicy_deleg_share(zc, innvl, cr));
780209962Smm	}
781209962Smm}
782185029Spjd
783209962Smmint
784248571Smmzfs_secpolicy_smb_acl(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
785209962Smm{
786209962Smm	if (!INGLOBALZONE(curthread))
787249195Smm		return (SET_ERROR(EPERM));
788185029Spjd
789209962Smm	if (secpolicy_smb(cr) == 0) {
790209962Smm		return (0);
791209962Smm	} else {
792248571Smm		return (zfs_secpolicy_deleg_share(zc, innvl, cr));
793185029Spjd	}
794185029Spjd}
795185029Spjd
/*
 * Compute the parent of a dataset or snapshot name.
 *
 * datasetname - name such as "pool/fs" or "pool/fs@snap".
 * parent      - output buffer; receives datasetname with the final
 *               "@snap" component removed, or the final "/child"
 *               component if there is no '@'.
 * parentsize  - size of the parent buffer in bytes.
 *
 * Returns 0 on success, or ENOENT if the name contains neither '@' nor
 * '/' (i.e. it has no parent).
 */
static int
zfs_get_parent(const char *datasetname, char *parent, int parentsize)
{
	char *cp;

	/*
	 * strlcpy() always NUL-terminates, unlike strncpy(), so the
	 * strrchr() calls below can never run off the end of 'parent'
	 * when datasetname is too long for the buffer.
	 */
	(void) strlcpy(parent, datasetname, parentsize);

	/*
	 * Remove the @bla or /bla from the end of the name to get the parent.
	 */
	cp = strrchr(parent, '@');
	if (cp == NULL)
		cp = strrchr(parent, '/');
	if (cp == NULL)
		return (SET_ERROR(ENOENT));

	cp[0] = '\0';
	return (0);
}
817185029Spjd
818185029Spjdint
819185029Spjdzfs_secpolicy_destroy_perms(const char *name, cred_t *cr)
820185029Spjd{
821185029Spjd	int error;
822185029Spjd
823185029Spjd	if ((error = zfs_secpolicy_write_perms(name,
824185029Spjd	    ZFS_DELEG_PERM_MOUNT, cr)) != 0)
825185029Spjd		return (error);
826185029Spjd
827185029Spjd	return (zfs_secpolicy_write_perms(name, ZFS_DELEG_PERM_DESTROY, cr));
828185029Spjd}
829185029Spjd
830248571Smm/* ARGSUSED */
831185029Spjdstatic int
832248571Smmzfs_secpolicy_destroy(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
833185029Spjd{
834185029Spjd	return (zfs_secpolicy_destroy_perms(zc->zc_name, cr));
835185029Spjd}
836185029Spjd
837185029Spjd/*
838219089Spjd * Destroying snapshots with delegated permissions requires
839248571Smm * descendant mount and destroy permissions.
840185029Spjd */
841248571Smm/* ARGSUSED */
842185029Spjdstatic int
843248571Smmzfs_secpolicy_destroy_snaps(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
844185029Spjd{
845248571Smm	nvlist_t *snaps;
846248571Smm	nvpair_t *pair, *nextpair;
847248571Smm	int error = 0;
848219089Spjd
849248571Smm	if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
850249195Smm		return (SET_ERROR(EINVAL));
851248571Smm	for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
852248571Smm	    pair = nextpair) {
853248571Smm		dsl_pool_t *dp;
854248571Smm		dsl_dataset_t *ds;
855219089Spjd
856248571Smm		error = dsl_pool_hold(nvpair_name(pair), FTAG, &dp);
857248571Smm		if (error != 0)
858248571Smm			break;
859248571Smm		nextpair = nvlist_next_nvpair(snaps, pair);
860248571Smm		error = dsl_dataset_hold(dp, nvpair_name(pair), FTAG, &ds);
861248571Smm		if (error == 0)
862248571Smm			dsl_dataset_rele(ds, FTAG);
863248571Smm		dsl_pool_rele(dp, FTAG);
864219089Spjd
865248571Smm		if (error == 0) {
866248571Smm			error = zfs_secpolicy_destroy_perms(nvpair_name(pair),
867248571Smm			    cr);
868248571Smm		} else if (error == ENOENT) {
869248571Smm			/*
870248571Smm			 * Ignore any snapshots that don't exist (we consider
871248571Smm			 * them "already destroyed").  Remove the name from the
872248571Smm			 * nvl here in case the snapshot is created between
873248571Smm			 * now and when we try to destroy it (in which case
874248571Smm			 * we don't want to destroy it since we haven't
875248571Smm			 * checked for permission).
876248571Smm			 */
877248571Smm			fnvlist_remove_nvpair(snaps, pair);
878248571Smm			error = 0;
879248571Smm		}
880248571Smm		if (error != 0)
881248571Smm			break;
882248571Smm	}
883222050Smm
884219089Spjd	return (error);
885185029Spjd}
886185029Spjd
887185029Spjdint
888185029Spjdzfs_secpolicy_rename_perms(const char *from, const char *to, cred_t *cr)
889185029Spjd{
890219089Spjd	char	parentname[MAXNAMELEN];
891185029Spjd	int	error;
892185029Spjd
893185029Spjd	if ((error = zfs_secpolicy_write_perms(from,
894185029Spjd	    ZFS_DELEG_PERM_RENAME, cr)) != 0)
895185029Spjd		return (error);
896185029Spjd
897185029Spjd	if ((error = zfs_secpolicy_write_perms(from,
898185029Spjd	    ZFS_DELEG_PERM_MOUNT, cr)) != 0)
899185029Spjd		return (error);
900185029Spjd
901185029Spjd	if ((error = zfs_get_parent(to, parentname,
902185029Spjd	    sizeof (parentname))) != 0)
903185029Spjd		return (error);
904185029Spjd
905185029Spjd	if ((error = zfs_secpolicy_write_perms(parentname,
906185029Spjd	    ZFS_DELEG_PERM_CREATE, cr)) != 0)
907185029Spjd		return (error);
908185029Spjd
909185029Spjd	if ((error = zfs_secpolicy_write_perms(parentname,
910185029Spjd	    ZFS_DELEG_PERM_MOUNT, cr)) != 0)
911185029Spjd		return (error);
912185029Spjd
913185029Spjd	return (error);
914185029Spjd}
915185029Spjd
916248571Smm/* ARGSUSED */
917185029Spjdstatic int
918248571Smmzfs_secpolicy_rename(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
919185029Spjd{
920240870Spjd	char *at = NULL;
921240870Spjd	int error;
922240870Spjd
923240870Spjd	if ((zc->zc_cookie & 1) != 0) {
924240870Spjd		/*
925240870Spjd		 * This is recursive rename, so the starting snapshot might
926240870Spjd		 * not exist. Check file system or volume permission instead.
927240870Spjd		 */
928240870Spjd		at = strchr(zc->zc_name, '@');
929240870Spjd		if (at == NULL)
930240870Spjd			return (EINVAL);
931240870Spjd		*at = '\0';
932240870Spjd	}
933240870Spjd
934240870Spjd	error = zfs_secpolicy_rename_perms(zc->zc_name, zc->zc_value, cr);
935240870Spjd
936240870Spjd	if (at != NULL)
937240870Spjd		*at = '@';
938240870Spjd
939240870Spjd	return (error);
940185029Spjd}
941185029Spjd
942248571Smm/* ARGSUSED */
943185029Spjdstatic int
944248571Smmzfs_secpolicy_promote(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
945185029Spjd{
946248571Smm	dsl_pool_t *dp;
947248571Smm	dsl_dataset_t *clone;
948185029Spjd	int error;
949185029Spjd
950185029Spjd	error = zfs_secpolicy_write_perms(zc->zc_name,
951185029Spjd	    ZFS_DELEG_PERM_PROMOTE, cr);
952248571Smm	if (error != 0)
953185029Spjd		return (error);
954185029Spjd
955248571Smm	error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
956248571Smm	if (error != 0)
957248571Smm		return (error);
958185029Spjd
959248571Smm	error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &clone);
960248571Smm
961185029Spjd	if (error == 0) {
962248571Smm		char parentname[MAXNAMELEN];
963248571Smm		dsl_dataset_t *origin = NULL;
964185029Spjd		dsl_dir_t *dd;
965248571Smm		dd = clone->ds_dir;
966185029Spjd
967185029Spjd		error = dsl_dataset_hold_obj(dd->dd_pool,
968248571Smm		    dd->dd_phys->dd_origin_obj, FTAG, &origin);
969248571Smm		if (error != 0) {
970248571Smm			dsl_dataset_rele(clone, FTAG);
971248571Smm			dsl_pool_rele(dp, FTAG);
972185029Spjd			return (error);
973185029Spjd		}
974185029Spjd
975248571Smm		error = zfs_secpolicy_write_perms_ds(zc->zc_name, clone,
976185029Spjd		    ZFS_DELEG_PERM_MOUNT, cr);
977185029Spjd
978248571Smm		dsl_dataset_name(origin, parentname);
979248571Smm		if (error == 0) {
980248571Smm			error = zfs_secpolicy_write_perms_ds(parentname, origin,
981185029Spjd			    ZFS_DELEG_PERM_PROMOTE, cr);
982248571Smm		}
983248571Smm		dsl_dataset_rele(clone, FTAG);
984248571Smm		dsl_dataset_rele(origin, FTAG);
985168404Spjd	}
986248571Smm	dsl_pool_rele(dp, FTAG);
987185029Spjd	return (error);
988185029Spjd}
989168404Spjd
990248571Smm/* ARGSUSED */
991185029Spjdstatic int
992248571Smmzfs_secpolicy_recv(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
993185029Spjd{
994185029Spjd	int error;
995185029Spjd
996185029Spjd	if ((error = zfs_secpolicy_write_perms(zc->zc_name,
997185029Spjd	    ZFS_DELEG_PERM_RECEIVE, cr)) != 0)
998185029Spjd		return (error);
999185029Spjd
1000185029Spjd	if ((error = zfs_secpolicy_write_perms(zc->zc_name,
1001185029Spjd	    ZFS_DELEG_PERM_MOUNT, cr)) != 0)
1002185029Spjd		return (error);
1003185029Spjd
1004185029Spjd	return (zfs_secpolicy_write_perms(zc->zc_name,
1005185029Spjd	    ZFS_DELEG_PERM_CREATE, cr));
1006168404Spjd}
1007168404Spjd
1008185029Spjdint
1009185029Spjdzfs_secpolicy_snapshot_perms(const char *name, cred_t *cr)
1010185029Spjd{
1011219089Spjd	return (zfs_secpolicy_write_perms(name,
1012219089Spjd	    ZFS_DELEG_PERM_SNAPSHOT, cr));
1013185029Spjd}
1014185029Spjd
1015248571Smm/*
1016248571Smm * Check for permission to create each snapshot in the nvlist.
1017248571Smm */
1018248571Smm/* ARGSUSED */
1019185029Spjdstatic int
1020248571Smmzfs_secpolicy_snapshot(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1021185029Spjd{
1022248571Smm	nvlist_t *snaps;
1023248571Smm	int error;
1024248571Smm	nvpair_t *pair;
1025185029Spjd
1026248571Smm	if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
1027249195Smm		return (SET_ERROR(EINVAL));
1028248571Smm	for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
1029248571Smm	    pair = nvlist_next_nvpair(snaps, pair)) {
1030248571Smm		char *name = nvpair_name(pair);
1031248571Smm		char *atp = strchr(name, '@');
1032248571Smm
1033248571Smm		if (atp == NULL) {
1034249195Smm			error = SET_ERROR(EINVAL);
1035248571Smm			break;
1036248571Smm		}
1037248571Smm		*atp = '\0';
1038248571Smm		error = zfs_secpolicy_snapshot_perms(name, cr);
1039248571Smm		*atp = '@';
1040248571Smm		if (error != 0)
1041248571Smm			break;
1042248571Smm	}
1043248571Smm	return (error);
1044185029Spjd}
1045185029Spjd
1046248571Smm/* ARGSUSED */
1047185029Spjdstatic int
1048248571Smmzfs_secpolicy_log_history(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1049185029Spjd{
1050248571Smm	/*
1051248571Smm	 * Even root must have a proper TSD so that we know what pool
1052248571Smm	 * to log to.
1053248571Smm	 */
1054248571Smm	if (tsd_get(zfs_allow_log_key) == NULL)
1055249195Smm		return (SET_ERROR(EPERM));
1056248571Smm	return (0);
1057248571Smm}
1058248571Smm
1059248571Smmstatic int
1060248571Smmzfs_secpolicy_create_clone(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1061248571Smm{
1062219089Spjd	char	parentname[MAXNAMELEN];
1063219089Spjd	int	error;
1064248571Smm	char	*origin;
1065185029Spjd
1066185029Spjd	if ((error = zfs_get_parent(zc->zc_name, parentname,
1067185029Spjd	    sizeof (parentname))) != 0)
1068185029Spjd		return (error);
1069185029Spjd
1070248571Smm	if (nvlist_lookup_string(innvl, "origin", &origin) == 0 &&
1071248571Smm	    (error = zfs_secpolicy_write_perms(origin,
1072248571Smm	    ZFS_DELEG_PERM_CLONE, cr)) != 0)
1073248571Smm		return (error);
1074185029Spjd
1075185029Spjd	if ((error = zfs_secpolicy_write_perms(parentname,
1076185029Spjd	    ZFS_DELEG_PERM_CREATE, cr)) != 0)
1077185029Spjd		return (error);
1078185029Spjd
1079248571Smm	return (zfs_secpolicy_write_perms(parentname,
1080248571Smm	    ZFS_DELEG_PERM_MOUNT, cr));
1081185029Spjd}
1082185029Spjd
1083168404Spjd/*
1084168404Spjd * Policy for pool operations - create/destroy pools, add vdevs, etc.  Requires
1085168404Spjd * SYS_CONFIG privilege, which is not available in a local zone.
1086168404Spjd */
1087168404Spjd/* ARGSUSED */
1088168404Spjdstatic int
1089248571Smmzfs_secpolicy_config(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1090168404Spjd{
1091168404Spjd	if (secpolicy_sys_config(cr, B_FALSE) != 0)
1092249195Smm		return (SET_ERROR(EPERM));
1093168404Spjd
1094168404Spjd	return (0);
1095168404Spjd}
1096168404Spjd
1097168404Spjd/*
1098219089Spjd * Policy for object to name lookups.
1099185029Spjd */
1100219089Spjd/* ARGSUSED */
1101185029Spjdstatic int
1102248571Smmzfs_secpolicy_diff(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1103185029Spjd{
1104219089Spjd	int error;
1105185029Spjd
1106219089Spjd	if ((error = secpolicy_sys_config(cr, B_FALSE)) == 0)
1107219089Spjd		return (0);
1108219089Spjd
1109219089Spjd	error = zfs_secpolicy_write_perms(zc->zc_name, ZFS_DELEG_PERM_DIFF, cr);
1110219089Spjd	return (error);
1111185029Spjd}
1112185029Spjd
1113185029Spjd/*
1114168404Spjd * Policy for fault injection.  Requires all privileges.
1115168404Spjd */
1116168404Spjd/* ARGSUSED */
1117168404Spjdstatic int
1118248571Smmzfs_secpolicy_inject(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1119168404Spjd{
1120168404Spjd	return (secpolicy_zinject(cr));
1121168404Spjd}
1122168404Spjd
1123248571Smm/* ARGSUSED */
1124185029Spjdstatic int
1125248571Smmzfs_secpolicy_inherit_prop(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1126185029Spjd{
1127185029Spjd	zfs_prop_t prop = zfs_name_to_prop(zc->zc_value);
1128185029Spjd
1129185029Spjd	if (prop == ZPROP_INVAL) {
1130185029Spjd		if (!zfs_prop_user(zc->zc_value))
1131249195Smm			return (SET_ERROR(EINVAL));
1132185029Spjd		return (zfs_secpolicy_write_perms(zc->zc_name,
1133185029Spjd		    ZFS_DELEG_PERM_USERPROP, cr));
1134185029Spjd	} else {
1135219089Spjd		return (zfs_secpolicy_setprop(zc->zc_name, prop,
1136219089Spjd		    NULL, cr));
1137185029Spjd	}
1138185029Spjd}
1139185029Spjd
1140168404Spjdstatic int
1141248571Smmzfs_secpolicy_userspace_one(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1142209962Smm{
1143248571Smm	int err = zfs_secpolicy_read(zc, innvl, cr);
1144209962Smm	if (err)
1145209962Smm		return (err);
1146209962Smm
1147209962Smm	if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
1148249195Smm		return (SET_ERROR(EINVAL));
1149209962Smm
1150209962Smm	if (zc->zc_value[0] == 0) {
1151209962Smm		/*
1152209962Smm		 * They are asking about a posix uid/gid.  If it's
1153209962Smm		 * themself, allow it.
1154209962Smm		 */
1155209962Smm		if (zc->zc_objset_type == ZFS_PROP_USERUSED ||
1156209962Smm		    zc->zc_objset_type == ZFS_PROP_USERQUOTA) {
1157209962Smm			if (zc->zc_guid == crgetuid(cr))
1158209962Smm				return (0);
1159209962Smm		} else {
1160209962Smm			if (groupmember(zc->zc_guid, cr))
1161209962Smm				return (0);
1162209962Smm		}
1163209962Smm	}
1164209962Smm
1165209962Smm	return (zfs_secpolicy_write_perms(zc->zc_name,
1166209962Smm	    userquota_perms[zc->zc_objset_type], cr));
1167209962Smm}
1168209962Smm
1169209962Smmstatic int
1170248571Smmzfs_secpolicy_userspace_many(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1171209962Smm{
1172248571Smm	int err = zfs_secpolicy_read(zc, innvl, cr);
1173209962Smm	if (err)
1174209962Smm		return (err);
1175209962Smm
1176209962Smm	if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
1177249195Smm		return (SET_ERROR(EINVAL));
1178209962Smm
1179209962Smm	return (zfs_secpolicy_write_perms(zc->zc_name,
1180209962Smm	    userquota_perms[zc->zc_objset_type], cr));
1181209962Smm}
1182209962Smm
1183248571Smm/* ARGSUSED */
1184209962Smmstatic int
1185248571Smmzfs_secpolicy_userspace_upgrade(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1186209962Smm{
1187219089Spjd	return (zfs_secpolicy_setprop(zc->zc_name, ZFS_PROP_VERSION,
1188219089Spjd	    NULL, cr));
1189209962Smm}
1190209962Smm
1191248571Smm/* ARGSUSED */
1192219089Spjdstatic int
1193248571Smmzfs_secpolicy_hold(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1194219089Spjd{
1195248571Smm	nvpair_t *pair;
1196248571Smm	nvlist_t *holds;
1197248571Smm	int error;
1198248571Smm
1199248571Smm	error = nvlist_lookup_nvlist(innvl, "holds", &holds);
1200248571Smm	if (error != 0)
1201249195Smm		return (SET_ERROR(EINVAL));
1202248571Smm
1203248571Smm	for (pair = nvlist_next_nvpair(holds, NULL); pair != NULL;
1204248571Smm	    pair = nvlist_next_nvpair(holds, pair)) {
1205248571Smm		char fsname[MAXNAMELEN];
1206248571Smm		error = dmu_fsname(nvpair_name(pair), fsname);
1207248571Smm		if (error != 0)
1208248571Smm			return (error);
1209248571Smm		error = zfs_secpolicy_write_perms(fsname,
1210248571Smm		    ZFS_DELEG_PERM_HOLD, cr);
1211248571Smm		if (error != 0)
1212248571Smm			return (error);
1213248571Smm	}
1214248571Smm	return (0);
1215219089Spjd}
1216219089Spjd
1217248571Smm/* ARGSUSED */
1218219089Spjdstatic int
1219248571Smmzfs_secpolicy_release(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1220219089Spjd{
1221248571Smm	nvpair_t *pair;
1222248571Smm	int error;
1223248571Smm
1224248571Smm	for (pair = nvlist_next_nvpair(innvl, NULL); pair != NULL;
1225248571Smm	    pair = nvlist_next_nvpair(innvl, pair)) {
1226248571Smm		char fsname[MAXNAMELEN];
1227248571Smm		error = dmu_fsname(nvpair_name(pair), fsname);
1228248571Smm		if (error != 0)
1229248571Smm			return (error);
1230248571Smm		error = zfs_secpolicy_write_perms(fsname,
1231248571Smm		    ZFS_DELEG_PERM_RELEASE, cr);
1232248571Smm		if (error != 0)
1233248571Smm			return (error);
1234248571Smm	}
1235248571Smm	return (0);
1236219089Spjd}
1237219089Spjd
1238168404Spjd/*
1239219089Spjd * Policy for allowing temporary snapshots to be taken or released
1240219089Spjd */
1241219089Spjdstatic int
1242248571Smmzfs_secpolicy_tmp_snapshot(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
1243219089Spjd{
1244219089Spjd	/*
1245219089Spjd	 * A temporary snapshot is the same as a snapshot,
1246219089Spjd	 * hold, destroy and release all rolled into one.
1247219089Spjd	 * Delegated diff alone is sufficient that we allow this.
1248219089Spjd	 */
1249219089Spjd	int error;
1250219089Spjd
1251219089Spjd	if ((error = zfs_secpolicy_write_perms(zc->zc_name,
1252219089Spjd	    ZFS_DELEG_PERM_DIFF, cr)) == 0)
1253219089Spjd		return (0);
1254219089Spjd
1255248571Smm	error = zfs_secpolicy_snapshot_perms(zc->zc_name, cr);
1256248571Smm	if (error == 0)
1257248571Smm		error = zfs_secpolicy_hold(zc, innvl, cr);
1258248571Smm	if (error == 0)
1259248571Smm		error = zfs_secpolicy_release(zc, innvl, cr);
1260248571Smm	if (error == 0)
1261248571Smm		error = zfs_secpolicy_destroy(zc, innvl, cr);
1262219089Spjd	return (error);
1263219089Spjd}
1264219089Spjd
1265219089Spjd/*
1266168404Spjd * Returns the nvlist as specified by the user in the zfs_cmd_t.
1267168404Spjd */
1268168404Spjdstatic int
1269219089Spjdget_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp)
1270168404Spjd{
1271168404Spjd	char *packed;
1272168404Spjd	int error;
1273185029Spjd	nvlist_t *list = NULL;
1274168404Spjd
1275168404Spjd	/*
1276168404Spjd	 * Read in and unpack the user-supplied nvlist.
1277168404Spjd	 */
1278185029Spjd	if (size == 0)
1279249195Smm		return (SET_ERROR(EINVAL));
1280168404Spjd
1281168404Spjd	packed = kmem_alloc(size, KM_SLEEP);
1282168404Spjd
1283219089Spjd	if ((error = ddi_copyin((void *)(uintptr_t)nvl, packed, size,
1284219089Spjd	    iflag)) != 0) {
1285168404Spjd		kmem_free(packed, size);
1286168404Spjd		return (error);
1287168404Spjd	}
1288168404Spjd
1289185029Spjd	if ((error = nvlist_unpack(packed, size, &list, 0)) != 0) {
1290168404Spjd		kmem_free(packed, size);
1291168404Spjd		return (error);
1292168404Spjd	}
1293168404Spjd
1294168404Spjd	kmem_free(packed, size);
1295168404Spjd
1296185029Spjd	*nvp = list;
1297168404Spjd	return (0);
1298168404Spjd}
1299168404Spjd
1300248571Smm/*
1301248571Smm * Reduce the size of this nvlist until it can be serialized in 'max' bytes.
1302248571Smm * Entries will be removed from the end of the nvlist, and one int32 entry
1303248571Smm * named "N_MORE_ERRORS" will be added indicating how many entries were
1304248571Smm * removed.
1305248571Smm */
1306168404Spjdstatic int
1307248571Smmnvlist_smush(nvlist_t *errors, size_t max)
1308219089Spjd{
1309219089Spjd	size_t size;
1310219089Spjd
1311248571Smm	size = fnvlist_size(errors);
1312219089Spjd
1313248571Smm	if (size > max) {
1314219089Spjd		nvpair_t *more_errors;
1315219089Spjd		int n = 0;
1316219089Spjd
1317248571Smm		if (max < 1024)
1318249195Smm			return (SET_ERROR(ENOMEM));
1319219089Spjd
1320248571Smm		fnvlist_add_int32(errors, ZPROP_N_MORE_ERRORS, 0);
1321248571Smm		more_errors = nvlist_prev_nvpair(errors, NULL);
1322219089Spjd
1323219089Spjd		do {
1324248571Smm			nvpair_t *pair = nvlist_prev_nvpair(errors,
1325219089Spjd			    more_errors);
1326248571Smm			fnvlist_remove_nvpair(errors, pair);
1327219089Spjd			n++;
1328248571Smm			size = fnvlist_size(errors);
1329248571Smm		} while (size > max);
1330219089Spjd
1331248571Smm		fnvlist_remove_nvpair(errors, more_errors);
1332248571Smm		fnvlist_add_int32(errors, ZPROP_N_MORE_ERRORS, n);
1333248571Smm		ASSERT3U(fnvlist_size(errors), <=, max);
1334219089Spjd	}
1335219089Spjd
1336219089Spjd	return (0);
1337219089Spjd}
1338219089Spjd
1339219089Spjdstatic int
1340168404Spjdput_nvlist(zfs_cmd_t *zc, nvlist_t *nvl)
1341168404Spjd{
1342168404Spjd	char *packed = NULL;
1343219089Spjd	int error = 0;
1344168404Spjd	size_t size;
1345168404Spjd
1346248571Smm	size = fnvlist_size(nvl);
1347168404Spjd
1348168404Spjd	if (size > zc->zc_nvlist_dst_size) {
1349168404Spjd		/*
1350168404Spjd		 * Solaris returns ENOMEM here, because even if an error is
1351168404Spjd		 * returned from an ioctl(2), new zc_nvlist_dst_size will be
1352168404Spjd		 * passed to the userland. This is not the case for FreeBSD.
1353168404Spjd		 * We need to return 0, so the kernel will copy the
1354168404Spjd		 * zc_nvlist_dst_size back and the userland can discover that a
1355168404Spjd		 * bigger buffer is needed.
1356168404Spjd		 */
1357168404Spjd		error = 0;
1358168404Spjd	} else {
1359248571Smm		packed = fnvlist_pack(nvl, &size);
1360219089Spjd		if (ddi_copyout(packed, (void *)(uintptr_t)zc->zc_nvlist_dst,
1361219089Spjd		    size, zc->zc_iflags) != 0)
1362249195Smm			error = SET_ERROR(EFAULT);
1363248571Smm		fnvlist_pack_free(packed, size);
1364168404Spjd	}
1365168404Spjd
1366168404Spjd	zc->zc_nvlist_dst_size = size;
1367248571Smm	zc->zc_nvlist_dst_filled = B_TRUE;
1368168404Spjd	return (error);
1369168404Spjd}
1370168404Spjd
1371168404Spjdstatic int
1372219089Spjdgetzfsvfs(const char *dsname, zfsvfs_t **zfvp)
1373209962Smm{
1374209962Smm	objset_t *os;
1375209962Smm	int error;
1376209962Smm
1377219089Spjd	error = dmu_objset_hold(dsname, FTAG, &os);
1378248571Smm	if (error != 0)
1379209962Smm		return (error);
1380219089Spjd	if (dmu_objset_type(os) != DMU_OST_ZFS) {
1381219089Spjd		dmu_objset_rele(os, FTAG);
1382249195Smm		return (SET_ERROR(EINVAL));
1383219089Spjd	}
1384209962Smm
1385219089Spjd	mutex_enter(&os->os_user_ptr_lock);
1386219089Spjd	*zfvp = dmu_objset_get_user(os);
1387219089Spjd	if (*zfvp) {
1388219089Spjd		VFS_HOLD((*zfvp)->z_vfs);
1389209962Smm	} else {
1390249195Smm		error = SET_ERROR(ESRCH);
1391209962Smm	}
1392219089Spjd	mutex_exit(&os->os_user_ptr_lock);
1393219089Spjd	dmu_objset_rele(os, FTAG);
1394209962Smm	return (error);
1395209962Smm}
1396209962Smm
1397209962Smm/*
1398209962Smm * Find a zfsvfs_t for a mounted filesystem, or create our own, in which
1399209962Smm * case its z_vfs will be NULL, and it will be opened as the owner.
1400236884Smm * If 'writer' is set, the z_teardown_lock will be held for RW_WRITER,
1401236884Smm * which prevents all vnode ops from running.
1402209962Smm */
1403209962Smmstatic int
1404219089Spjdzfsvfs_hold(const char *name, void *tag, zfsvfs_t **zfvp, boolean_t writer)
1405209962Smm{
1406209962Smm	int error = 0;
1407209962Smm
1408219089Spjd	if (getzfsvfs(name, zfvp) != 0)
1409219089Spjd		error = zfsvfs_create(name, zfvp);
1410209962Smm	if (error == 0) {
1411219089Spjd		rrw_enter(&(*zfvp)->z_teardown_lock, (writer) ? RW_WRITER :
1412219089Spjd		    RW_READER, tag);
1413219089Spjd		if ((*zfvp)->z_unmounted) {
1414209962Smm			/*
1415209962Smm			 * XXX we could probably try again, since the unmounting
1416209962Smm			 * thread should be just about to disassociate the
1417209962Smm			 * objset from the zfsvfs.
1418209962Smm			 */
1419219089Spjd			rrw_exit(&(*zfvp)->z_teardown_lock, tag);
1420249195Smm			return (SET_ERROR(EBUSY));
1421209962Smm		}
1422209962Smm	}
1423209962Smm	return (error);
1424209962Smm}
1425209962Smm
1426209962Smmstatic void
1427209962Smmzfsvfs_rele(zfsvfs_t *zfsvfs, void *tag)
1428209962Smm{
1429209962Smm	rrw_exit(&zfsvfs->z_teardown_lock, tag);
1430209962Smm
1431209962Smm	if (zfsvfs->z_vfs) {
1432209962Smm		VFS_RELE(zfsvfs->z_vfs);
1433209962Smm	} else {
1434219089Spjd		dmu_objset_disown(zfsvfs->z_os, zfsvfs);
1435209962Smm		zfsvfs_free(zfsvfs);
1436209962Smm	}
1437209962Smm}
1438209962Smm
1439209962Smmstatic int
1440168404Spjdzfs_ioc_pool_create(zfs_cmd_t *zc)
1441168404Spjd{
1442168404Spjd	int error;
1443185029Spjd	nvlist_t *config, *props = NULL;
1444185029Spjd	nvlist_t *rootprops = NULL;
1445185029Spjd	nvlist_t *zplprops = NULL;
1446168404Spjd
1447185029Spjd	if (error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1448219089Spjd	    zc->zc_iflags, &config))
1449168404Spjd		return (error);
1450168404Spjd
1451185029Spjd	if (zc->zc_nvlist_src_size != 0 && (error =
1452219089Spjd	    get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1453219089Spjd	    zc->zc_iflags, &props))) {
1454185029Spjd		nvlist_free(config);
1455185029Spjd		return (error);
1456185029Spjd	}
1457168404Spjd
1458185029Spjd	if (props) {
1459185029Spjd		nvlist_t *nvl = NULL;
1460185029Spjd		uint64_t version = SPA_VERSION;
1461185029Spjd
1462185029Spjd		(void) nvlist_lookup_uint64(props,
1463185029Spjd		    zpool_prop_to_name(ZPOOL_PROP_VERSION), &version);
1464236884Smm		if (!SPA_VERSION_IS_SUPPORTED(version)) {
1465249195Smm			error = SET_ERROR(EINVAL);
1466185029Spjd			goto pool_props_bad;
1467185029Spjd		}
1468185029Spjd		(void) nvlist_lookup_nvlist(props, ZPOOL_ROOTFS_PROPS, &nvl);
1469185029Spjd		if (nvl) {
1470185029Spjd			error = nvlist_dup(nvl, &rootprops, KM_SLEEP);
1471185029Spjd			if (error != 0) {
1472185029Spjd				nvlist_free(config);
1473185029Spjd				nvlist_free(props);
1474185029Spjd				return (error);
1475185029Spjd			}
1476185029Spjd			(void) nvlist_remove_all(props, ZPOOL_ROOTFS_PROPS);
1477185029Spjd		}
1478185029Spjd		VERIFY(nvlist_alloc(&zplprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
1479185029Spjd		error = zfs_fill_zplprops_root(version, rootprops,
1480185029Spjd		    zplprops, NULL);
1481248571Smm		if (error != 0)
1482185029Spjd			goto pool_props_bad;
1483185029Spjd	}
1484185029Spjd
1485248571Smm	error = spa_create(zc->zc_name, config, props, zplprops);
1486185029Spjd
1487185029Spjd	/*
1488185029Spjd	 * Set the remaining root properties
1489185029Spjd	 */
1490219089Spjd	if (!error && (error = zfs_set_prop_nvlist(zc->zc_name,
1491219089Spjd	    ZPROP_SRC_LOCAL, rootprops, NULL)) != 0)
1492185029Spjd		(void) spa_destroy(zc->zc_name);
1493185029Spjd
1494185029Spjdpool_props_bad:
1495185029Spjd	nvlist_free(rootprops);
1496185029Spjd	nvlist_free(zplprops);
1497168404Spjd	nvlist_free(config);
1498185029Spjd	nvlist_free(props);
1499168404Spjd
1500168404Spjd	return (error);
1501168404Spjd}
1502168404Spjd
1503168404Spjdstatic int
1504168404Spjdzfs_ioc_pool_destroy(zfs_cmd_t *zc)
1505168404Spjd{
1506185029Spjd	int error;
1507185029Spjd	zfs_log_history(zc);
1508185029Spjd	error = spa_destroy(zc->zc_name);
1509219089Spjd	if (error == 0)
1510219089Spjd		zvol_remove_minors(zc->zc_name);
1511185029Spjd	return (error);
1512168404Spjd}
1513168404Spjd
1514168404Spjdstatic int
1515168404Spjdzfs_ioc_pool_import(zfs_cmd_t *zc)
1516168404Spjd{
1517185029Spjd	nvlist_t *config, *props = NULL;
1518168404Spjd	uint64_t guid;
1519219089Spjd	int error;
1520168404Spjd
1521185029Spjd	if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1522219089Spjd	    zc->zc_iflags, &config)) != 0)
1523168404Spjd		return (error);
1524168404Spjd
1525185029Spjd	if (zc->zc_nvlist_src_size != 0 && (error =
1526219089Spjd	    get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1527219089Spjd	    zc->zc_iflags, &props))) {
1528185029Spjd		nvlist_free(config);
1529185029Spjd		return (error);
1530185029Spjd	}
1531185029Spjd
1532168404Spjd	if (nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID, &guid) != 0 ||
1533168404Spjd	    guid != zc->zc_guid)
1534249195Smm		error = SET_ERROR(EINVAL);
1535168404Spjd	else
1536219089Spjd		error = spa_import(zc->zc_name, config, props, zc->zc_cookie);
1537168404Spjd
1538219089Spjd	if (zc->zc_nvlist_dst != 0) {
1539219089Spjd		int err;
1540219089Spjd
1541219089Spjd		if ((err = put_nvlist(zc, config)) != 0)
1542219089Spjd			error = err;
1543219089Spjd	}
1544219089Spjd
1545168404Spjd	nvlist_free(config);
1546168404Spjd
1547185029Spjd	if (props)
1548185029Spjd		nvlist_free(props);
1549185029Spjd
1550168404Spjd	return (error);
1551168404Spjd}
1552168404Spjd
1553168404Spjdstatic int
1554168404Spjdzfs_ioc_pool_export(zfs_cmd_t *zc)
1555168404Spjd{
1556185029Spjd	int error;
1557185029Spjd	boolean_t force = (boolean_t)zc->zc_cookie;
1558207670Smm	boolean_t hardforce = (boolean_t)zc->zc_guid;
1559185029Spjd
1560185029Spjd	zfs_log_history(zc);
1561207670Smm	error = spa_export(zc->zc_name, NULL, force, hardforce);
1562219089Spjd	if (error == 0)
1563219089Spjd		zvol_remove_minors(zc->zc_name);
1564185029Spjd	return (error);
1565168404Spjd}
1566168404Spjd
1567168404Spjdstatic int
1568168404Spjdzfs_ioc_pool_configs(zfs_cmd_t *zc)
1569168404Spjd{
1570168404Spjd	nvlist_t *configs;
1571168404Spjd	int error;
1572168404Spjd
1573168404Spjd	if ((configs = spa_all_configs(&zc->zc_cookie)) == NULL)
1574249195Smm		return (SET_ERROR(EEXIST));
1575168404Spjd
1576168404Spjd	error = put_nvlist(zc, configs);
1577168404Spjd
1578168404Spjd	nvlist_free(configs);
1579168404Spjd
1580168404Spjd	return (error);
1581168404Spjd}
1582168404Spjd
1583236884Smm/*
1584236884Smm * inputs:
1585236884Smm * zc_name		name of the pool
1586236884Smm *
1587236884Smm * outputs:
1588236884Smm * zc_cookie		real errno
1589236884Smm * zc_nvlist_dst	config nvlist
1590236884Smm * zc_nvlist_dst_size	size of config nvlist
1591236884Smm */
1592168404Spjdstatic int
1593168404Spjdzfs_ioc_pool_stats(zfs_cmd_t *zc)
1594168404Spjd{
1595168404Spjd	nvlist_t *config;
1596168404Spjd	int error;
1597168404Spjd	int ret = 0;
1598168404Spjd
1599168404Spjd	error = spa_get_stats(zc->zc_name, &config, zc->zc_value,
1600168404Spjd	    sizeof (zc->zc_value));
1601168404Spjd
1602168404Spjd	if (config != NULL) {
1603168404Spjd		ret = put_nvlist(zc, config);
1604168404Spjd		nvlist_free(config);
1605168404Spjd
1606168404Spjd		/*
1607168404Spjd		 * The config may be present even if 'error' is non-zero.
1608168404Spjd		 * In this case we return success, and preserve the real errno
1609168404Spjd		 * in 'zc_cookie'.
1610168404Spjd		 */
1611168404Spjd		zc->zc_cookie = error;
1612168404Spjd	} else {
1613168404Spjd		ret = error;
1614168404Spjd	}
1615168404Spjd
1616168404Spjd	return (ret);
1617168404Spjd}
1618168404Spjd
1619168404Spjd/*
1620168404Spjd * Try to import the given pool, returning pool stats as appropriate so that
1621168404Spjd * user land knows which devices are available and overall pool health.
1622168404Spjd */
1623168404Spjdstatic int
1624168404Spjdzfs_ioc_pool_tryimport(zfs_cmd_t *zc)
1625168404Spjd{
1626168404Spjd	nvlist_t *tryconfig, *config;
1627168404Spjd	int error;
1628168404Spjd
1629185029Spjd	if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1630219089Spjd	    zc->zc_iflags, &tryconfig)) != 0)
1631168404Spjd		return (error);
1632168404Spjd
1633168404Spjd	config = spa_tryimport(tryconfig);
1634168404Spjd
1635168404Spjd	nvlist_free(tryconfig);
1636168404Spjd
1637168404Spjd	if (config == NULL)
1638249195Smm		return (SET_ERROR(EINVAL));
1639168404Spjd
1640168404Spjd	error = put_nvlist(zc, config);
1641168404Spjd	nvlist_free(config);
1642168404Spjd
1643168404Spjd	return (error);
1644168404Spjd}
1645168404Spjd
1646219089Spjd/*
1647219089Spjd * inputs:
1648219089Spjd * zc_name              name of the pool
1649219089Spjd * zc_cookie            scan func (pool_scan_func_t)
1650219089Spjd */
1651168404Spjdstatic int
1652219089Spjdzfs_ioc_pool_scan(zfs_cmd_t *zc)
1653168404Spjd{
1654168404Spjd	spa_t *spa;
1655168404Spjd	int error;
1656168404Spjd
1657168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1658168404Spjd		return (error);
1659168404Spjd
1660219089Spjd	if (zc->zc_cookie == POOL_SCAN_NONE)
1661219089Spjd		error = spa_scan_stop(spa);
1662219089Spjd	else
1663219089Spjd		error = spa_scan(spa, zc->zc_cookie);
1664168404Spjd
1665168404Spjd	spa_close(spa, FTAG);
1666168404Spjd
1667168404Spjd	return (error);
1668168404Spjd}
1669168404Spjd
1670168404Spjdstatic int
1671168404Spjdzfs_ioc_pool_freeze(zfs_cmd_t *zc)
1672168404Spjd{
1673168404Spjd	spa_t *spa;
1674168404Spjd	int error;
1675168404Spjd
1676168404Spjd	error = spa_open(zc->zc_name, &spa, FTAG);
1677168404Spjd	if (error == 0) {
1678168404Spjd		spa_freeze(spa);
1679168404Spjd		spa_close(spa, FTAG);
1680168404Spjd	}
1681168404Spjd	return (error);
1682168404Spjd}
1683168404Spjd
1684168404Spjdstatic int
1685168404Spjdzfs_ioc_pool_upgrade(zfs_cmd_t *zc)
1686168404Spjd{
1687168404Spjd	spa_t *spa;
1688168404Spjd	int error;
1689168404Spjd
1690168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1691168404Spjd		return (error);
1692168404Spjd
1693236884Smm	if (zc->zc_cookie < spa_version(spa) ||
1694236884Smm	    !SPA_VERSION_IS_SUPPORTED(zc->zc_cookie)) {
1695185029Spjd		spa_close(spa, FTAG);
1696249195Smm		return (SET_ERROR(EINVAL));
1697185029Spjd	}
1698168404Spjd
1699185029Spjd	spa_upgrade(spa, zc->zc_cookie);
1700168404Spjd	spa_close(spa, FTAG);
1701168404Spjd
1702168404Spjd	return (error);
1703168404Spjd}
1704168404Spjd
1705168404Spjdstatic int
1706168404Spjdzfs_ioc_pool_get_history(zfs_cmd_t *zc)
1707168404Spjd{
1708168404Spjd	spa_t *spa;
1709168404Spjd	char *hist_buf;
1710168404Spjd	uint64_t size;
1711168404Spjd	int error;
1712168404Spjd
1713168404Spjd	if ((size = zc->zc_history_len) == 0)
1714249195Smm		return (SET_ERROR(EINVAL));
1715168404Spjd
1716168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1717168404Spjd		return (error);
1718168404Spjd
1719185029Spjd	if (spa_version(spa) < SPA_VERSION_ZPOOL_HISTORY) {
1720168404Spjd		spa_close(spa, FTAG);
1721249195Smm		return (SET_ERROR(ENOTSUP));
1722168404Spjd	}
1723168404Spjd
1724168404Spjd	hist_buf = kmem_alloc(size, KM_SLEEP);
1725168404Spjd	if ((error = spa_history_get(spa, &zc->zc_history_offset,
1726168404Spjd	    &zc->zc_history_len, hist_buf)) == 0) {
1727219089Spjd		error = ddi_copyout(hist_buf,
1728219089Spjd		    (void *)(uintptr_t)zc->zc_history,
1729219089Spjd		    zc->zc_history_len, zc->zc_iflags);
1730168404Spjd	}
1731168404Spjd
1732168404Spjd	spa_close(spa, FTAG);
1733168404Spjd	kmem_free(hist_buf, size);
1734168404Spjd	return (error);
1735168404Spjd}
1736168404Spjd
1737168404Spjdstatic int
1738228103Smmzfs_ioc_pool_reguid(zfs_cmd_t *zc)
1739228103Smm{
1740228103Smm	spa_t *spa;
1741228103Smm	int error;
1742228103Smm
1743228103Smm	error = spa_open(zc->zc_name, &spa, FTAG);
1744228103Smm	if (error == 0) {
1745228103Smm		error = spa_change_guid(spa);
1746228103Smm		spa_close(spa, FTAG);
1747228103Smm	}
1748228103Smm	return (error);
1749228103Smm}
1750228103Smm
1751228103Smmstatic int
1752168404Spjdzfs_ioc_dsobj_to_dsname(zfs_cmd_t *zc)
1753168404Spjd{
1754248571Smm	return (dsl_dsobj_to_dsname(zc->zc_name, zc->zc_obj, zc->zc_value));
1755168404Spjd}
1756168404Spjd
1757219089Spjd/*
1758219089Spjd * inputs:
1759219089Spjd * zc_name		name of filesystem
1760219089Spjd * zc_obj		object to find
1761219089Spjd *
1762219089Spjd * outputs:
1763219089Spjd * zc_value		name of object
1764219089Spjd */
1765168404Spjdstatic int
1766168404Spjdzfs_ioc_obj_to_path(zfs_cmd_t *zc)
1767168404Spjd{
1768219089Spjd	objset_t *os;
1769168404Spjd	int error;
1770168404Spjd
1771219089Spjd	/* XXX reading from objset not owned */
1772219089Spjd	if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1773168404Spjd		return (error);
1774219089Spjd	if (dmu_objset_type(os) != DMU_OST_ZFS) {
1775219089Spjd		dmu_objset_rele(os, FTAG);
1776249195Smm		return (SET_ERROR(EINVAL));
1777219089Spjd	}
1778219089Spjd	error = zfs_obj_to_path(os, zc->zc_obj, zc->zc_value,
1779168404Spjd	    sizeof (zc->zc_value));
1780219089Spjd	dmu_objset_rele(os, FTAG);
1781168404Spjd
1782168404Spjd	return (error);
1783168404Spjd}
1784168404Spjd
1785219089Spjd/*
1786219089Spjd * inputs:
1787219089Spjd * zc_name		name of filesystem
1788219089Spjd * zc_obj		object to find
1789219089Spjd *
1790219089Spjd * outputs:
1791219089Spjd * zc_stat		stats on object
1792219089Spjd * zc_value		path to object
1793219089Spjd */
1794168404Spjdstatic int
1795219089Spjdzfs_ioc_obj_to_stats(zfs_cmd_t *zc)
1796219089Spjd{
1797219089Spjd	objset_t *os;
1798219089Spjd	int error;
1799219089Spjd
1800219089Spjd	/* XXX reading from objset not owned */
1801219089Spjd	if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1802219089Spjd		return (error);
1803219089Spjd	if (dmu_objset_type(os) != DMU_OST_ZFS) {
1804219089Spjd		dmu_objset_rele(os, FTAG);
1805249195Smm		return (SET_ERROR(EINVAL));
1806219089Spjd	}
1807219089Spjd	error = zfs_obj_to_stats(os, zc->zc_obj, &zc->zc_stat, zc->zc_value,
1808219089Spjd	    sizeof (zc->zc_value));
1809219089Spjd	dmu_objset_rele(os, FTAG);
1810219089Spjd
1811219089Spjd	return (error);
1812219089Spjd}
1813219089Spjd
1814219089Spjdstatic int
1815168404Spjdzfs_ioc_vdev_add(zfs_cmd_t *zc)
1816168404Spjd{
1817168404Spjd	spa_t *spa;
1818168404Spjd	int error;
1819185029Spjd	nvlist_t *config, **l2cache, **spares;
1820185029Spjd	uint_t nl2cache = 0, nspares = 0;
1821168404Spjd
1822168404Spjd	error = spa_open(zc->zc_name, &spa, FTAG);
1823168404Spjd	if (error != 0)
1824168404Spjd		return (error);
1825168404Spjd
1826185029Spjd	error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1827219089Spjd	    zc->zc_iflags, &config);
1828185029Spjd	(void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_L2CACHE,
1829185029Spjd	    &l2cache, &nl2cache);
1830185029Spjd
1831185029Spjd	(void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_SPARES,
1832185029Spjd	    &spares, &nspares);
1833185029Spjd
1834168404Spjd	/*
1835168404Spjd	 * A root pool with concatenated devices is not supported.
1836185029Spjd	 * Thus, can not add a device to a root pool.
1837185029Spjd	 *
1838185029Spjd	 * Intent log device can not be added to a rootpool because
1839185029Spjd	 * during mountroot, zil is replayed, a seperated log device
1840185029Spjd	 * can not be accessed during the mountroot time.
1841185029Spjd	 *
1842185029Spjd	 * l2cache and spare devices are ok to be added to a rootpool.
1843168404Spjd	 */
1844219089Spjd	if (spa_bootfs(spa) != 0 && nl2cache == 0 && nspares == 0) {
1845219089Spjd		nvlist_free(config);
1846168404Spjd		spa_close(spa, FTAG);
1847249195Smm		return (SET_ERROR(EDOM));
1848168404Spjd	}
1849168404Spjd
1850185029Spjd	if (error == 0) {
1851168404Spjd		error = spa_vdev_add(spa, config);
1852168404Spjd		nvlist_free(config);
1853168404Spjd	}
1854168404Spjd	spa_close(spa, FTAG);
1855168404Spjd	return (error);
1856168404Spjd}
1857168404Spjd
1858219089Spjd/*
1859219089Spjd * inputs:
1860219089Spjd * zc_name		name of the pool
1861219089Spjd * zc_nvlist_conf	nvlist of devices to remove
1862219089Spjd * zc_cookie		to stop the remove?
1863219089Spjd */
1864168404Spjdstatic int
1865168404Spjdzfs_ioc_vdev_remove(zfs_cmd_t *zc)
1866168404Spjd{
1867168404Spjd	spa_t *spa;
1868168404Spjd	int error;
1869168404Spjd
1870168404Spjd	error = spa_open(zc->zc_name, &spa, FTAG);
1871168404Spjd	if (error != 0)
1872168404Spjd		return (error);
1873168404Spjd	error = spa_vdev_remove(spa, zc->zc_guid, B_FALSE);
1874168404Spjd	spa_close(spa, FTAG);
1875168404Spjd	return (error);
1876168404Spjd}
1877168404Spjd
1878168404Spjdstatic int
1879185029Spjdzfs_ioc_vdev_set_state(zfs_cmd_t *zc)
1880168404Spjd{
1881168404Spjd	spa_t *spa;
1882168404Spjd	int error;
1883185029Spjd	vdev_state_t newstate = VDEV_STATE_UNKNOWN;
1884168404Spjd
1885168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1886168404Spjd		return (error);
1887185029Spjd	switch (zc->zc_cookie) {
1888185029Spjd	case VDEV_STATE_ONLINE:
1889185029Spjd		error = vdev_online(spa, zc->zc_guid, zc->zc_obj, &newstate);
1890185029Spjd		break;
1891168404Spjd
1892185029Spjd	case VDEV_STATE_OFFLINE:
1893185029Spjd		error = vdev_offline(spa, zc->zc_guid, zc->zc_obj);
1894185029Spjd		break;
1895168404Spjd
1896185029Spjd	case VDEV_STATE_FAULTED:
1897219089Spjd		if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1898219089Spjd		    zc->zc_obj != VDEV_AUX_EXTERNAL)
1899219089Spjd			zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1900219089Spjd
1901219089Spjd		error = vdev_fault(spa, zc->zc_guid, zc->zc_obj);
1902185029Spjd		break;
1903185029Spjd
1904185029Spjd	case VDEV_STATE_DEGRADED:
1905219089Spjd		if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1906219089Spjd		    zc->zc_obj != VDEV_AUX_EXTERNAL)
1907219089Spjd			zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1908219089Spjd
1909219089Spjd		error = vdev_degrade(spa, zc->zc_guid, zc->zc_obj);
1910185029Spjd		break;
1911185029Spjd
1912185029Spjd	default:
1913249195Smm		error = SET_ERROR(EINVAL);
1914185029Spjd	}
1915185029Spjd	zc->zc_cookie = newstate;
1916168404Spjd	spa_close(spa, FTAG);
1917168404Spjd	return (error);
1918168404Spjd}
1919168404Spjd
1920168404Spjdstatic int
1921168404Spjdzfs_ioc_vdev_attach(zfs_cmd_t *zc)
1922168404Spjd{
1923168404Spjd	spa_t *spa;
1924168404Spjd	int replacing = zc->zc_cookie;
1925168404Spjd	nvlist_t *config;
1926168404Spjd	int error;
1927168404Spjd
1928168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1929168404Spjd		return (error);
1930168404Spjd
1931185029Spjd	if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1932219089Spjd	    zc->zc_iflags, &config)) == 0) {
1933168404Spjd		error = spa_vdev_attach(spa, zc->zc_guid, config, replacing);
1934168404Spjd		nvlist_free(config);
1935168404Spjd	}
1936168404Spjd
1937168404Spjd	spa_close(spa, FTAG);
1938168404Spjd	return (error);
1939168404Spjd}
1940168404Spjd
1941168404Spjdstatic int
1942168404Spjdzfs_ioc_vdev_detach(zfs_cmd_t *zc)
1943168404Spjd{
1944168404Spjd	spa_t *spa;
1945168404Spjd	int error;
1946168404Spjd
1947168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1948168404Spjd		return (error);
1949168404Spjd
1950209962Smm	error = spa_vdev_detach(spa, zc->zc_guid, 0, B_FALSE);
1951168404Spjd
1952168404Spjd	spa_close(spa, FTAG);
1953168404Spjd	return (error);
1954168404Spjd}
1955168404Spjd
1956168404Spjdstatic int
1957219089Spjdzfs_ioc_vdev_split(zfs_cmd_t *zc)
1958219089Spjd{
1959219089Spjd	spa_t *spa;
1960219089Spjd	nvlist_t *config, *props = NULL;
1961219089Spjd	int error;
1962219089Spjd	boolean_t exp = !!(zc->zc_cookie & ZPOOL_EXPORT_AFTER_SPLIT);
1963219089Spjd
1964219089Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1965219089Spjd		return (error);
1966219089Spjd
1967219089Spjd	if (error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1968219089Spjd	    zc->zc_iflags, &config)) {
1969219089Spjd		spa_close(spa, FTAG);
1970219089Spjd		return (error);
1971219089Spjd	}
1972219089Spjd
1973219089Spjd	if (zc->zc_nvlist_src_size != 0 && (error =
1974219089Spjd	    get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1975219089Spjd	    zc->zc_iflags, &props))) {
1976219089Spjd		spa_close(spa, FTAG);
1977219089Spjd		nvlist_free(config);
1978219089Spjd		return (error);
1979219089Spjd	}
1980219089Spjd
1981219089Spjd	error = spa_vdev_split_mirror(spa, zc->zc_string, config, props, exp);
1982219089Spjd
1983219089Spjd	spa_close(spa, FTAG);
1984219089Spjd
1985219089Spjd	nvlist_free(config);
1986219089Spjd	nvlist_free(props);
1987219089Spjd
1988219089Spjd	return (error);
1989219089Spjd}
1990219089Spjd
1991219089Spjdstatic int
1992168404Spjdzfs_ioc_vdev_setpath(zfs_cmd_t *zc)
1993168404Spjd{
1994168404Spjd	spa_t *spa;
1995168404Spjd	char *path = zc->zc_value;
1996168404Spjd	uint64_t guid = zc->zc_guid;
1997168404Spjd	int error;
1998168404Spjd
1999168404Spjd	error = spa_open(zc->zc_name, &spa, FTAG);
2000168404Spjd	if (error != 0)
2001168404Spjd		return (error);
2002168404Spjd
2003168404Spjd	error = spa_vdev_setpath(spa, guid, path);
2004168404Spjd	spa_close(spa, FTAG);
2005168404Spjd	return (error);
2006168404Spjd}
2007168404Spjd
2008209962Smmstatic int
2009209962Smmzfs_ioc_vdev_setfru(zfs_cmd_t *zc)
2010209962Smm{
2011209962Smm	spa_t *spa;
2012209962Smm	char *fru = zc->zc_value;
2013209962Smm	uint64_t guid = zc->zc_guid;
2014209962Smm	int error;
2015209962Smm
2016209962Smm	error = spa_open(zc->zc_name, &spa, FTAG);
2017209962Smm	if (error != 0)
2018209962Smm		return (error);
2019209962Smm
2020209962Smm	error = spa_vdev_setfru(spa, guid, fru);
2021209962Smm	spa_close(spa, FTAG);
2022209962Smm	return (error);
2023209962Smm}
2024209962Smm
2025219089Spjdstatic int
2026219089Spjdzfs_ioc_objset_stats_impl(zfs_cmd_t *zc, objset_t *os)
2027219089Spjd{
2028219089Spjd	int error = 0;
2029219089Spjd	nvlist_t *nv;
2030219089Spjd
2031219089Spjd	dmu_objset_fast_stat(os, &zc->zc_objset_stats);
2032219089Spjd
2033219089Spjd	if (zc->zc_nvlist_dst != 0 &&
2034219089Spjd	    (error = dsl_prop_get_all(os, &nv)) == 0) {
2035219089Spjd		dmu_objset_stats(os, nv);
2036219089Spjd		/*
2037219089Spjd		 * NB: zvol_get_stats() will read the objset contents,
2038219089Spjd		 * which we aren't supposed to do with a
2039219089Spjd		 * DS_MODE_USER hold, because it could be
2040219089Spjd		 * inconsistent.  So this is a bit of a workaround...
2041219089Spjd		 * XXX reading with out owning
2042219089Spjd		 */
2043228103Smm		if (!zc->zc_objset_stats.dds_inconsistent &&
2044228103Smm		    dmu_objset_type(os) == DMU_OST_ZVOL) {
2045228103Smm			error = zvol_get_stats(os, nv);
2046228103Smm			if (error == EIO)
2047228103Smm				return (error);
2048240415Smm			VERIFY0(error);
2049219089Spjd		}
2050219089Spjd		error = put_nvlist(zc, nv);
2051219089Spjd		nvlist_free(nv);
2052219089Spjd	}
2053219089Spjd
2054219089Spjd	return (error);
2055219089Spjd}
2056219089Spjd
2057185029Spjd/*
2058185029Spjd * inputs:
2059185029Spjd * zc_name		name of filesystem
2060185029Spjd * zc_nvlist_dst_size	size of buffer for property nvlist
2061185029Spjd *
2062185029Spjd * outputs:
2063185029Spjd * zc_objset_stats	stats
2064185029Spjd * zc_nvlist_dst	property nvlist
2065185029Spjd * zc_nvlist_dst_size	size of property nvlist
2066185029Spjd */
2067168404Spjdstatic int
2068168404Spjdzfs_ioc_objset_stats(zfs_cmd_t *zc)
2069168404Spjd{
2070248571Smm	objset_t *os;
2071168404Spjd	int error;
2072219089Spjd
2073248571Smm	error = dmu_objset_hold(zc->zc_name, FTAG, &os);
2074248571Smm	if (error == 0) {
2075248571Smm		error = zfs_ioc_objset_stats_impl(zc, os);
2076248571Smm		dmu_objset_rele(os, FTAG);
2077248571Smm	}
2078219089Spjd
2079219089Spjd	if (error == ENOMEM)
2080219089Spjd		error = 0;
2081219089Spjd	return (error);
2082219089Spjd}
2083219089Spjd
2084219089Spjd/*
2085219089Spjd * inputs:
2086219089Spjd * zc_name		name of filesystem
2087219089Spjd * zc_nvlist_dst_size	size of buffer for property nvlist
2088219089Spjd *
2089219089Spjd * outputs:
2090219089Spjd * zc_nvlist_dst	received property nvlist
2091219089Spjd * zc_nvlist_dst_size	size of received property nvlist
2092219089Spjd *
2093219089Spjd * Gets received properties (distinct from local properties on or after
2094219089Spjd * SPA_VERSION_RECVD_PROPS) for callers who want to differentiate received from
2095219089Spjd * local property values.
2096219089Spjd */
2097219089Spjdstatic int
2098219089Spjdzfs_ioc_objset_recvd_props(zfs_cmd_t *zc)
2099219089Spjd{
2100248571Smm	int error = 0;
2101168404Spjd	nvlist_t *nv;
2102168404Spjd
2103219089Spjd	/*
2104219089Spjd	 * Without this check, we would return local property values if the
2105219089Spjd	 * caller has not already received properties on or after
2106219089Spjd	 * SPA_VERSION_RECVD_PROPS.
2107219089Spjd	 */
2108248571Smm	if (!dsl_prop_get_hasrecvd(zc->zc_name))
2109249195Smm		return (SET_ERROR(ENOTSUP));
2110168404Spjd
2111168404Spjd	if (zc->zc_nvlist_dst != 0 &&
2112248571Smm	    (error = dsl_prop_get_received(zc->zc_name, &nv)) == 0) {
2113168404Spjd		error = put_nvlist(zc, nv);
2114168404Spjd		nvlist_free(nv);
2115168404Spjd	}
2116168404Spjd
2117168404Spjd	return (error);
2118168404Spjd}
2119168404Spjd
2120168404Spjdstatic int
2121185029Spjdnvl_add_zplprop(objset_t *os, nvlist_t *props, zfs_prop_t prop)
2122185029Spjd{
2123185029Spjd	uint64_t value;
2124185029Spjd	int error;
2125185029Spjd
2126185029Spjd	/*
2127185029Spjd	 * zfs_get_zplprop() will either find a value or give us
2128185029Spjd	 * the default value (if there is one).
2129185029Spjd	 */
2130185029Spjd	if ((error = zfs_get_zplprop(os, prop, &value)) != 0)
2131185029Spjd		return (error);
2132185029Spjd	VERIFY(nvlist_add_uint64(props, zfs_prop_to_name(prop), value) == 0);
2133185029Spjd	return (0);
2134185029Spjd}
2135185029Spjd
2136185029Spjd/*
2137185029Spjd * inputs:
2138185029Spjd * zc_name		name of filesystem
2139185029Spjd * zc_nvlist_dst_size	size of buffer for zpl property nvlist
2140185029Spjd *
2141185029Spjd * outputs:
2142185029Spjd * zc_nvlist_dst	zpl property nvlist
2143185029Spjd * zc_nvlist_dst_size	size of zpl property nvlist
2144185029Spjd */
2145185029Spjdstatic int
2146185029Spjdzfs_ioc_objset_zplprops(zfs_cmd_t *zc)
2147185029Spjd{
2148185029Spjd	objset_t *os;
2149185029Spjd	int err;
2150185029Spjd
2151219089Spjd	/* XXX reading without owning */
2152219089Spjd	if (err = dmu_objset_hold(zc->zc_name, FTAG, &os))
2153185029Spjd		return (err);
2154185029Spjd
2155185029Spjd	dmu_objset_fast_stat(os, &zc->zc_objset_stats);
2156185029Spjd
2157185029Spjd	/*
2158185029Spjd	 * NB: nvl_add_zplprop() will read the objset contents,
2159185029Spjd	 * which we aren't supposed to do with a DS_MODE_USER
2160185029Spjd	 * hold, because it could be inconsistent.
2161185029Spjd	 */
2162185029Spjd	if (zc->zc_nvlist_dst != 0 &&
2163185029Spjd	    !zc->zc_objset_stats.dds_inconsistent &&
2164185029Spjd	    dmu_objset_type(os) == DMU_OST_ZFS) {
2165185029Spjd		nvlist_t *nv;
2166185029Spjd
2167185029Spjd		VERIFY(nvlist_alloc(&nv, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2168185029Spjd		if ((err = nvl_add_zplprop(os, nv, ZFS_PROP_VERSION)) == 0 &&
2169185029Spjd		    (err = nvl_add_zplprop(os, nv, ZFS_PROP_NORMALIZE)) == 0 &&
2170185029Spjd		    (err = nvl_add_zplprop(os, nv, ZFS_PROP_UTF8ONLY)) == 0 &&
2171185029Spjd		    (err = nvl_add_zplprop(os, nv, ZFS_PROP_CASE)) == 0)
2172185029Spjd			err = put_nvlist(zc, nv);
2173185029Spjd		nvlist_free(nv);
2174185029Spjd	} else {
2175249195Smm		err = SET_ERROR(ENOENT);
2176185029Spjd	}
2177219089Spjd	dmu_objset_rele(os, FTAG);
2178185029Spjd	return (err);
2179185029Spjd}
2180185029Spjd
2181219089Spjdboolean_t
2182209962Smmdataset_name_hidden(const char *name)
2183209962Smm{
2184209962Smm	/*
2185209962Smm	 * Skip over datasets that are not visible in this zone,
2186209962Smm	 * internal datasets (which have a $ in their name), and
2187209962Smm	 * temporary datasets (which have a % in their name).
2188209962Smm	 */
2189209962Smm	if (strchr(name, '$') != NULL)
2190209962Smm		return (B_TRUE);
2191209962Smm	if (strchr(name, '%') != NULL)
2192209962Smm		return (B_TRUE);
2193209962Smm	if (!INGLOBALZONE(curthread) && !zone_dataset_visible(name, NULL))
2194209962Smm		return (B_TRUE);
2195209962Smm	return (B_FALSE);
2196209962Smm}
2197209962Smm
2198185029Spjd/*
2199185029Spjd * inputs:
2200185029Spjd * zc_name		name of filesystem
2201185029Spjd * zc_cookie		zap cursor
2202185029Spjd * zc_nvlist_dst_size	size of buffer for property nvlist
2203185029Spjd *
2204185029Spjd * outputs:
2205185029Spjd * zc_name		name of next filesystem
2206209962Smm * zc_cookie		zap cursor
2207185029Spjd * zc_objset_stats	stats
2208185029Spjd * zc_nvlist_dst	property nvlist
2209185029Spjd * zc_nvlist_dst_size	size of property nvlist
2210185029Spjd */
2211185029Spjdstatic int
2212168404Spjdzfs_ioc_dataset_list_next(zfs_cmd_t *zc)
2213168404Spjd{
2214168404Spjd	objset_t *os;
2215168404Spjd	int error;
2216168404Spjd	char *p;
2217219089Spjd	size_t orig_len = strlen(zc->zc_name);
2218168404Spjd
2219219089Spjdtop:
2220219089Spjd	if (error = dmu_objset_hold(zc->zc_name, FTAG, &os)) {
2221168404Spjd		if (error == ENOENT)
2222249195Smm			error = SET_ERROR(ESRCH);
2223168404Spjd		return (error);
2224168404Spjd	}
2225168404Spjd
2226168404Spjd	p = strrchr(zc->zc_name, '/');
2227168404Spjd	if (p == NULL || p[1] != '\0')
2228168404Spjd		(void) strlcat(zc->zc_name, "/", sizeof (zc->zc_name));
2229168404Spjd	p = zc->zc_name + strlen(zc->zc_name);
2230168404Spjd
2231168404Spjd	do {
2232168404Spjd		error = dmu_dir_list_next(os,
2233168404Spjd		    sizeof (zc->zc_name) - (p - zc->zc_name), p,
2234168404Spjd		    NULL, &zc->zc_cookie);
2235168404Spjd		if (error == ENOENT)
2236249195Smm			error = SET_ERROR(ESRCH);
2237228103Smm	} while (error == 0 && dataset_name_hidden(zc->zc_name));
2238219089Spjd	dmu_objset_rele(os, FTAG);
2239168404Spjd
2240219089Spjd	/*
2241219089Spjd	 * If it's an internal dataset (ie. with a '$' in its name),
2242219089Spjd	 * don't try to get stats for it, otherwise we'll return ENOENT.
2243219089Spjd	 */
2244219089Spjd	if (error == 0 && strchr(zc->zc_name, '$') == NULL) {
2245168404Spjd		error = zfs_ioc_objset_stats(zc); /* fill in the stats */
2246219089Spjd		if (error == ENOENT) {
2247219089Spjd			/* We lost a race with destroy, get the next one. */
2248219089Spjd			zc->zc_name[orig_len] = '\0';
2249219089Spjd			goto top;
2250219089Spjd		}
2251219089Spjd	}
2252168404Spjd	return (error);
2253168404Spjd}
2254168404Spjd
2255185029Spjd/*
2256185029Spjd * inputs:
2257185029Spjd * zc_name		name of filesystem
2258185029Spjd * zc_cookie		zap cursor
2259185029Spjd * zc_nvlist_dst_size	size of buffer for property nvlist
2260230438Spjd * zc_simple		when set, only name is requested
2261185029Spjd *
2262185029Spjd * outputs:
2263185029Spjd * zc_name		name of next snapshot
2264185029Spjd * zc_objset_stats	stats
2265185029Spjd * zc_nvlist_dst	property nvlist
2266185029Spjd * zc_nvlist_dst_size	size of property nvlist
2267185029Spjd */
2268168404Spjdstatic int
2269168404Spjdzfs_ioc_snapshot_list_next(zfs_cmd_t *zc)
2270168404Spjd{
2271168404Spjd	objset_t *os;
2272168404Spjd	int error;
2273168404Spjd
2274219089Spjd	error = dmu_objset_hold(zc->zc_name, FTAG, &os);
2275248571Smm	if (error != 0) {
2276185029Spjd		return (error == ENOENT ? ESRCH : error);
2277248571Smm	}
2278168404Spjd
2279168404Spjd	/*
2280168404Spjd	 * A dataset name of maximum length cannot have any snapshots,
2281168404Spjd	 * so exit immediately.
2282168404Spjd	 */
2283168404Spjd	if (strlcat(zc->zc_name, "@", sizeof (zc->zc_name)) >= MAXNAMELEN) {
2284219089Spjd		dmu_objset_rele(os, FTAG);
2285249195Smm		return (SET_ERROR(ESRCH));
2286168404Spjd	}
2287168404Spjd
2288168404Spjd	error = dmu_snapshot_list_next(os,
2289168404Spjd	    sizeof (zc->zc_name) - strlen(zc->zc_name),
2290219089Spjd	    zc->zc_name + strlen(zc->zc_name), &zc->zc_obj, &zc->zc_cookie,
2291219089Spjd	    NULL);
2292219089Spjd
2293230438Spjd	if (error == 0 && !zc->zc_simple) {
2294219089Spjd		dsl_dataset_t *ds;
2295219089Spjd		dsl_pool_t *dp = os->os_dsl_dataset->ds_dir->dd_pool;
2296219089Spjd
2297219089Spjd		error = dsl_dataset_hold_obj(dp, zc->zc_obj, FTAG, &ds);
2298248571Smm		if (error == 0) {
2299219089Spjd			objset_t *ossnap;
2300219089Spjd
2301219089Spjd			error = dmu_objset_from_ds(ds, &ossnap);
2302219089Spjd			if (error == 0)
2303219089Spjd				error = zfs_ioc_objset_stats_impl(zc, ossnap);
2304219089Spjd			dsl_dataset_rele(ds, FTAG);
2305219089Spjd		}
2306219089Spjd	} else if (error == ENOENT) {
2307249195Smm		error = SET_ERROR(ESRCH);
2308219089Spjd	}
2309168404Spjd
2310219089Spjd	dmu_objset_rele(os, FTAG);
2311185029Spjd	/* if we failed, undo the @ that we tacked on to zc_name */
2312248571Smm	if (error != 0)
2313185029Spjd		*strchr(zc->zc_name, '@') = '\0';
2314168404Spjd	return (error);
2315168404Spjd}
2316168404Spjd
2317219089Spjdstatic int
2318219089Spjdzfs_prop_set_userquota(const char *dsname, nvpair_t *pair)
2319168404Spjd{
2320219089Spjd	const char *propname = nvpair_name(pair);
2321219089Spjd	uint64_t *valary;
2322219089Spjd	unsigned int vallen;
2323219089Spjd	const char *domain;
2324219089Spjd	char *dash;
2325219089Spjd	zfs_userquota_prop_t type;
2326219089Spjd	uint64_t rid;
2327219089Spjd	uint64_t quota;
2328219089Spjd	zfsvfs_t *zfsvfs;
2329219089Spjd	int err;
2330168404Spjd
2331219089Spjd	if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2332219089Spjd		nvlist_t *attrs;
2333219089Spjd		VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2334219089Spjd		if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2335219089Spjd		    &pair) != 0)
2336249195Smm			return (SET_ERROR(EINVAL));
2337219089Spjd	}
2338219089Spjd
2339185029Spjd	/*
2340219089Spjd	 * A correctly constructed propname is encoded as
2341219089Spjd	 * userquota@<rid>-<domain>.
2342185029Spjd	 */
2343219089Spjd	if ((dash = strchr(propname, '-')) == NULL ||
2344219089Spjd	    nvpair_value_uint64_array(pair, &valary, &vallen) != 0 ||
2345219089Spjd	    vallen != 3)
2346249195Smm		return (SET_ERROR(EINVAL));
2347168404Spjd
2348219089Spjd	domain = dash + 1;
2349219089Spjd	type = valary[0];
2350219089Spjd	rid = valary[1];
2351219089Spjd	quota = valary[2];
2352168404Spjd
2353219089Spjd	err = zfsvfs_hold(dsname, FTAG, &zfsvfs, B_FALSE);
2354219089Spjd	if (err == 0) {
2355219089Spjd		err = zfs_set_userquota(zfsvfs, type, domain, rid, quota);
2356219089Spjd		zfsvfs_rele(zfsvfs, FTAG);
2357219089Spjd	}
2358209962Smm
2359219089Spjd	return (err);
2360219089Spjd}
2361168404Spjd
2362219089Spjd/*
2363219089Spjd * If the named property is one that has a special function to set its value,
2364219089Spjd * return 0 on success and a positive error code on failure; otherwise if it is
2365219089Spjd * not one of the special properties handled by this function, return -1.
2366219089Spjd *
2367219089Spjd * XXX: It would be better for callers of the property interface if we handled
2368219089Spjd * these special cases in dsl_prop.c (in the dsl layer).
2369219089Spjd */
2370219089Spjdstatic int
2371219089Spjdzfs_prop_set_special(const char *dsname, zprop_source_t source,
2372219089Spjd    nvpair_t *pair)
2373219089Spjd{
2374219089Spjd	const char *propname = nvpair_name(pair);
2375219089Spjd	zfs_prop_t prop = zfs_name_to_prop(propname);
2376219089Spjd	uint64_t intval;
2377219089Spjd	int err;
2378209962Smm
2379219089Spjd	if (prop == ZPROP_INVAL) {
2380219089Spjd		if (zfs_prop_userquota(propname))
2381219089Spjd			return (zfs_prop_set_userquota(dsname, pair));
2382219089Spjd		return (-1);
2383219089Spjd	}
2384185029Spjd
2385219089Spjd	if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2386219089Spjd		nvlist_t *attrs;
2387219089Spjd		VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2388219089Spjd		VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2389219089Spjd		    &pair) == 0);
2390219089Spjd	}
2391168404Spjd
2392219089Spjd	if (zfs_prop_get_type(prop) == PROP_TYPE_STRING)
2393219089Spjd		return (-1);
2394185029Spjd
2395219089Spjd	VERIFY(0 == nvpair_value_uint64(pair, &intval));
2396185029Spjd
2397219089Spjd	switch (prop) {
2398219089Spjd	case ZFS_PROP_QUOTA:
2399219089Spjd		err = dsl_dir_set_quota(dsname, source, intval);
2400219089Spjd		break;
2401219089Spjd	case ZFS_PROP_REFQUOTA:
2402248571Smm		err = dsl_dataset_set_refquota(dsname, source, intval);
2403219089Spjd		break;
2404219089Spjd	case ZFS_PROP_RESERVATION:
2405219089Spjd		err = dsl_dir_set_reservation(dsname, source, intval);
2406219089Spjd		break;
2407219089Spjd	case ZFS_PROP_REFRESERVATION:
2408248571Smm		err = dsl_dataset_set_refreservation(dsname, source, intval);
2409219089Spjd		break;
2410219089Spjd	case ZFS_PROP_VOLSIZE:
2411219089Spjd		err = zvol_set_volsize(dsname, ddi_driver_major(zfs_dip),
2412219089Spjd		    intval);
2413219089Spjd		break;
2414219089Spjd	case ZFS_PROP_VERSION:
2415219089Spjd	{
2416219089Spjd		zfsvfs_t *zfsvfs;
2417219089Spjd
2418219089Spjd		if ((err = zfsvfs_hold(dsname, FTAG, &zfsvfs, B_TRUE)) != 0)
2419185029Spjd			break;
2420201143Sdelphij
2421219089Spjd		err = zfs_set_version(zfsvfs, intval);
2422219089Spjd		zfsvfs_rele(zfsvfs, FTAG);
2423168404Spjd
2424219089Spjd		if (err == 0 && intval >= ZPL_VERSION_USERSPACE) {
2425219089Spjd			zfs_cmd_t *zc;
2426185029Spjd
2427219089Spjd			zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP);
2428219089Spjd			(void) strcpy(zc->zc_name, dsname);
2429219089Spjd			(void) zfs_ioc_userspace_upgrade(zc);
2430219089Spjd			kmem_free(zc, sizeof (zfs_cmd_t));
2431185029Spjd		}
2432219089Spjd		break;
2433219089Spjd	}
2434246586Sdelphij	case ZFS_PROP_COMPRESSION:
2435246586Sdelphij	{
2436246586Sdelphij		if (intval == ZIO_COMPRESS_LZ4) {
2437246586Sdelphij			zfeature_info_t *feature =
2438246586Sdelphij			    &spa_feature_table[SPA_FEATURE_LZ4_COMPRESS];
2439246586Sdelphij			spa_t *spa;
2440185029Spjd
2441246586Sdelphij			if ((err = spa_open(dsname, &spa, FTAG)) != 0)
2442246586Sdelphij				return (err);
2443246586Sdelphij
2444246586Sdelphij			/*
2445246586Sdelphij			 * Setting the LZ4 compression algorithm activates
2446246586Sdelphij			 * the feature.
2447246586Sdelphij			 */
2448246586Sdelphij			if (!spa_feature_is_active(spa, feature)) {
2449248571Smm				if ((err = zfs_prop_activate_feature(spa,
2450246586Sdelphij				    feature)) != 0) {
2451246586Sdelphij					spa_close(spa, FTAG);
2452246586Sdelphij					return (err);
2453246586Sdelphij				}
2454246586Sdelphij			}
2455246586Sdelphij
2456246586Sdelphij			spa_close(spa, FTAG);
2457246586Sdelphij		}
2458246586Sdelphij		/*
2459246586Sdelphij		 * We still want the default set action to be performed in the
2460246586Sdelphij		 * caller, we only performed zfeature settings here.
2461246586Sdelphij		 */
2462246586Sdelphij		err = -1;
2463246586Sdelphij		break;
2464246586Sdelphij	}
2465246586Sdelphij
2466219089Spjd	default:
2467219089Spjd		err = -1;
2468219089Spjd	}
2469168404Spjd
2470219089Spjd	return (err);
2471219089Spjd}
2472185029Spjd
2473219089Spjd/*
2474219089Spjd * This function is best effort. If it fails to set any of the given properties,
2475248571Smm * it continues to set as many as it can and returns the last error
2476248571Smm * encountered. If the caller provides a non-NULL errlist, it will be filled in
2477248571Smm * with the list of names of all the properties that failed along with the
2478248571Smm * corresponding error numbers.
2479219089Spjd *
2480248571Smm * If every property is set successfully, zero is returned and errlist is not
2481248571Smm * modified.
2482219089Spjd */
2483219089Spjdint
2484219089Spjdzfs_set_prop_nvlist(const char *dsname, zprop_source_t source, nvlist_t *nvl,
2485248571Smm    nvlist_t *errlist)
2486219089Spjd{
2487219089Spjd	nvpair_t *pair;
2488219089Spjd	nvpair_t *propval;
2489219089Spjd	int rv = 0;
2490219089Spjd	uint64_t intval;
2491219089Spjd	char *strval;
2492248571Smm	nvlist_t *genericnvl = fnvlist_alloc();
2493248571Smm	nvlist_t *retrynvl = fnvlist_alloc();
2494168404Spjd
2495219089Spjdretry:
2496219089Spjd	pair = NULL;
2497219089Spjd	while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2498219089Spjd		const char *propname = nvpair_name(pair);
2499219089Spjd		zfs_prop_t prop = zfs_name_to_prop(propname);
2500219089Spjd		int err = 0;
2501185029Spjd
2502219089Spjd		/* decode the property value */
2503219089Spjd		propval = pair;
2504219089Spjd		if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2505219089Spjd			nvlist_t *attrs;
2506248571Smm			attrs = fnvpair_value_nvlist(pair);
2507219089Spjd			if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2508219089Spjd			    &propval) != 0)
2509249195Smm				err = SET_ERROR(EINVAL);
2510219089Spjd		}
2511168404Spjd
2512219089Spjd		/* Validate value type */
2513219089Spjd		if (err == 0 && prop == ZPROP_INVAL) {
2514219089Spjd			if (zfs_prop_user(propname)) {
2515219089Spjd				if (nvpair_type(propval) != DATA_TYPE_STRING)
2516249195Smm					err = SET_ERROR(EINVAL);
2517219089Spjd			} else if (zfs_prop_userquota(propname)) {
2518219089Spjd				if (nvpair_type(propval) !=
2519219089Spjd				    DATA_TYPE_UINT64_ARRAY)
2520249195Smm					err = SET_ERROR(EINVAL);
2521228103Smm			} else {
2522249195Smm				err = SET_ERROR(EINVAL);
2523209962Smm			}
2524219089Spjd		} else if (err == 0) {
2525219089Spjd			if (nvpair_type(propval) == DATA_TYPE_STRING) {
2526219089Spjd				if (zfs_prop_get_type(prop) != PROP_TYPE_STRING)
2527249195Smm					err = SET_ERROR(EINVAL);
2528219089Spjd			} else if (nvpair_type(propval) == DATA_TYPE_UINT64) {
2529168404Spjd				const char *unused;
2530168404Spjd
2531248571Smm				intval = fnvpair_value_uint64(propval);
2532168404Spjd
2533168404Spjd				switch (zfs_prop_get_type(prop)) {
2534185029Spjd				case PROP_TYPE_NUMBER:
2535168404Spjd					break;
2536185029Spjd				case PROP_TYPE_STRING:
2537249195Smm					err = SET_ERROR(EINVAL);
2538219089Spjd					break;
2539185029Spjd				case PROP_TYPE_INDEX:
2540168404Spjd					if (zfs_prop_index_to_string(prop,
2541219089Spjd					    intval, &unused) != 0)
2542249195Smm						err = SET_ERROR(EINVAL);
2543168404Spjd					break;
2544168404Spjd				default:
2545185029Spjd					cmn_err(CE_PANIC,
2546185029Spjd					    "unknown property type");
2547168404Spjd				}
2548168404Spjd			} else {
2549249195Smm				err = SET_ERROR(EINVAL);
2550168404Spjd			}
2551168404Spjd		}
2552219089Spjd
2553219089Spjd		/* Validate permissions */
2554219089Spjd		if (err == 0)
2555219089Spjd			err = zfs_check_settable(dsname, pair, CRED());
2556219089Spjd
2557219089Spjd		if (err == 0) {
2558219089Spjd			err = zfs_prop_set_special(dsname, source, pair);
2559219089Spjd			if (err == -1) {
2560219089Spjd				/*
2561219089Spjd				 * For better performance we build up a list of
2562219089Spjd				 * properties to set in a single transaction.
2563219089Spjd				 */
2564219089Spjd				err = nvlist_add_nvpair(genericnvl, pair);
2565219089Spjd			} else if (err != 0 && nvl != retrynvl) {
2566219089Spjd				/*
2567219089Spjd				 * This may be a spurious error caused by
2568219089Spjd				 * receiving quota and reservation out of order.
2569219089Spjd				 * Try again in a second pass.
2570219089Spjd				 */
2571219089Spjd				err = nvlist_add_nvpair(retrynvl, pair);
2572219089Spjd			}
2573219089Spjd		}
2574219089Spjd
2575248571Smm		if (err != 0) {
2576248571Smm			if (errlist != NULL)
2577248571Smm				fnvlist_add_int32(errlist, propname, err);
2578248571Smm			rv = err;
2579248571Smm		}
2580168404Spjd	}
2581168404Spjd
2582219089Spjd	if (nvl != retrynvl && !nvlist_empty(retrynvl)) {
2583219089Spjd		nvl = retrynvl;
2584219089Spjd		goto retry;
2585209962Smm	}
2586219089Spjd
2587219089Spjd	if (!nvlist_empty(genericnvl) &&
2588219089Spjd	    dsl_props_set(dsname, source, genericnvl) != 0) {
2589219089Spjd		/*
2590219089Spjd		 * If this fails, we still want to set as many properties as we
2591219089Spjd		 * can, so try setting them individually.
2592219089Spjd		 */
2593219089Spjd		pair = NULL;
2594219089Spjd		while ((pair = nvlist_next_nvpair(genericnvl, pair)) != NULL) {
2595219089Spjd			const char *propname = nvpair_name(pair);
2596219089Spjd			int err = 0;
2597219089Spjd
2598219089Spjd			propval = pair;
2599219089Spjd			if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2600219089Spjd				nvlist_t *attrs;
2601248571Smm				attrs = fnvpair_value_nvlist(pair);
2602248571Smm				propval = fnvlist_lookup_nvpair(attrs,
2603248571Smm				    ZPROP_VALUE);
2604219089Spjd			}
2605219089Spjd
2606219089Spjd			if (nvpair_type(propval) == DATA_TYPE_STRING) {
2607248571Smm				strval = fnvpair_value_string(propval);
2608248571Smm				err = dsl_prop_set_string(dsname, propname,
2609248571Smm				    source, strval);
2610219089Spjd			} else {
2611248571Smm				intval = fnvpair_value_uint64(propval);
2612248571Smm				err = dsl_prop_set_int(dsname, propname, source,
2613248571Smm				    intval);
2614219089Spjd			}
2615219089Spjd
2616219089Spjd			if (err != 0) {
2617248571Smm				if (errlist != NULL) {
2618248571Smm					fnvlist_add_int32(errlist, propname,
2619248571Smm					    err);
2620248571Smm				}
2621248571Smm				rv = err;
2622219089Spjd			}
2623219089Spjd		}
2624219089Spjd	}
2625209962Smm	nvlist_free(genericnvl);
2626219089Spjd	nvlist_free(retrynvl);
2627219089Spjd
2628219089Spjd	return (rv);
2629209962Smm}
2630209962Smm
2631209962Smm/*
2632209962Smm * Check that all the properties are valid user properties.
2633209962Smm */
2634209962Smmstatic int
2635248571Smmzfs_check_userprops(const char *fsname, nvlist_t *nvl)
2636209962Smm{
2637219089Spjd	nvpair_t *pair = NULL;
2638209962Smm	int error = 0;
2639209962Smm
2640219089Spjd	while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2641219089Spjd		const char *propname = nvpair_name(pair);
2642209962Smm		char *valstr;
2643209962Smm
2644209962Smm		if (!zfs_prop_user(propname) ||
2645219089Spjd		    nvpair_type(pair) != DATA_TYPE_STRING)
2646249195Smm			return (SET_ERROR(EINVAL));
2647209962Smm
2648209962Smm		if (error = zfs_secpolicy_write_perms(fsname,
2649209962Smm		    ZFS_DELEG_PERM_USERPROP, CRED()))
2650209962Smm			return (error);
2651209962Smm
2652209962Smm		if (strlen(propname) >= ZAP_MAXNAMELEN)
2653249195Smm			return (SET_ERROR(ENAMETOOLONG));
2654209962Smm
2655219089Spjd		VERIFY(nvpair_value_string(pair, &valstr) == 0);
2656209962Smm		if (strlen(valstr) >= ZAP_MAXVALUELEN)
2657209962Smm			return (E2BIG);
2658209962Smm	}
2659168404Spjd	return (0);
2660168404Spjd}
2661168404Spjd
2662219089Spjdstatic void
2663219089Spjdprops_skip(nvlist_t *props, nvlist_t *skipped, nvlist_t **newprops)
2664219089Spjd{
2665219089Spjd	nvpair_t *pair;
2666219089Spjd
2667219089Spjd	VERIFY(nvlist_alloc(newprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2668219089Spjd
2669219089Spjd	pair = NULL;
2670219089Spjd	while ((pair = nvlist_next_nvpair(props, pair)) != NULL) {
2671219089Spjd		if (nvlist_exists(skipped, nvpair_name(pair)))
2672219089Spjd			continue;
2673219089Spjd
2674219089Spjd		VERIFY(nvlist_add_nvpair(*newprops, pair) == 0);
2675219089Spjd	}
2676219089Spjd}
2677219089Spjd
2678219089Spjdstatic int
2679248571Smmclear_received_props(const char *dsname, nvlist_t *props,
2680219089Spjd    nvlist_t *skipped)
2681219089Spjd{
2682219089Spjd	int err = 0;
2683219089Spjd	nvlist_t *cleared_props = NULL;
2684219089Spjd	props_skip(props, skipped, &cleared_props);
2685219089Spjd	if (!nvlist_empty(cleared_props)) {
2686219089Spjd		/*
2687219089Spjd		 * Acts on local properties until the dataset has received
2688219089Spjd		 * properties at least once on or after SPA_VERSION_RECVD_PROPS.
2689219089Spjd		 */
2690219089Spjd		zprop_source_t flags = (ZPROP_SRC_NONE |
2691248571Smm		    (dsl_prop_get_hasrecvd(dsname) ? ZPROP_SRC_RECEIVED : 0));
2692248571Smm		err = zfs_set_prop_nvlist(dsname, flags, cleared_props, NULL);
2693219089Spjd	}
2694219089Spjd	nvlist_free(cleared_props);
2695219089Spjd	return (err);
2696219089Spjd}
2697219089Spjd
2698185029Spjd/*
2699185029Spjd * inputs:
2700185029Spjd * zc_name		name of filesystem
2701209962Smm * zc_value		name of property to set
2702185029Spjd * zc_nvlist_src{_size}	nvlist of properties to apply
2703219089Spjd * zc_cookie		received properties flag
2704185029Spjd *
2705219089Spjd * outputs:
2706219089Spjd * zc_nvlist_dst{_size} error for each unapplied received property
2707185029Spjd */
2708168404Spjdstatic int
2709168404Spjdzfs_ioc_set_prop(zfs_cmd_t *zc)
2710168404Spjd{
2711168404Spjd	nvlist_t *nvl;
2712219089Spjd	boolean_t received = zc->zc_cookie;
2713219089Spjd	zprop_source_t source = (received ? ZPROP_SRC_RECEIVED :
2714219089Spjd	    ZPROP_SRC_LOCAL);
2715248571Smm	nvlist_t *errors;
2716168404Spjd	int error;
2717168404Spjd
2718185029Spjd	if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2719219089Spjd	    zc->zc_iflags, &nvl)) != 0)
2720185029Spjd		return (error);
2721168404Spjd
2722219089Spjd	if (received) {
2723185029Spjd		nvlist_t *origprops;
2724185029Spjd
2725248571Smm		if (dsl_prop_get_received(zc->zc_name, &origprops) == 0) {
2726248571Smm			(void) clear_received_props(zc->zc_name,
2727248571Smm			    origprops, nvl);
2728248571Smm			nvlist_free(origprops);
2729248571Smm		}
2730219089Spjd
2731248571Smm		error = dsl_prop_set_hasrecvd(zc->zc_name);
2732219089Spjd	}
2733185029Spjd
2734248571Smm	errors = fnvlist_alloc();
2735248571Smm	if (error == 0)
2736248571Smm		error = zfs_set_prop_nvlist(zc->zc_name, source, nvl, errors);
2737219089Spjd
2738219089Spjd	if (zc->zc_nvlist_dst != 0 && errors != NULL) {
2739219089Spjd		(void) put_nvlist(zc, errors);
2740168404Spjd	}
2741168404Spjd
2742219089Spjd	nvlist_free(errors);
2743168404Spjd	nvlist_free(nvl);
2744168404Spjd	return (error);
2745168404Spjd}
2746168404Spjd
2747185029Spjd/*
2748185029Spjd * inputs:
2749185029Spjd * zc_name		name of filesystem
2750185029Spjd * zc_value		name of property to inherit
2751219089Spjd * zc_cookie		revert to received value if TRUE
2752185029Spjd *
2753185029Spjd * outputs:		none
2754185029Spjd */
2755168404Spjdstatic int
2756185029Spjdzfs_ioc_inherit_prop(zfs_cmd_t *zc)
2757185029Spjd{
2758219089Spjd	const char *propname = zc->zc_value;
2759219089Spjd	zfs_prop_t prop = zfs_name_to_prop(propname);
2760219089Spjd	boolean_t received = zc->zc_cookie;
2761219089Spjd	zprop_source_t source = (received
2762219089Spjd	    ? ZPROP_SRC_NONE		/* revert to received value, if any */
2763219089Spjd	    : ZPROP_SRC_INHERITED);	/* explicitly inherit */
2764219089Spjd
2765219089Spjd	if (received) {
2766219089Spjd		nvlist_t *dummy;
2767219089Spjd		nvpair_t *pair;
2768219089Spjd		zprop_type_t type;
2769219089Spjd		int err;
2770219089Spjd
2771219089Spjd		/*
2772219089Spjd		 * zfs_prop_set_special() expects properties in the form of an
2773219089Spjd		 * nvpair with type info.
2774219089Spjd		 */
2775219089Spjd		if (prop == ZPROP_INVAL) {
2776219089Spjd			if (!zfs_prop_user(propname))
2777249195Smm				return (SET_ERROR(EINVAL));
2778219089Spjd
2779219089Spjd			type = PROP_TYPE_STRING;
2780219089Spjd		} else if (prop == ZFS_PROP_VOLSIZE ||
2781219089Spjd		    prop == ZFS_PROP_VERSION) {
2782249195Smm			return (SET_ERROR(EINVAL));
2783219089Spjd		} else {
2784219089Spjd			type = zfs_prop_get_type(prop);
2785219089Spjd		}
2786219089Spjd
2787219089Spjd		VERIFY(nvlist_alloc(&dummy, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2788219089Spjd
2789219089Spjd		switch (type) {
2790219089Spjd		case PROP_TYPE_STRING:
2791219089Spjd			VERIFY(0 == nvlist_add_string(dummy, propname, ""));
2792219089Spjd			break;
2793219089Spjd		case PROP_TYPE_NUMBER:
2794219089Spjd		case PROP_TYPE_INDEX:
2795219089Spjd			VERIFY(0 == nvlist_add_uint64(dummy, propname, 0));
2796219089Spjd			break;
2797219089Spjd		default:
2798219089Spjd			nvlist_free(dummy);
2799249195Smm			return (SET_ERROR(EINVAL));
2800219089Spjd		}
2801219089Spjd
2802219089Spjd		pair = nvlist_next_nvpair(dummy, NULL);
2803219089Spjd		err = zfs_prop_set_special(zc->zc_name, source, pair);
2804219089Spjd		nvlist_free(dummy);
2805219089Spjd		if (err != -1)
2806219089Spjd			return (err); /* special property already handled */
2807219089Spjd	} else {
2808219089Spjd		/*
2809219089Spjd		 * Only check this in the non-received case. We want to allow
2810219089Spjd		 * 'inherit -S' to revert non-inheritable properties like quota
2811219089Spjd		 * and reservation to the received or default values even though
2812219089Spjd		 * they are not considered inheritable.
2813219089Spjd		 */
2814219089Spjd		if (prop != ZPROP_INVAL && !zfs_prop_inheritable(prop))
2815249195Smm			return (SET_ERROR(EINVAL));
2816219089Spjd	}
2817219089Spjd
2818248571Smm	/* property name has been validated by zfs_secpolicy_inherit_prop() */
2819248571Smm	return (dsl_prop_inherit(zc->zc_name, zc->zc_value, source));
2820185029Spjd}
2821185029Spjd
2822185029Spjdstatic int
2823169055Spjdzfs_ioc_pool_set_props(zfs_cmd_t *zc)
2824168404Spjd{
2825185029Spjd	nvlist_t *props;
2826168404Spjd	spa_t *spa;
2827185029Spjd	int error;
2828219089Spjd	nvpair_t *pair;
2829168404Spjd
2830219089Spjd	if (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2831219089Spjd	    zc->zc_iflags, &props))
2832168404Spjd		return (error);
2833168404Spjd
2834209962Smm	/*
2835209962Smm	 * If the only property is the configfile, then just do a spa_lookup()
2836209962Smm	 * to handle the faulted case.
2837209962Smm	 */
2838219089Spjd	pair = nvlist_next_nvpair(props, NULL);
2839219089Spjd	if (pair != NULL && strcmp(nvpair_name(pair),
2840209962Smm	    zpool_prop_to_name(ZPOOL_PROP_CACHEFILE)) == 0 &&
2841219089Spjd	    nvlist_next_nvpair(props, pair) == NULL) {
2842209962Smm		mutex_enter(&spa_namespace_lock);
2843209962Smm		if ((spa = spa_lookup(zc->zc_name)) != NULL) {
2844209962Smm			spa_configfile_set(spa, props, B_FALSE);
2845209962Smm			spa_config_sync(spa, B_FALSE, B_TRUE);
2846209962Smm		}
2847209962Smm		mutex_exit(&spa_namespace_lock);
2848219089Spjd		if (spa != NULL) {
2849219089Spjd			nvlist_free(props);
2850209962Smm			return (0);
2851219089Spjd		}
2852209962Smm	}
2853209962Smm
2854168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2855185029Spjd		nvlist_free(props);
2856168404Spjd		return (error);
2857168404Spjd	}
2858168404Spjd
2859185029Spjd	error = spa_prop_set(spa, props);
2860168404Spjd
2861185029Spjd	nvlist_free(props);
2862168404Spjd	spa_close(spa, FTAG);
2863168404Spjd
2864168404Spjd	return (error);
2865168404Spjd}
2866168404Spjd
2867168404Spjdstatic int
2868169055Spjdzfs_ioc_pool_get_props(zfs_cmd_t *zc)
2869168404Spjd{
2870168404Spjd	spa_t *spa;
2871168404Spjd	int error;
2872168404Spjd	nvlist_t *nvp = NULL;
2873168404Spjd
2874209962Smm	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2875209962Smm		/*
2876209962Smm		 * If the pool is faulted, there may be properties we can still
2877209962Smm		 * get (such as altroot and cachefile), so attempt to get them
2878209962Smm		 * anyway.
2879209962Smm		 */
2880209962Smm		mutex_enter(&spa_namespace_lock);
2881209962Smm		if ((spa = spa_lookup(zc->zc_name)) != NULL)
2882209962Smm			error = spa_prop_get(spa, &nvp);
2883209962Smm		mutex_exit(&spa_namespace_lock);
2884209962Smm	} else {
2885209962Smm		error = spa_prop_get(spa, &nvp);
2886209962Smm		spa_close(spa, FTAG);
2887209962Smm	}
2888168404Spjd
2889168404Spjd	if (error == 0 && zc->zc_nvlist_dst != 0)
2890168404Spjd		error = put_nvlist(zc, nvp);
2891168404Spjd	else
2892249195Smm		error = SET_ERROR(EFAULT);
2893168404Spjd
2894209962Smm	nvlist_free(nvp);
2895168404Spjd	return (error);
2896168404Spjd}
2897168404Spjd
2898185029Spjd/*
2899185029Spjd * inputs:
2900185029Spjd * zc_name		name of filesystem
2901185029Spjd * zc_nvlist_src{_size}	nvlist of delegated permissions
2902185029Spjd * zc_perm_action	allow/unallow flag
2903185029Spjd *
2904185029Spjd * outputs:		none
2905185029Spjd */
2906185029Spjdstatic int
2907185029Spjdzfs_ioc_set_fsacl(zfs_cmd_t *zc)
2908185029Spjd{
2909185029Spjd	int error;
2910185029Spjd	nvlist_t *fsaclnv = NULL;
2911185029Spjd
2912185029Spjd	if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2913219089Spjd	    zc->zc_iflags, &fsaclnv)) != 0)
2914185029Spjd		return (error);
2915185029Spjd
2916185029Spjd	/*
2917185029Spjd	 * Verify nvlist is constructed correctly
2918185029Spjd	 */
2919185029Spjd	if ((error = zfs_deleg_verify_nvlist(fsaclnv)) != 0) {
2920185029Spjd		nvlist_free(fsaclnv);
2921249195Smm		return (SET_ERROR(EINVAL));
2922185029Spjd	}
2923185029Spjd
2924185029Spjd	/*
2925185029Spjd	 * If we don't have PRIV_SYS_MOUNT, then validate
2926185029Spjd	 * that user is allowed to hand out each permission in
2927185029Spjd	 * the nvlist(s)
2928185029Spjd	 */
2929185029Spjd
2930185029Spjd	error = secpolicy_zfs(CRED());
2931248571Smm	if (error != 0) {
2932185029Spjd		if (zc->zc_perm_action == B_FALSE) {
2933185029Spjd			error = dsl_deleg_can_allow(zc->zc_name,
2934185029Spjd			    fsaclnv, CRED());
2935185029Spjd		} else {
2936185029Spjd			error = dsl_deleg_can_unallow(zc->zc_name,
2937185029Spjd			    fsaclnv, CRED());
2938185029Spjd		}
2939185029Spjd	}
2940185029Spjd
2941185029Spjd	if (error == 0)
2942185029Spjd		error = dsl_deleg_set(zc->zc_name, fsaclnv, zc->zc_perm_action);
2943185029Spjd
2944185029Spjd	nvlist_free(fsaclnv);
2945185029Spjd	return (error);
2946185029Spjd}
2947185029Spjd
2948185029Spjd/*
2949185029Spjd * inputs:
2950185029Spjd * zc_name		name of filesystem
2951185029Spjd *
2952185029Spjd * outputs:
2953185029Spjd * zc_nvlist_src{_size}	nvlist of delegated permissions
2954185029Spjd */
2955185029Spjdstatic int
2956185029Spjdzfs_ioc_get_fsacl(zfs_cmd_t *zc)
2957185029Spjd{
2958185029Spjd	nvlist_t *nvp;
2959185029Spjd	int error;
2960185029Spjd
2961185029Spjd	if ((error = dsl_deleg_get(zc->zc_name, &nvp)) == 0) {
2962185029Spjd		error = put_nvlist(zc, nvp);
2963185029Spjd		nvlist_free(nvp);
2964185029Spjd	}
2965185029Spjd
2966185029Spjd	return (error);
2967185029Spjd}
2968185029Spjd
2969185029Spjd/*
2970168404Spjd * Search the vfs list for a specified resource.  Returns a pointer to it
2971168404Spjd * or NULL if no suitable entry is found. The caller of this routine
2972168404Spjd * is responsible for releasing the returned vfs pointer.
2973168404Spjd */
2974168404Spjdstatic vfs_t *
2975168404Spjdzfs_get_vfs(const char *resource)
2976168404Spjd{
2977168404Spjd	vfs_t *vfsp;
2978168404Spjd
2979168404Spjd	mtx_lock(&mountlist_mtx);
2980168404Spjd	TAILQ_FOREACH(vfsp, &mountlist, mnt_list) {
2981185029Spjd		if (strcmp(refstr_value(vfsp->vfs_resource), resource) == 0) {
2982168404Spjd			VFS_HOLD(vfsp);
2983168404Spjd			break;
2984168404Spjd		}
2985168404Spjd	}
2986168404Spjd	mtx_unlock(&mountlist_mtx);
2987168404Spjd	return (vfsp);
2988168404Spjd}
2989168404Spjd
2990185029Spjd/* ARGSUSED */
2991168404Spjdstatic void
2992185029Spjdzfs_create_cb(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx)
2993168404Spjd{
2994185029Spjd	zfs_creat_t *zct = arg;
2995168404Spjd
2996185029Spjd	zfs_create_fs(os, cr, zct->zct_zplprops, tx);
2997168404Spjd}
2998168404Spjd
2999185029Spjd#define	ZFS_PROP_UNDEFINED	((uint64_t)-1)
3000185029Spjd
3001185029Spjd/*
3002185029Spjd * inputs:
3003185029Spjd * createprops		list of properties requested by creator
3004185029Spjd * default_zplver	zpl version to use if unspecified in createprops
3005185029Spjd * fuids_ok		fuids allowed in this version of the spa?
3006185029Spjd * os			parent objset pointer (NULL if root fs)
3007185029Spjd *
3008185029Spjd * outputs:
3009185029Spjd * zplprops	values for the zplprops we attach to the master node object
3010185029Spjd * is_ci	true if requested file system will be purely case-insensitive
3011185029Spjd *
3012185029Spjd * Determine the settings for utf8only, normalization and
3013185029Spjd * casesensitivity.  Specific values may have been requested by the
3014185029Spjd * creator and/or we can inherit values from the parent dataset.  If
3015185029Spjd * the file system is of too early a vintage, a creator can not
3016185029Spjd * request settings for these properties, even if the requested
3017185029Spjd * setting is the default value.  We don't actually want to create dsl
3018185029Spjd * properties for these, so remove them from the source nvlist after
3019185029Spjd * processing.
3020185029Spjd */
3021168404Spjdstatic int
3022209962Smmzfs_fill_zplprops_impl(objset_t *os, uint64_t zplver,
3023219089Spjd    boolean_t fuids_ok, boolean_t sa_ok, nvlist_t *createprops,
3024219089Spjd    nvlist_t *zplprops, boolean_t *is_ci)
3025185029Spjd{
3026185029Spjd	uint64_t sense = ZFS_PROP_UNDEFINED;
3027185029Spjd	uint64_t norm = ZFS_PROP_UNDEFINED;
3028185029Spjd	uint64_t u8 = ZFS_PROP_UNDEFINED;
3029185029Spjd
3030185029Spjd	ASSERT(zplprops != NULL);
3031185029Spjd
3032185029Spjd	/*
3033185029Spjd	 * Pull out creator prop choices, if any.
3034185029Spjd	 */
3035185029Spjd	if (createprops) {
3036185029Spjd		(void) nvlist_lookup_uint64(createprops,
3037185029Spjd		    zfs_prop_to_name(ZFS_PROP_VERSION), &zplver);
3038185029Spjd		(void) nvlist_lookup_uint64(createprops,
3039185029Spjd		    zfs_prop_to_name(ZFS_PROP_NORMALIZE), &norm);
3040185029Spjd		(void) nvlist_remove_all(createprops,
3041185029Spjd		    zfs_prop_to_name(ZFS_PROP_NORMALIZE));
3042185029Spjd		(void) nvlist_lookup_uint64(createprops,
3043185029Spjd		    zfs_prop_to_name(ZFS_PROP_UTF8ONLY), &u8);
3044185029Spjd		(void) nvlist_remove_all(createprops,
3045185029Spjd		    zfs_prop_to_name(ZFS_PROP_UTF8ONLY));
3046185029Spjd		(void) nvlist_lookup_uint64(createprops,
3047185029Spjd		    zfs_prop_to_name(ZFS_PROP_CASE), &sense);
3048185029Spjd		(void) nvlist_remove_all(createprops,
3049185029Spjd		    zfs_prop_to_name(ZFS_PROP_CASE));
3050185029Spjd	}
3051185029Spjd
3052185029Spjd	/*
3053185029Spjd	 * If the zpl version requested is whacky or the file system
3054185029Spjd	 * or pool is version is too "young" to support normalization
3055185029Spjd	 * and the creator tried to set a value for one of the props,
3056185029Spjd	 * error out.
3057185029Spjd	 */
3058185029Spjd	if ((zplver < ZPL_VERSION_INITIAL || zplver > ZPL_VERSION) ||
3059185029Spjd	    (zplver >= ZPL_VERSION_FUID && !fuids_ok) ||
3060219089Spjd	    (zplver >= ZPL_VERSION_SA && !sa_ok) ||
3061185029Spjd	    (zplver < ZPL_VERSION_NORMALIZATION &&
3062185029Spjd	    (norm != ZFS_PROP_UNDEFINED || u8 != ZFS_PROP_UNDEFINED ||
3063185029Spjd	    sense != ZFS_PROP_UNDEFINED)))
3064249195Smm		return (SET_ERROR(ENOTSUP));
3065185029Spjd
3066185029Spjd	/*
3067185029Spjd	 * Put the version in the zplprops
3068185029Spjd	 */
3069185029Spjd	VERIFY(nvlist_add_uint64(zplprops,
3070185029Spjd	    zfs_prop_to_name(ZFS_PROP_VERSION), zplver) == 0);
3071185029Spjd
3072185029Spjd	if (norm == ZFS_PROP_UNDEFINED)
3073185029Spjd		VERIFY(zfs_get_zplprop(os, ZFS_PROP_NORMALIZE, &norm) == 0);
3074185029Spjd	VERIFY(nvlist_add_uint64(zplprops,
3075185029Spjd	    zfs_prop_to_name(ZFS_PROP_NORMALIZE), norm) == 0);
3076185029Spjd
3077185029Spjd	/*
3078185029Spjd	 * If we're normalizing, names must always be valid UTF-8 strings.
3079185029Spjd	 */
3080185029Spjd	if (norm)
3081185029Spjd		u8 = 1;
3082185029Spjd	if (u8 == ZFS_PROP_UNDEFINED)
3083185029Spjd		VERIFY(zfs_get_zplprop(os, ZFS_PROP_UTF8ONLY, &u8) == 0);
3084185029Spjd	VERIFY(nvlist_add_uint64(zplprops,
3085185029Spjd	    zfs_prop_to_name(ZFS_PROP_UTF8ONLY), u8) == 0);
3086185029Spjd
3087185029Spjd	if (sense == ZFS_PROP_UNDEFINED)
3088185029Spjd		VERIFY(zfs_get_zplprop(os, ZFS_PROP_CASE, &sense) == 0);
3089185029Spjd	VERIFY(nvlist_add_uint64(zplprops,
3090185029Spjd	    zfs_prop_to_name(ZFS_PROP_CASE), sense) == 0);
3091185029Spjd
3092185029Spjd	if (is_ci)
3093185029Spjd		*is_ci = (sense == ZFS_CASE_INSENSITIVE);
3094185029Spjd
3095185029Spjd	return (0);
3096185029Spjd}
3097185029Spjd
3098185029Spjdstatic int
3099185029Spjdzfs_fill_zplprops(const char *dataset, nvlist_t *createprops,
3100185029Spjd    nvlist_t *zplprops, boolean_t *is_ci)
3101185029Spjd{
3102219089Spjd	boolean_t fuids_ok, sa_ok;
3103185029Spjd	uint64_t zplver = ZPL_VERSION;
3104185029Spjd	objset_t *os = NULL;
3105185029Spjd	char parentname[MAXNAMELEN];
3106185029Spjd	char *cp;
3107219089Spjd	spa_t *spa;
3108219089Spjd	uint64_t spa_vers;
3109185029Spjd	int error;
3110185029Spjd
3111185029Spjd	(void) strlcpy(parentname, dataset, sizeof (parentname));
3112185029Spjd	cp = strrchr(parentname, '/');
3113185029Spjd	ASSERT(cp != NULL);
3114185029Spjd	cp[0] = '\0';
3115185029Spjd
3116219089Spjd	if ((error = spa_open(dataset, &spa, FTAG)) != 0)
3117219089Spjd		return (error);
3118185029Spjd
3119219089Spjd	spa_vers = spa_version(spa);
3120219089Spjd	spa_close(spa, FTAG);
3121219089Spjd
3122219089Spjd	zplver = zfs_zpl_version_map(spa_vers);
3123219089Spjd	fuids_ok = (zplver >= ZPL_VERSION_FUID);
3124219089Spjd	sa_ok = (zplver >= ZPL_VERSION_SA);
3125219089Spjd
3126185029Spjd	/*
3127185029Spjd	 * Open parent object set so we can inherit zplprop values.
3128185029Spjd	 */
3129219089Spjd	if ((error = dmu_objset_hold(parentname, FTAG, &os)) != 0)
3130185029Spjd		return (error);
3131185029Spjd
3132219089Spjd	error = zfs_fill_zplprops_impl(os, zplver, fuids_ok, sa_ok, createprops,
3133185029Spjd	    zplprops, is_ci);
3134219089Spjd	dmu_objset_rele(os, FTAG);
3135185029Spjd	return (error);
3136185029Spjd}
3137185029Spjd
3138185029Spjdstatic int
3139185029Spjdzfs_fill_zplprops_root(uint64_t spa_vers, nvlist_t *createprops,
3140185029Spjd    nvlist_t *zplprops, boolean_t *is_ci)
3141185029Spjd{
3142219089Spjd	boolean_t fuids_ok;
3143219089Spjd	boolean_t sa_ok;
3144185029Spjd	uint64_t zplver = ZPL_VERSION;
3145185029Spjd	int error;
3146185029Spjd
3147219089Spjd	zplver = zfs_zpl_version_map(spa_vers);
3148219089Spjd	fuids_ok = (zplver >= ZPL_VERSION_FUID);
3149219089Spjd	sa_ok = (zplver >= ZPL_VERSION_SA);
3150185029Spjd
3151219089Spjd	error = zfs_fill_zplprops_impl(NULL, zplver, fuids_ok, sa_ok,
3152219089Spjd	    createprops, zplprops, is_ci);
3153185029Spjd	return (error);
3154185029Spjd}
3155185029Spjd
3156185029Spjd/*
3157248571Smm * innvl: {
3158248571Smm *     "type" -> dmu_objset_type_t (int32)
3159248571Smm *     (optional) "props" -> { prop -> value }
3160248571Smm * }
3161185029Spjd *
3162248571Smm * outnvl: propname -> error code (int32)
3163185029Spjd */
3164185029Spjdstatic int
3165248571Smmzfs_ioc_create(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3166168404Spjd{
3167168404Spjd	int error = 0;
3168248571Smm	zfs_creat_t zct = { 0 };
3169185029Spjd	nvlist_t *nvprops = NULL;
3170185029Spjd	void (*cbfunc)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx);
3171248571Smm	int32_t type32;
3172248571Smm	dmu_objset_type_t type;
3173248571Smm	boolean_t is_insensitive = B_FALSE;
3174168404Spjd
3175248571Smm	if (nvlist_lookup_int32(innvl, "type", &type32) != 0)
3176249195Smm		return (SET_ERROR(EINVAL));
3177248571Smm	type = type32;
3178248571Smm	(void) nvlist_lookup_nvlist(innvl, "props", &nvprops);
3179248571Smm
3180168404Spjd	switch (type) {
3181168404Spjd	case DMU_OST_ZFS:
3182168404Spjd		cbfunc = zfs_create_cb;
3183168404Spjd		break;
3184168404Spjd
3185168404Spjd	case DMU_OST_ZVOL:
3186168404Spjd		cbfunc = zvol_create_cb;
3187168404Spjd		break;
3188168404Spjd
3189168404Spjd	default:
3190168404Spjd		cbfunc = NULL;
3191185029Spjd		break;
3192168404Spjd	}
3193248571Smm	if (strchr(fsname, '@') ||
3194248571Smm	    strchr(fsname, '%'))
3195249195Smm		return (SET_ERROR(EINVAL));
3196168404Spjd
3197185029Spjd	zct.zct_props = nvprops;
3198168404Spjd
3199248571Smm	if (cbfunc == NULL)
3200249195Smm		return (SET_ERROR(EINVAL));
3201168404Spjd
3202248571Smm	if (type == DMU_OST_ZVOL) {
3203248571Smm		uint64_t volsize, volblocksize;
3204185029Spjd
3205248571Smm		if (nvprops == NULL)
3206249195Smm			return (SET_ERROR(EINVAL));
3207248571Smm		if (nvlist_lookup_uint64(nvprops,
3208248571Smm		    zfs_prop_to_name(ZFS_PROP_VOLSIZE), &volsize) != 0)
3209249195Smm			return (SET_ERROR(EINVAL));
3210185029Spjd
3211248571Smm		if ((error = nvlist_lookup_uint64(nvprops,
3212248571Smm		    zfs_prop_to_name(ZFS_PROP_VOLBLOCKSIZE),
3213248571Smm		    &volblocksize)) != 0 && error != ENOENT)
3214249195Smm			return (SET_ERROR(EINVAL));
3215168404Spjd
3216248571Smm		if (error != 0)
3217248571Smm			volblocksize = zfs_prop_default_numeric(
3218248571Smm			    ZFS_PROP_VOLBLOCKSIZE);
3219168404Spjd
3220248571Smm		if ((error = zvol_check_volblocksize(
3221248571Smm		    volblocksize)) != 0 ||
3222248571Smm		    (error = zvol_check_volsize(volsize,
3223248571Smm		    volblocksize)) != 0)
3224248571Smm			return (error);
3225248571Smm	} else if (type == DMU_OST_ZFS) {
3226248571Smm		int error;
3227168404Spjd
3228248571Smm		/*
3229248571Smm		 * We have to have normalization and
3230248571Smm		 * case-folding flags correct when we do the
3231248571Smm		 * file system creation, so go figure them out
3232248571Smm		 * now.
3233248571Smm		 */
3234248571Smm		VERIFY(nvlist_alloc(&zct.zct_zplprops,
3235248571Smm		    NV_UNIQUE_NAME, KM_SLEEP) == 0);
3236248571Smm		error = zfs_fill_zplprops(fsname, nvprops,
3237248571Smm		    zct.zct_zplprops, &is_insensitive);
3238248571Smm		if (error != 0) {
3239248571Smm			nvlist_free(zct.zct_zplprops);
3240248571Smm			return (error);
3241168404Spjd		}
3242168404Spjd	}
3243168404Spjd
3244248571Smm	error = dmu_objset_create(fsname, type,
3245248571Smm	    is_insensitive ? DS_FLAG_CI_DATASET : 0, cbfunc, &zct);
3246248571Smm	nvlist_free(zct.zct_zplprops);
3247248571Smm
3248168404Spjd	/*
3249168404Spjd	 * It would be nice to do this atomically.
3250168404Spjd	 */
3251168404Spjd	if (error == 0) {
3252248571Smm		error = zfs_set_prop_nvlist(fsname, ZPROP_SRC_LOCAL,
3253248571Smm		    nvprops, outnvl);
3254219089Spjd		if (error != 0)
3255248571Smm			(void) dsl_destroy_head(fsname);
3256168404Spjd	}
3257219089Spjd#ifdef __FreeBSD__
3258219089Spjd	if (error == 0 && type == DMU_OST_ZVOL)
3259248571Smm		zvol_create_minors(fsname);
3260219089Spjd#endif
3261168404Spjd	return (error);
3262168404Spjd}
3263168404Spjd
3264185029Spjd/*
3265248571Smm * innvl: {
3266248571Smm *     "origin" -> name of origin snapshot
3267248571Smm *     (optional) "props" -> { prop -> value }
3268248571Smm * }
3269185029Spjd *
3270248571Smm * outnvl: propname -> error code (int32)
3271185029Spjd */
3272185029Spjdstatic int
3273248571Smmzfs_ioc_clone(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
3274168404Spjd{
3275248571Smm	int error = 0;
3276185029Spjd	nvlist_t *nvprops = NULL;
3277248571Smm	char *origin_name;
3278185029Spjd
3279248571Smm	if (nvlist_lookup_string(innvl, "origin", &origin_name) != 0)
3280249195Smm		return (SET_ERROR(EINVAL));
3281248571Smm	(void) nvlist_lookup_nvlist(innvl, "props", &nvprops);
3282185029Spjd
3283248571Smm	if (strchr(fsname, '@') ||
3284248571Smm	    strchr(fsname, '%'))
3285249195Smm		return (SET_ERROR(EINVAL));
3286248571Smm
3287248571Smm	if (dataset_namecheck(origin_name, NULL, NULL) != 0)
3288249195Smm		return (SET_ERROR(EINVAL));
3289248571Smm	error = dmu_objset_clone(fsname, origin_name);
3290248571Smm	if (error != 0)
3291185029Spjd		return (error);
3292185029Spjd
3293248571Smm	/*
3294248571Smm	 * It would be nice to do this atomically.
3295248571Smm	 */
3296248571Smm	if (error == 0) {
3297248571Smm		error = zfs_set_prop_nvlist(fsname, ZPROP_SRC_LOCAL,
3298248571Smm		    nvprops, outnvl);
3299248571Smm		if (error != 0)
3300248571Smm			(void) dsl_destroy_head(fsname);
3301248571Smm	}
3302248571Smm	return (error);
3303248571Smm}
3304185029Spjd
3305248571Smm/*
3306248571Smm * innvl: {
3307248571Smm *     "snaps" -> { snapshot1, snapshot2 }
3308248571Smm *     (optional) "props" -> { prop -> value (string) }
3309248571Smm * }
3310248571Smm *
3311248571Smm * outnvl: snapshot -> error code (int32)
3312248571Smm */
3313248571Smmstatic int
3314248571Smmzfs_ioc_snapshot(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3315248571Smm{
3316248571Smm	nvlist_t *snaps;
3317248571Smm	nvlist_t *props = NULL;
3318248571Smm	int error, poollen;
3319248571Smm	nvpair_t *pair;
3320248571Smm
3321248571Smm	(void) nvlist_lookup_nvlist(innvl, "props", &props);
3322248571Smm	if ((error = zfs_check_userprops(poolname, props)) != 0)
3323248571Smm		return (error);
3324248571Smm
3325248571Smm	if (!nvlist_empty(props) &&
3326248571Smm	    zfs_earlier_version(poolname, SPA_VERSION_SNAP_PROPS))
3327249195Smm		return (SET_ERROR(ENOTSUP));
3328248571Smm
3329248571Smm	if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
3330249195Smm		return (SET_ERROR(EINVAL));
3331248571Smm	poollen = strlen(poolname);
3332248571Smm	for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
3333248571Smm	    pair = nvlist_next_nvpair(snaps, pair)) {
3334248571Smm		const char *name = nvpair_name(pair);
3335248571Smm		const char *cp = strchr(name, '@');
3336248571Smm
3337248571Smm		/*
3338248571Smm		 * The snap name must contain an @, and the part after it must
3339248571Smm		 * contain only valid characters.
3340248571Smm		 */
3341248571Smm		if (cp == NULL || snapshot_namecheck(cp + 1, NULL, NULL) != 0)
3342249195Smm			return (SET_ERROR(EINVAL));
3343248571Smm
3344248571Smm		/*
3345248571Smm		 * The snap must be in the specified pool.
3346248571Smm		 */
3347248571Smm		if (strncmp(name, poolname, poollen) != 0 ||
3348248571Smm		    (name[poollen] != '/' && name[poollen] != '@'))
3349249195Smm			return (SET_ERROR(EXDEV));
3350248571Smm
3351248571Smm		/* This must be the only snap of this fs. */
3352248571Smm		for (nvpair_t *pair2 = nvlist_next_nvpair(snaps, pair);
3353248571Smm		    pair2 != NULL; pair2 = nvlist_next_nvpair(snaps, pair2)) {
3354248571Smm			if (strncmp(name, nvpair_name(pair2), cp - name + 1)
3355248571Smm			    == 0) {
3356249195Smm				return (SET_ERROR(EXDEV));
3357248571Smm			}
3358248571Smm		}
3359185029Spjd	}
3360209962Smm
3361248571Smm	error = dsl_dataset_snapshot(snaps, props, outnvl);
3362185029Spjd	return (error);
3363168404Spjd}
3364168404Spjd
3365248571Smm/*
3366248571Smm * innvl: "message" -> string
3367248571Smm */
3368248571Smm/* ARGSUSED */
3369248571Smmstatic int
3370248571Smmzfs_ioc_log_history(const char *unused, nvlist_t *innvl, nvlist_t *outnvl)
3371168404Spjd{
3372248571Smm	char *message;
3373248571Smm	spa_t *spa;
3374248571Smm	int error;
3375248571Smm	char *poolname;
3376168404Spjd
3377248571Smm	/*
3378248571Smm	 * The poolname in the ioctl is not set, we get it from the TSD,
3379248571Smm	 * which was set at the end of the last successful ioctl that allows
3380248571Smm	 * logging.  The secpolicy func already checked that it is set.
3381248571Smm	 * Only one log ioctl is allowed after each successful ioctl, so
3382248571Smm	 * we clear the TSD here.
3383248571Smm	 */
3384248571Smm	poolname = tsd_get(zfs_allow_log_key);
3385248571Smm	(void) tsd_set(zfs_allow_log_key, NULL);
3386248571Smm	error = spa_open(poolname, &spa, FTAG);
3387248571Smm	strfree(poolname);
3388248571Smm	if (error != 0)
3389248571Smm		return (error);
3390248571Smm
3391248571Smm	if (nvlist_lookup_string(innvl, "message", &message) != 0)  {
3392248571Smm		spa_close(spa, FTAG);
3393249195Smm		return (SET_ERROR(EINVAL));
3394168404Spjd	}
3395168404Spjd
3396248571Smm	if (spa_version(spa) < SPA_VERSION_ZPOOL_HISTORY) {
3397248571Smm		spa_close(spa, FTAG);
3398249195Smm		return (SET_ERROR(ENOTSUP));
3399248571Smm	}
3400168404Spjd
3401248571Smm	error = spa_history_log(spa, message);
3402248571Smm	spa_close(spa, FTAG);
3403248571Smm	return (error);
3404248571Smm}
3405248571Smm
3406248571Smm/*
3407248571Smm * The dp_config_rwlock must not be held when calling this, because the
3408248571Smm * unmount may need to write out data.
3409248571Smm *
3410248571Smm * This function is best-effort.  Callers must deal gracefully if it
3411248571Smm * remains mounted (or is remounted after this call).
3412248571Smm */
3413248571Smmvoid
3414248571Smmzfs_unmount_snap(const char *snapname)
3415248571Smm{
3416248571Smm	vfs_t *vfsp;
3417248571Smm	zfsvfs_t *zfsvfs;
3418248571Smm
3419248571Smm	if (strchr(snapname, '@') == NULL)
3420248571Smm		return;
3421248571Smm
3422248571Smm	vfsp = zfs_get_vfs(snapname);
3423248571Smm	if (vfsp == NULL)
3424248571Smm		return;
3425248571Smm
3426248571Smm	zfsvfs = vfsp->vfs_data;
3427248571Smm	ASSERT(!dsl_pool_config_held(dmu_objset_pool(zfsvfs->z_os)));
3428248571Smm
3429248571Smm	if (vn_vfswlock(vfsp->vfs_vnodecovered) != 0) {
3430168404Spjd		VFS_RELE(vfsp);
3431248571Smm		return;
3432168404Spjd	}
3433248571Smm	VFS_RELE(vfsp);
3434248571Smm
3435248571Smm	/*
3436248571Smm	 * Always force the unmount for snapshots.
3437248571Smm	 */
3438248571Smm
3439248571Smm#ifdef illumos
3440248571Smm	(void) dounmount(vfsp, MS_FORCE, kcred);
3441248571Smm#else
3442248571Smm	mtx_lock(&Giant);	/* dounmount() */
3443248571Smm	dounmount(vfsp, MS_FORCE, curthread);
3444248571Smm	mtx_unlock(&Giant);	/* dounmount() */
3445248571Smm#endif
3446248571Smm}
3447248571Smm
/*
 * Callback adapter around zfs_unmount_snap(): the extra argument is ignored
 * and 0 is always returned, since the unmount itself is best-effort.
 */
/* ARGSUSED */
static int
zfs_unmount_snap_cb(const char *snapname, void *arg)
{
	zfs_unmount_snap(snapname);

	return (0);
}
3455168404Spjd
3456185029Spjd/*
3457248571Smm * When a clone is destroyed, its origin may also need to be destroyed,
3458248571Smm * in which case it must be unmounted.  This routine will do that unmount
3459248571Smm * if necessary.
3460248571Smm */
3461248571Smmvoid
3462248571Smmzfs_destroy_unmount_origin(const char *fsname)
3463248571Smm{
3464248571Smm	int error;
3465248571Smm	objset_t *os;
3466248571Smm	dsl_dataset_t *ds;
3467248571Smm
3468248571Smm	error = dmu_objset_hold(fsname, FTAG, &os);
3469248571Smm	if (error != 0)
3470248571Smm		return;
3471248571Smm	ds = dmu_objset_ds(os);
3472248571Smm	if (dsl_dir_is_clone(ds->ds_dir) && DS_IS_DEFER_DESTROY(ds->ds_prev)) {
3473248571Smm		char originname[MAXNAMELEN];
3474248571Smm		dsl_dataset_name(ds->ds_prev, originname);
3475248571Smm		dmu_objset_rele(os, FTAG);
3476248571Smm		zfs_unmount_snap(originname);
3477248571Smm	} else {
3478248571Smm		dmu_objset_rele(os, FTAG);
3479248571Smm	}
3480248571Smm}
3481248571Smm
3482248571Smm/*
3483248571Smm * innvl: {
3484248571Smm *     "snaps" -> { snapshot1, snapshot2 }
3485248571Smm *     (optional boolean) "defer"
3486248571Smm * }
3487185029Spjd *
3488248571Smm * outnvl: snapshot -> error code (int32)
3489248571Smm *
3490185029Spjd */
3491168404Spjdstatic int
3492248571Smmzfs_ioc_destroy_snaps(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
3493168404Spjd{
3494248571Smm	int poollen;
3495248571Smm	nvlist_t *snaps;
3496228103Smm	nvpair_t *pair;
3497248571Smm	boolean_t defer;
3498168404Spjd
3499248571Smm	if (nvlist_lookup_nvlist(innvl, "snaps", &snaps) != 0)
3500249195Smm		return (SET_ERROR(EINVAL));
3501248571Smm	defer = nvlist_exists(innvl, "defer");
3502228103Smm
3503248571Smm	poollen = strlen(poolname);
3504248571Smm	for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
3505248571Smm	    pair = nvlist_next_nvpair(snaps, pair)) {
3506228103Smm		const char *name = nvpair_name(pair);
3507248571Smm
3508228103Smm		/*
3509248571Smm		 * The snap must be in the specified pool.
3510228103Smm		 */
3511248571Smm		if (strncmp(name, poolname, poollen) != 0 ||
3512248571Smm		    (name[poollen] != '/' && name[poollen] != '@'))
3513249195Smm			return (SET_ERROR(EXDEV));
3514228103Smm
3515248571Smm		zfs_unmount_snap(name);
3516242862Savg		(void) zvol_remove_minor(name);
3517228103Smm	}
3518228103Smm
3519248571Smm	return (dsl_destroy_snapshots_nvl(snaps, defer, outnvl));
3520168404Spjd}
3521168404Spjd
3522185029Spjd/*
3523185029Spjd * inputs:
3524185029Spjd * zc_name		name of dataset to destroy
3525185029Spjd * zc_objset_type	type of objset
3526219089Spjd * zc_defer_destroy	mark for deferred destroy
3527185029Spjd *
3528185029Spjd * outputs:		none
3529185029Spjd */
3530168404Spjdstatic int
3531168404Spjdzfs_ioc_destroy(zfs_cmd_t *zc)
3532168404Spjd{
3533219089Spjd	int err;
3534248571Smm	if (strchr(zc->zc_name, '@') && zc->zc_objset_type == DMU_OST_ZFS)
3535248571Smm		zfs_unmount_snap(zc->zc_name);
3536168404Spjd
3537248571Smm	if (strchr(zc->zc_name, '@'))
3538248571Smm		err = dsl_destroy_snapshot(zc->zc_name, zc->zc_defer_destroy);
3539248571Smm	else
3540248571Smm		err = dsl_destroy_head(zc->zc_name);
3541219089Spjd	if (zc->zc_objset_type == DMU_OST_ZVOL && err == 0)
3542219089Spjd		(void) zvol_remove_minor(zc->zc_name);
3543219089Spjd	return (err);
3544168404Spjd}
3545168404Spjd
3546185029Spjd/*
3547185029Spjd * inputs:
3548185029Spjd * zc_name	name of dataset to rollback (to most recent snapshot)
3549185029Spjd *
3550185029Spjd * outputs:	none
3551185029Spjd */
3552168404Spjdstatic int
3553168404Spjdzfs_ioc_rollback(zfs_cmd_t *zc)
3554168404Spjd{
3555248571Smm	zfsvfs_t *zfsvfs;
3556185029Spjd	int error;
3557185029Spjd
3558209962Smm	if (getzfsvfs(zc->zc_name, &zfsvfs) == 0) {
3559219089Spjd		error = zfs_suspend_fs(zfsvfs);
3560185029Spjd		if (error == 0) {
3561185029Spjd			int resume_err;
3562185029Spjd
3563248571Smm			error = dsl_dataset_rollback(zc->zc_name);
3564219089Spjd			resume_err = zfs_resume_fs(zfsvfs, zc->zc_name);
3565185029Spjd			error = error ? error : resume_err;
3566185029Spjd		}
3567185029Spjd		VFS_RELE(zfsvfs->z_vfs);
3568185029Spjd	} else {
3569248571Smm		error = dsl_dataset_rollback(zc->zc_name);
3570185029Spjd	}
3571248571Smm	return (error);
3572248571Smm}
3573185029Spjd
3574248571Smmstatic int
3575248571Smmrecursive_unmount(const char *fsname, void *arg)
3576248571Smm{
3577248571Smm	const char *snapname = arg;
3578248571Smm	char fullname[MAXNAMELEN];
3579219089Spjd
3580248571Smm	(void) snprintf(fullname, sizeof (fullname), "%s@%s", fsname, snapname);
3581248571Smm	zfs_unmount_snap(fullname);
3582248571Smm	return (0);
3583168404Spjd}
3584168404Spjd
3585185029Spjd/*
3586185029Spjd * inputs:
3587185029Spjd * zc_name	old name of dataset
3588185029Spjd * zc_value	new name of dataset
3589185029Spjd * zc_cookie	recursive flag (only valid for snapshots)
3590185029Spjd *
3591185029Spjd * outputs:	none
3592185029Spjd */
3593168404Spjdstatic int
3594168404Spjdzfs_ioc_rename(zfs_cmd_t *zc)
3595168404Spjd{
3596248571Smm	boolean_t recursive = zc->zc_cookie & 1;
3597248571Smm#ifdef __FreeBSD__
3598248571Smm	boolean_t allow_mounted = zc->zc_cookie & 2;
3599248571Smm#endif
3600248571Smm	char *at;
3601168676Spjd
3602168404Spjd	zc->zc_value[sizeof (zc->zc_value) - 1] = '\0';
3603185029Spjd	if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
3604185029Spjd	    strchr(zc->zc_value, '%'))
3605249195Smm		return (SET_ERROR(EINVAL));
3606168404Spjd
3607248571Smm	at = strchr(zc->zc_name, '@');
3608248571Smm	if (at != NULL) {
3609248571Smm		/* snaps must be in same fs */
3610248571Smm		if (strncmp(zc->zc_name, zc->zc_value, at - zc->zc_name + 1))
3611249195Smm			return (SET_ERROR(EXDEV));
3612248571Smm		*at = '\0';
3613248571Smm#ifdef illumos
3614248571Smm		if (zc->zc_objset_type == DMU_OST_ZFS) {
3615248571Smm#else
3616248571Smm		if (zc->zc_objset_type == DMU_OST_ZFS && allow_mounted) {
3617248571Smm#endif
3618248571Smm			int error = dmu_objset_find(zc->zc_name,
3619248571Smm			    recursive_unmount, at + 1,
3620248571Smm			    recursive ? DS_FIND_CHILDREN : 0);
3621248571Smm			if (error != 0)
3622248571Smm				return (error);
3623248571Smm		}
3624248571Smm		return (dsl_dataset_rename_snapshot(zc->zc_name,
3625248571Smm		    at + 1, strchr(zc->zc_value, '@') + 1, recursive));
3626248571Smm	} else {
3627248571Smm#ifdef illumos
3628248571Smm		if (zc->zc_objset_type == DMU_OST_ZVOL)
3629248571Smm			(void) zvol_remove_minor(zc->zc_name);
3630248571Smm#endif
3631248571Smm		return (dsl_dir_rename(zc->zc_name, zc->zc_value));
3632168404Spjd	}
3633168404Spjd}
3634168404Spjd
3635219089Spjdstatic int
3636219089Spjdzfs_check_settable(const char *dsname, nvpair_t *pair, cred_t *cr)
3637185029Spjd{
3638219089Spjd	const char *propname = nvpair_name(pair);
3639219089Spjd	boolean_t issnap = (strchr(dsname, '@') != NULL);
3640219089Spjd	zfs_prop_t prop = zfs_name_to_prop(propname);
3641219089Spjd	uint64_t intval;
3642219089Spjd	int err;
3643219089Spjd
3644219089Spjd	if (prop == ZPROP_INVAL) {
3645219089Spjd		if (zfs_prop_user(propname)) {
3646219089Spjd			if (err = zfs_secpolicy_write_perms(dsname,
3647219089Spjd			    ZFS_DELEG_PERM_USERPROP, cr))
3648219089Spjd				return (err);
3649219089Spjd			return (0);
3650219089Spjd		}
3651219089Spjd
3652219089Spjd		if (!issnap && zfs_prop_userquota(propname)) {
3653219089Spjd			const char *perm = NULL;
3654219089Spjd			const char *uq_prefix =
3655219089Spjd			    zfs_userquota_prop_prefixes[ZFS_PROP_USERQUOTA];
3656219089Spjd			const char *gq_prefix =
3657219089Spjd			    zfs_userquota_prop_prefixes[ZFS_PROP_GROUPQUOTA];
3658219089Spjd
3659219089Spjd			if (strncmp(propname, uq_prefix,
3660219089Spjd			    strlen(uq_prefix)) == 0) {
3661219089Spjd				perm = ZFS_DELEG_PERM_USERQUOTA;
3662219089Spjd			} else if (strncmp(propname, gq_prefix,
3663219089Spjd			    strlen(gq_prefix)) == 0) {
3664219089Spjd				perm = ZFS_DELEG_PERM_GROUPQUOTA;
3665219089Spjd			} else {
3666219089Spjd				/* USERUSED and GROUPUSED are read-only */
3667249195Smm				return (SET_ERROR(EINVAL));
3668219089Spjd			}
3669219089Spjd
3670219089Spjd			if (err = zfs_secpolicy_write_perms(dsname, perm, cr))
3671219089Spjd				return (err);
3672219089Spjd			return (0);
3673219089Spjd		}
3674219089Spjd
3675249195Smm		return (SET_ERROR(EINVAL));
3676219089Spjd	}
3677219089Spjd
3678219089Spjd	if (issnap)
3679249195Smm		return (SET_ERROR(EINVAL));
3680219089Spjd
3681219089Spjd	if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
3682219089Spjd		/*
3683219089Spjd		 * dsl_prop_get_all_impl() returns properties in this
3684219089Spjd		 * format.
3685219089Spjd		 */
3686219089Spjd		nvlist_t *attrs;
3687219089Spjd		VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
3688219089Spjd		VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3689219089Spjd		    &pair) == 0);
3690219089Spjd	}
3691219089Spjd
3692219089Spjd	/*
3693219089Spjd	 * Check that this value is valid for this pool version
3694219089Spjd	 */
3695219089Spjd	switch (prop) {
3696219089Spjd	case ZFS_PROP_COMPRESSION:
3697219089Spjd		/*
3698219089Spjd		 * If the user specified gzip compression, make sure
3699219089Spjd		 * the SPA supports it. We ignore any errors here since
3700219089Spjd		 * we'll catch them later.
3701219089Spjd		 */
3702219089Spjd		if (nvpair_type(pair) == DATA_TYPE_UINT64 &&
3703219089Spjd		    nvpair_value_uint64(pair, &intval) == 0) {
3704219089Spjd			if (intval >= ZIO_COMPRESS_GZIP_1 &&
3705219089Spjd			    intval <= ZIO_COMPRESS_GZIP_9 &&
3706219089Spjd			    zfs_earlier_version(dsname,
3707219089Spjd			    SPA_VERSION_GZIP_COMPRESSION)) {
3708249195Smm				return (SET_ERROR(ENOTSUP));
3709219089Spjd			}
3710219089Spjd
3711219089Spjd			if (intval == ZIO_COMPRESS_ZLE &&
3712219089Spjd			    zfs_earlier_version(dsname,
3713219089Spjd			    SPA_VERSION_ZLE_COMPRESSION))
3714249195Smm				return (SET_ERROR(ENOTSUP));
3715219089Spjd
3716246586Sdelphij			if (intval == ZIO_COMPRESS_LZ4) {
3717246586Sdelphij				zfeature_info_t *feature =
3718246586Sdelphij				    &spa_feature_table[
3719246586Sdelphij				    SPA_FEATURE_LZ4_COMPRESS];
3720246586Sdelphij				spa_t *spa;
3721246586Sdelphij
3722246586Sdelphij				if ((err = spa_open(dsname, &spa, FTAG)) != 0)
3723246586Sdelphij					return (err);
3724246586Sdelphij
3725246586Sdelphij				if (!spa_feature_is_enabled(spa, feature)) {
3726246586Sdelphij					spa_close(spa, FTAG);
3727249195Smm					return (SET_ERROR(ENOTSUP));
3728246586Sdelphij				}
3729246586Sdelphij				spa_close(spa, FTAG);
3730246586Sdelphij			}
3731246586Sdelphij
3732219089Spjd			/*
3733219089Spjd			 * If this is a bootable dataset then
3734219089Spjd			 * verify that the compression algorithm
3735219089Spjd			 * is supported for booting. We must return
3736219089Spjd			 * something other than ENOTSUP since it
3737219089Spjd			 * implies a downrev pool version.
3738219089Spjd			 */
3739219089Spjd			if (zfs_is_bootfs(dsname) &&
3740219089Spjd			    !BOOTFS_COMPRESS_VALID(intval)) {
3741249195Smm				return (SET_ERROR(ERANGE));
3742219089Spjd			}
3743219089Spjd		}
3744219089Spjd		break;
3745219089Spjd
3746219089Spjd	case ZFS_PROP_COPIES:
3747219089Spjd		if (zfs_earlier_version(dsname, SPA_VERSION_DITTO_BLOCKS))
3748249195Smm			return (SET_ERROR(ENOTSUP));
3749219089Spjd		break;
3750219089Spjd
3751219089Spjd	case ZFS_PROP_DEDUP:
3752219089Spjd		if (zfs_earlier_version(dsname, SPA_VERSION_DEDUP))
3753249195Smm			return (SET_ERROR(ENOTSUP));
3754219089Spjd		break;
3755219089Spjd
3756219089Spjd	case ZFS_PROP_SHARESMB:
3757219089Spjd		if (zpl_earlier_version(dsname, ZPL_VERSION_FUID))
3758249195Smm			return (SET_ERROR(ENOTSUP));
3759219089Spjd		break;
3760219089Spjd
3761219089Spjd	case ZFS_PROP_ACLINHERIT:
3762219089Spjd		if (nvpair_type(pair) == DATA_TYPE_UINT64 &&
3763219089Spjd		    nvpair_value_uint64(pair, &intval) == 0) {
3764219089Spjd			if (intval == ZFS_ACL_PASSTHROUGH_X &&
3765219089Spjd			    zfs_earlier_version(dsname,
3766219089Spjd			    SPA_VERSION_PASSTHROUGH_X))
3767249195Smm				return (SET_ERROR(ENOTSUP));
3768219089Spjd		}
3769219089Spjd		break;
3770219089Spjd	}
3771219089Spjd
3772219089Spjd	return (zfs_secpolicy_setprop(dsname, prop, pair, CRED()));
3773219089Spjd}
3774219089Spjd
3775219089Spjd/*
3776246586Sdelphij * Checks for a race condition to make sure we don't increment a feature flag
3777246586Sdelphij * multiple times.
3778246586Sdelphij */
3779246586Sdelphijstatic int
3780248571Smmzfs_prop_activate_feature_check(void *arg, dmu_tx_t *tx)
3781246586Sdelphij{
3782248571Smm	spa_t *spa = dmu_tx_pool(tx)->dp_spa;
3783248571Smm	zfeature_info_t *feature = arg;
3784246586Sdelphij
3785246586Sdelphij	if (!spa_feature_is_active(spa, feature))
3786246586Sdelphij		return (0);
3787246586Sdelphij	else
3788249195Smm		return (SET_ERROR(EBUSY));
3789246586Sdelphij}
3790246586Sdelphij
3791246586Sdelphij/*
3792246586Sdelphij * The callback invoked on feature activation in the sync task caused by
3793246586Sdelphij * zfs_prop_activate_feature.
3794246586Sdelphij */
3795246586Sdelphijstatic void
3796248571Smmzfs_prop_activate_feature_sync(void *arg, dmu_tx_t *tx)
3797246586Sdelphij{
3798248571Smm	spa_t *spa = dmu_tx_pool(tx)->dp_spa;
3799248571Smm	zfeature_info_t *feature = arg;
3800246586Sdelphij
3801246586Sdelphij	spa_feature_incr(spa, feature, tx);
3802246586Sdelphij}
3803246586Sdelphij
3804246586Sdelphij/*
3805248571Smm * Activates a feature on a pool in response to a property setting. This
3806248571Smm * creates a new sync task which modifies the pool to reflect the feature
3807248571Smm * as being active.
3808248571Smm */
3809248571Smmstatic int
3810248571Smmzfs_prop_activate_feature(spa_t *spa, zfeature_info_t *feature)
3811248571Smm{
3812248571Smm	int err;
3813248571Smm
3814248571Smm	/* EBUSY here indicates that the feature is already active */
3815248571Smm	err = dsl_sync_task(spa_name(spa),
3816248571Smm	    zfs_prop_activate_feature_check, zfs_prop_activate_feature_sync,
3817248571Smm	    feature, 2);
3818248571Smm
3819248571Smm	if (err != 0 && err != EBUSY)
3820248571Smm		return (err);
3821248571Smm	else
3822248571Smm		return (0);
3823248571Smm}
3824248571Smm
3825248571Smm/*
3826219089Spjd * Removes properties from the given props list that fail permission checks
3827219089Spjd * needed to clear them and to restore them in case of a receive error. For each
3828219089Spjd * property, make sure we have both set and inherit permissions.
3829219089Spjd *
3830219089Spjd * Returns the first error encountered if any permission checks fail. If the
3831219089Spjd * caller provides a non-NULL errlist, it also gives the complete list of names
3832219089Spjd * of all the properties that failed a permission check along with the
3833219089Spjd * corresponding error numbers. The caller is responsible for freeing the
3834219089Spjd * returned errlist.
3835219089Spjd *
3836219089Spjd * If every property checks out successfully, zero is returned and the list
3837219089Spjd * pointed at by errlist is NULL.
3838219089Spjd */
3839219089Spjdstatic int
3840219089Spjdzfs_check_clearable(char *dataset, nvlist_t *props, nvlist_t **errlist)
3841219089Spjd{
3842185029Spjd	zfs_cmd_t *zc;
3843219089Spjd	nvpair_t *pair, *next_pair;
3844219089Spjd	nvlist_t *errors;
3845219089Spjd	int err, rv = 0;
3846185029Spjd
3847185029Spjd	if (props == NULL)
3848219089Spjd		return (0);
3849219089Spjd
3850219089Spjd	VERIFY(nvlist_alloc(&errors, NV_UNIQUE_NAME, KM_SLEEP) == 0);
3851219089Spjd
3852185029Spjd	zc = kmem_alloc(sizeof (zfs_cmd_t), KM_SLEEP);
3853185029Spjd	(void) strcpy(zc->zc_name, dataset);
3854219089Spjd	pair = nvlist_next_nvpair(props, NULL);
3855219089Spjd	while (pair != NULL) {
3856219089Spjd		next_pair = nvlist_next_nvpair(props, pair);
3857219089Spjd
3858219089Spjd		(void) strcpy(zc->zc_value, nvpair_name(pair));
3859219089Spjd		if ((err = zfs_check_settable(dataset, pair, CRED())) != 0 ||
3860248571Smm		    (err = zfs_secpolicy_inherit_prop(zc, NULL, CRED())) != 0) {
3861219089Spjd			VERIFY(nvlist_remove_nvpair(props, pair) == 0);
3862219089Spjd			VERIFY(nvlist_add_int32(errors,
3863219089Spjd			    zc->zc_value, err) == 0);
3864219089Spjd		}
3865219089Spjd		pair = next_pair;
3866185029Spjd	}
3867185029Spjd	kmem_free(zc, sizeof (zfs_cmd_t));
3868219089Spjd
3869219089Spjd	if ((pair = nvlist_next_nvpair(errors, NULL)) == NULL) {
3870219089Spjd		nvlist_free(errors);
3871219089Spjd		errors = NULL;
3872219089Spjd	} else {
3873219089Spjd		VERIFY(nvpair_value_int32(pair, &rv) == 0);
3874219089Spjd	}
3875219089Spjd
3876219089Spjd	if (errlist == NULL)
3877219089Spjd		nvlist_free(errors);
3878219089Spjd	else
3879219089Spjd		*errlist = errors;
3880219089Spjd
3881219089Spjd	return (rv);
3882185029Spjd}
3883185029Spjd
3884219089Spjdstatic boolean_t
3885219089Spjdpropval_equals(nvpair_t *p1, nvpair_t *p2)
3886219089Spjd{
3887219089Spjd	if (nvpair_type(p1) == DATA_TYPE_NVLIST) {
3888219089Spjd		/* dsl_prop_get_all_impl() format */
3889219089Spjd		nvlist_t *attrs;
3890219089Spjd		VERIFY(nvpair_value_nvlist(p1, &attrs) == 0);
3891219089Spjd		VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3892219089Spjd		    &p1) == 0);
3893219089Spjd	}
3894219089Spjd
3895219089Spjd	if (nvpair_type(p2) == DATA_TYPE_NVLIST) {
3896219089Spjd		nvlist_t *attrs;
3897219089Spjd		VERIFY(nvpair_value_nvlist(p2, &attrs) == 0);
3898219089Spjd		VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3899219089Spjd		    &p2) == 0);
3900219089Spjd	}
3901219089Spjd
3902219089Spjd	if (nvpair_type(p1) != nvpair_type(p2))
3903219089Spjd		return (B_FALSE);
3904219089Spjd
3905219089Spjd	if (nvpair_type(p1) == DATA_TYPE_STRING) {
3906219089Spjd		char *valstr1, *valstr2;
3907219089Spjd
3908219089Spjd		VERIFY(nvpair_value_string(p1, (char **)&valstr1) == 0);
3909219089Spjd		VERIFY(nvpair_value_string(p2, (char **)&valstr2) == 0);
3910219089Spjd		return (strcmp(valstr1, valstr2) == 0);
3911219089Spjd	} else {
3912219089Spjd		uint64_t intval1, intval2;
3913219089Spjd
3914219089Spjd		VERIFY(nvpair_value_uint64(p1, &intval1) == 0);
3915219089Spjd		VERIFY(nvpair_value_uint64(p2, &intval2) == 0);
3916219089Spjd		return (intval1 == intval2);
3917219089Spjd	}
3918219089Spjd}
3919219089Spjd
3920185029Spjd/*
3921219089Spjd * Remove properties from props if they are not going to change (as determined
3922219089Spjd * by comparison with origprops). Remove them from origprops as well, since we
3923219089Spjd * do not need to clear or restore properties that won't change.
3924219089Spjd */
3925219089Spjdstatic void
3926219089Spjdprops_reduce(nvlist_t *props, nvlist_t *origprops)
3927219089Spjd{
3928219089Spjd	nvpair_t *pair, *next_pair;
3929219089Spjd
3930219089Spjd	if (origprops == NULL)
3931219089Spjd		return; /* all props need to be received */
3932219089Spjd
3933219089Spjd	pair = nvlist_next_nvpair(props, NULL);
3934219089Spjd	while (pair != NULL) {
3935219089Spjd		const char *propname = nvpair_name(pair);
3936219089Spjd		nvpair_t *match;
3937219089Spjd
3938219089Spjd		next_pair = nvlist_next_nvpair(props, pair);
3939219089Spjd
3940219089Spjd		if ((nvlist_lookup_nvpair(origprops, propname,
3941219089Spjd		    &match) != 0) || !propval_equals(pair, match))
3942219089Spjd			goto next; /* need to set received value */
3943219089Spjd
3944219089Spjd		/* don't clear the existing received value */
3945219089Spjd		(void) nvlist_remove_nvpair(origprops, match);
3946219089Spjd		/* don't bother receiving the property */
3947219089Spjd		(void) nvlist_remove_nvpair(props, pair);
3948219089Spjdnext:
3949219089Spjd		pair = next_pair;
3950219089Spjd	}
3951219089Spjd}
3952219089Spjd
3953219089Spjd#ifdef	DEBUG
/*
 * Debug-only fault injection: when set, zfs_ioc_recv() clears it and forces
 * its error to 1 after the stream has been processed, so that the
 * restore-on-error handling of properties runs.
 */
3954219089Spjdstatic boolean_t zfs_ioc_recv_inject_err;
3955219089Spjd#endif
3956219089Spjd
/*
 * Receive a send stream from a file descriptor into the snapshot named by
 * zc_value, optionally applying a set of received properties first and
 * restoring the previous ones if the receive fails.
 */
3957219089Spjd/*
3958185029Spjd * inputs:
3959185029Spjd * zc_name		name of containing filesystem
3960185029Spjd * zc_nvlist_src{_size}	nvlist of properties to apply
3961185029Spjd * zc_value		name of snapshot to create
3962185029Spjd * zc_string		name of clone origin (if DRR_FLAG_CLONE)
3963185029Spjd * zc_cookie		file descriptor to recv from
3964185029Spjd * zc_begin_record	the BEGIN record of the stream (not byteswapped)
3965185029Spjd * zc_guid		force flag
3966219089Spjd * zc_cleanup_fd	cleanup-on-exit file descriptor
3967219089Spjd * zc_action_handle	handle for this guid/ds mapping (or zero on first call)
3968185029Spjd *
3969185029Spjd * outputs:
3970185029Spjd * zc_cookie		number of bytes read
3971219089Spjd * zc_nvlist_dst{_size} error for each unapplied received property
3972219089Spjd * zc_obj		zprop_errflags_t
3973219089Spjd * zc_action_handle	handle for this guid/ds mapping
3974185029Spjd */
3975168404Spjdstatic int
3976185029Spjdzfs_ioc_recv(zfs_cmd_t *zc)
3977168404Spjd{
3978185029Spjd	file_t *fp;
3979185029Spjd	dmu_recv_cookie_t drc;
3980185029Spjd	boolean_t force = (boolean_t)zc->zc_guid;
3981219089Spjd	int fd;
3982219089Spjd	int error = 0;
3983219089Spjd	int props_error = 0;
3984219089Spjd	nvlist_t *errors;
3985185029Spjd	offset_t off;
3986219089Spjd	nvlist_t *props = NULL; /* sent properties */
3987219089Spjd	nvlist_t *origprops = NULL; /* existing properties */
3988248571Smm	char *origin = NULL;
3989185029Spjd	char *tosnap;
3990185029Spjd	char tofs[ZFS_MAXNAMELEN];
3991219089Spjd	boolean_t first_recvd_props = B_FALSE;
3992168404Spjd
	/*
	 * zc_value must pass dataset_namecheck(), contain an '@' and
	 * contain no '%'.
	 */
3993168404Spjd	if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
3994185029Spjd	    strchr(zc->zc_value, '@') == NULL ||
3995185029Spjd	    strchr(zc->zc_value, '%'))
3996249195Smm		return (SET_ERROR(EINVAL));
3997168404Spjd
	/*
	 * Split a copy of zc_value at the '@': tofs keeps the part before
	 * it and tosnap points at the part after it.
	 */
3998185029Spjd	(void) strcpy(tofs, zc->zc_value);
3999185029Spjd	tosnap = strchr(tofs, '@');
4000219089Spjd	*tosnap++ = '\0';
4001185029Spjd
	/* The property nvlist is fetched only if the caller supplied one. */
4002185029Spjd	if (zc->zc_nvlist_src != 0 &&
4003185029Spjd	    (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
4004219089Spjd	    zc->zc_iflags, &props)) != 0)
4005168404Spjd		return (error);
4006168404Spjd
4007185029Spjd	fd = zc->zc_cookie;
4008247602Spjd	fp = getf(fd, CAP_PREAD);
4009185029Spjd	if (fp == NULL) {
4010185029Spjd		nvlist_free(props);
4011249195Smm		return (SET_ERROR(EBADF));
4012185029Spjd	}
4013168404Spjd
	/*
	 * errors collects property failures; it is handed back through
	 * put_nvlist() below when zc_nvlist_dst_size is nonzero.  From here
	 * on every exit goes through "out" so that the lists and the file
	 * reference are released.
	 */
4014219089Spjd	VERIFY(nvlist_alloc(&errors, NV_UNIQUE_NAME, KM_SLEEP) == 0);
4015219089Spjd
	/* An empty zc_string leaves origin NULL. */
4016248571Smm	if (zc->zc_string[0])
4017248571Smm		origin = zc->zc_string;
4018248571Smm
4019248571Smm	error = dmu_recv_begin(tofs, tosnap,
4020248571Smm	    &zc->zc_begin_record, force, origin, &drc);
4021248571Smm	if (error != 0)
4022248571Smm		goto out;
4023248571Smm
4024248571Smm	/*
4025248571Smm	 * Set properties before we receive the stream so that they are applied
4026248571Smm	 * to the new data. Note that we must call dmu_recv_stream() if
4027248571Smm	 * dmu_recv_begin() succeeds.
4028248571Smm	 */
4029248571Smm	if (props != NULL && !drc.drc_newfs) {
4030248571Smm		if (spa_version(dsl_dataset_get_spa(drc.drc_ds)) >=
4031248571Smm		    SPA_VERSION_RECVD_PROPS &&
4032248571Smm		    !dsl_prop_get_hasrecvd(tofs))
4033219089Spjd			first_recvd_props = B_TRUE;
4034219089Spjd
4035185029Spjd		/*
4036219089Spjd		 * If new received properties are supplied, they are to
4037219089Spjd		 * completely replace the existing received properties, so stash
4038219089Spjd		 * away the existing ones.
4039185029Spjd		 */
4040248571Smm		if (dsl_prop_get_received(tofs, &origprops) == 0) {
4041219089Spjd			nvlist_t *errlist = NULL;
4042219089Spjd			/*
4043219089Spjd			 * Don't bother writing a property if its value won't
4044219089Spjd			 * change (and avoid the unnecessary security checks).
4045219089Spjd			 *
4046219089Spjd			 * The first receive after SPA_VERSION_RECVD_PROPS is a
4047219089Spjd			 * special case where we blow away all local properties
4048219089Spjd			 * regardless.
4049219089Spjd			 */
4050219089Spjd			if (!first_recvd_props)
4051219089Spjd				props_reduce(props, origprops);
4052248571Smm			if (zfs_check_clearable(tofs, origprops, &errlist) != 0)
4053219089Spjd				(void) nvlist_merge(errors, errlist, 0);
4054219089Spjd			nvlist_free(errlist);
4055248571Smm
4056248571Smm			if (clear_received_props(tofs, origprops,
4057248571Smm			    first_recvd_props ? NULL : props) != 0)
4058248571Smm				zc->zc_obj |= ZPROP_ERR_NOCLEAR;
4059248571Smm		} else {
4060248571Smm			zc->zc_obj |= ZPROP_ERR_NOCLEAR;
4061219089Spjd		}
4062185029Spjd	}
4063185029Spjd
	/*
	 * Apply the sent properties as received values, but only if the
	 * hasrecvd flag could be set first.
	 */
4064248571Smm	if (props != NULL) {
4065248571Smm		props_error = dsl_prop_set_hasrecvd(tofs);
4066185029Spjd
4067248571Smm		if (props_error == 0) {
4068248571Smm			(void) zfs_set_prop_nvlist(tofs, ZPROP_SRC_RECEIVED,
4069248571Smm			    props, errors);
4070219089Spjd		}
4071219089Spjd	}
4072219089Spjd
4073248571Smm	if (zc->zc_nvlist_dst_size != 0 &&
4074248571Smm	    (nvlist_smush(errors, zc->zc_nvlist_dst_size) != 0 ||
4075248571Smm	    put_nvlist(zc, errors) != 0)) {
4076185029Spjd		/*
4077219089Spjd		 * Caller made zc->zc_nvlist_dst less than the minimum expected
4078219089Spjd		 * size or supplied an invalid address.
4079185029Spjd		 */
4080249195Smm		props_error = SET_ERROR(EINVAL);
4081185029Spjd	}
4082185029Spjd
	/*
	 * Start from the file's current offset; off is passed by reference
	 * to dmu_recv_stream().
	 */
4083185029Spjd	off = fp->f_offset;
4084219089Spjd	error = dmu_recv_stream(&drc, fp, &off, zc->zc_cleanup_fd,
4085219089Spjd	    &zc->zc_action_handle);
4086185029Spjd
4087219089Spjd	if (error == 0) {
4088219089Spjd		zfsvfs_t *zfsvfs = NULL;
4089185029Spjd
4090219089Spjd		if (getzfsvfs(tofs, &zfsvfs) == 0) {
4091219089Spjd			/* online recv */
4092219089Spjd			int end_err;
4093185029Spjd
4094219089Spjd			error = zfs_suspend_fs(zfsvfs);
4095219089Spjd			/*
4096219089Spjd			 * If the suspend fails, then the recv_end will
4097219089Spjd			 * likely also fail, and clean up after itself.
4098219089Spjd			 */
4099219089Spjd			end_err = dmu_recv_end(&drc);
4100219089Spjd			if (error == 0)
4101219089Spjd				error = zfs_resume_fs(zfsvfs, tofs);
4102219089Spjd			error = error ? error : end_err;
4103219089Spjd			VFS_RELE(zfsvfs->z_vfs);
4104219089Spjd		} else {
4105185029Spjd			error = dmu_recv_end(&drc);
4106185029Spjd		}
4107185029Spjd	}
4108185029Spjd
	/*
	 * Report the number of bytes consumed as the offset delta, and store
	 * the new offset back only if it lies within [0, MAXOFFSET_T].
	 */
4109185029Spjd	zc->zc_cookie = off - fp->f_offset;
4110185029Spjd	if (off >= 0 && off <= MAXOFFSET_T)
4111185029Spjd		fp->f_offset = off;
4112185029Spjd
4113219089Spjd#ifdef	DEBUG
4114219089Spjd	if (zfs_ioc_recv_inject_err) {
4115219089Spjd		zfs_ioc_recv_inject_err = B_FALSE;
4116219089Spjd		error = 1;
4117219089Spjd	}
4118219089Spjd#endif
4119243497Savg
4120243497Savg#ifdef __FreeBSD__
4121243497Savg	if (error == 0)
4122243497Savg		zvol_create_minors(tofs);
4123243497Savg#endif
4124243497Savg
4125185029Spjd	/*
4126185029Spjd	 * On error, restore the original props.
4127185029Spjd	 */
4128248571Smm	if (error != 0 && props != NULL && !drc.drc_newfs) {
4129248571Smm		if (clear_received_props(tofs, props, NULL) != 0) {
4130248571Smm			/*
4131248571Smm			 * We failed to clear the received properties.
4132248571Smm			 * Since we may have left a $recvd value on the
4133248571Smm			 * system, we can't clear the $hasrecvd flag.
4134248571Smm			 */
4135219089Spjd			zc->zc_obj |= ZPROP_ERR_NORESTORE;
4136248571Smm		} else if (first_recvd_props) {
4137248571Smm			dsl_prop_unset_hasrecvd(tofs);
4138219089Spjd		}
4139219089Spjd
4140219089Spjd		if (origprops == NULL && !drc.drc_newfs) {
4141219089Spjd			/* We failed to stash the original properties. */
4142219089Spjd			zc->zc_obj |= ZPROP_ERR_NORESTORE;
4143219089Spjd		}
4144219089Spjd
4145219089Spjd		/*
4146219089Spjd		 * dsl_props_set() will not convert RECEIVED to LOCAL on or
4147219089Spjd		 * after SPA_VERSION_RECVD_PROPS, so we need to specify LOCAL
4148219089Spjd		 * explictly if we're restoring local properties cleared in the
4149219089Spjd		 * first new-style receive.
4150219089Spjd		 */
4151219089Spjd		if (origprops != NULL &&
4152219089Spjd		    zfs_set_prop_nvlist(tofs, (first_recvd_props ?
4153219089Spjd		    ZPROP_SRC_LOCAL : ZPROP_SRC_RECEIVED),
4154219089Spjd		    origprops, NULL) != 0) {
4155219089Spjd			/*
4156219089Spjd			 * We stashed the original properties but failed to
4157219089Spjd			 * restore them.
4158219089Spjd			 */
4159219089Spjd			zc->zc_obj |= ZPROP_ERR_NORESTORE;
4160219089Spjd		}
4161185029Spjd	}
4162185029Spjdout:
4163185029Spjd	nvlist_free(props);
4164185029Spjd	nvlist_free(origprops);
4165219089Spjd	nvlist_free(errors);
4166219089Spjd	releasef(fd);
4167219089Spjd
	/* A receive error takes precedence over a property error. */
4168219089Spjd	if (error == 0)
4169219089Spjd		error = props_error;
4170219089Spjd
4171168404Spjd	return (error);
4172168404Spjd}
4173168404Spjd
4174185029Spjd/*
4175185029Spjd * inputs:
4176185029Spjd * zc_name	name of snapshot to send
4177185029Spjd * zc_cookie	file descriptor to send stream to
4178219089Spjd * zc_obj	fromorigin flag (mutually exclusive with zc_fromobj)
4179219089Spjd * zc_sendobj	objsetid of snapshot to send
4180219089Spjd * zc_fromobj	objsetid of incremental fromsnap (may be zero)
4181228103Smm * zc_guid	if set, estimate size of stream only.  zc_cookie is ignored.
4182228103Smm *		output size in zc_objset_type.
4183185029Spjd *
4184185029Spjd * outputs: none
4185185029Spjd */
4186168404Spjdstatic int
4187185029Spjdzfs_ioc_send(zfs_cmd_t *zc)
4188168404Spjd{
4189185029Spjd	int error;
4190185029Spjd	offset_t off;
4191228103Smm	boolean_t estimate = (zc->zc_guid != 0);
4192168404Spjd
4193248571Smm	if (zc->zc_obj != 0) {
4194248571Smm		dsl_pool_t *dp;
4195248571Smm		dsl_dataset_t *tosnap;
4196168404Spjd
4197248571Smm		error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4198248571Smm		if (error != 0)
4199248571Smm			return (error);
4200168404Spjd
4201248571Smm		error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &tosnap);
4202248571Smm		if (error != 0) {
4203248571Smm			dsl_pool_rele(dp, FTAG);
4204248571Smm			return (error);
4205248571Smm		}
4206248571Smm
4207248571Smm		if (dsl_dir_is_clone(tosnap->ds_dir))
4208248571Smm			zc->zc_fromobj = tosnap->ds_dir->dd_phys->dd_origin_obj;
4209248571Smm		dsl_dataset_rele(tosnap, FTAG);
4210248571Smm		dsl_pool_rele(dp, FTAG);
4211219089Spjd	}
4212219089Spjd
4213248571Smm	if (estimate) {
4214248571Smm		dsl_pool_t *dp;
4215248571Smm		dsl_dataset_t *tosnap;
4216248571Smm		dsl_dataset_t *fromsnap = NULL;
4217248571Smm
4218248571Smm		error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4219248571Smm		if (error != 0)
4220168404Spjd			return (error);
4221248571Smm
4222248571Smm		error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &tosnap);
4223248571Smm		if (error != 0) {
4224248571Smm			dsl_pool_rele(dp, FTAG);
4225219089Spjd			return (error);
4226219089Spjd		}
4227168404Spjd
4228248571Smm		if (zc->zc_fromobj != 0) {
4229248571Smm			error = dsl_dataset_hold_obj(dp, zc->zc_fromobj,
4230248571Smm			    FTAG, &fromsnap);
4231248571Smm			if (error != 0) {
4232248571Smm				dsl_dataset_rele(tosnap, FTAG);
4233248571Smm				dsl_pool_rele(dp, FTAG);
4234248571Smm				return (error);
4235248571Smm			}
4236248571Smm		}
4237248571Smm
4238248571Smm		error = dmu_send_estimate(tosnap, fromsnap,
4239228103Smm		    &zc->zc_objset_type);
4240248571Smm
4241248571Smm		if (fromsnap != NULL)
4242248571Smm			dsl_dataset_rele(fromsnap, FTAG);
4243248571Smm		dsl_dataset_rele(tosnap, FTAG);
4244248571Smm		dsl_pool_rele(dp, FTAG);
4245228103Smm	} else {
4246247602Spjd		file_t *fp = getf(zc->zc_cookie, CAP_WRITE);
4247248571Smm		if (fp == NULL)
4248249195Smm			return (SET_ERROR(EBADF));
4249168404Spjd
4250228103Smm		off = fp->f_offset;
4251248571Smm		error = dmu_send_obj(zc->zc_name, zc->zc_sendobj,
4252248571Smm#ifdef illumos
4253248571Smm		    zc->zc_fromobj, zc->zc_cookie, fp->f_vnode, &off);
4254248571Smm#else
4255248571Smm		    zc->zc_fromobj, zc->zc_cookie, fp, &off);
4256248571Smm#endif
4257168404Spjd
4258228103Smm		if (off >= 0 && off <= MAXOFFSET_T)
4259228103Smm			fp->f_offset = off;
4260228103Smm		releasef(zc->zc_cookie);
4261228103Smm	}
4262168404Spjd	return (error);
4263168404Spjd}
4264168404Spjd
4265235222Smm/*
4266235222Smm * inputs:
4267235222Smm * zc_name	name of snapshot on which to report progress
4268235222Smm * zc_cookie	file descriptor of send stream
4269235222Smm *
4270235222Smm * outputs:
4271235222Smm * zc_cookie	number of bytes written in send stream thus far
4272235222Smm */
4273168404Spjdstatic int
4274235222Smmzfs_ioc_send_progress(zfs_cmd_t *zc)
4275235222Smm{
4276248571Smm	dsl_pool_t *dp;
4277235222Smm	dsl_dataset_t *ds;
4278235222Smm	dmu_sendarg_t *dsp = NULL;
4279235222Smm	int error;
4280235222Smm
4281248571Smm	error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
4282248571Smm	if (error != 0)
4283235222Smm		return (error);
4284235222Smm
4285248571Smm	error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &ds);
4286248571Smm	if (error != 0) {
4287248571Smm		dsl_pool_rele(dp, FTAG);
4288248571Smm		return (error);
4289248571Smm	}
4290248571Smm
4291235222Smm	mutex_enter(&ds->ds_sendstream_lock);
4292235222Smm
4293235222Smm	/*
4294235222Smm	 * Iterate over all the send streams currently active on this dataset.
4295235222Smm	 * If there's one which matches the specified file descriptor _and_ the
4296235222Smm	 * stream was started by the current process, return the progress of
4297235222Smm	 * that stream.
4298235222Smm	 */
4299235222Smm	for (dsp = list_head(&ds->ds_sendstreams); dsp != NULL;
4300235222Smm	    dsp = list_next(&ds->ds_sendstreams, dsp)) {
4301235222Smm		if (dsp->dsa_outfd == zc->zc_cookie &&
4302235222Smm		    dsp->dsa_proc == curproc)
4303235222Smm			break;
4304235222Smm	}
4305235222Smm
4306235222Smm	if (dsp != NULL)
4307235222Smm		zc->zc_cookie = *(dsp->dsa_off);
4308235222Smm	else
4309249195Smm		error = SET_ERROR(ENOENT);
4310235222Smm
4311235222Smm	mutex_exit(&ds->ds_sendstream_lock);
4312235222Smm	dsl_dataset_rele(ds, FTAG);
4313248571Smm	dsl_pool_rele(dp, FTAG);
4314235222Smm	return (error);
4315235222Smm}
4316235222Smm
4317235222Smmstatic int
4318168404Spjdzfs_ioc_inject_fault(zfs_cmd_t *zc)
4319168404Spjd{
4320168404Spjd	int id, error;
4321168404Spjd
4322168404Spjd	error = zio_inject_fault(zc->zc_name, (int)zc->zc_guid, &id,
4323168404Spjd	    &zc->zc_inject_record);
4324168404Spjd
4325168404Spjd	if (error == 0)
4326168404Spjd		zc->zc_guid = (uint64_t)id;
4327168404Spjd
4328168404Spjd	return (error);
4329168404Spjd}
4330168404Spjd
4331168404Spjdstatic int
4332168404Spjdzfs_ioc_clear_fault(zfs_cmd_t *zc)
4333168404Spjd{
4334168404Spjd	return (zio_clear_fault((int)zc->zc_guid));
4335168404Spjd}
4336168404Spjd
4337168404Spjdstatic int
4338168404Spjdzfs_ioc_inject_list_next(zfs_cmd_t *zc)
4339168404Spjd{
4340168404Spjd	int id = (int)zc->zc_guid;
4341168404Spjd	int error;
4342168404Spjd
4343168404Spjd	error = zio_inject_list_next(&id, zc->zc_name, sizeof (zc->zc_name),
4344168404Spjd	    &zc->zc_inject_record);
4345168404Spjd
4346168404Spjd	zc->zc_guid = id;
4347168404Spjd
4348168404Spjd	return (error);
4349168404Spjd}
4350168404Spjd
4351168404Spjdstatic int
4352168404Spjdzfs_ioc_error_log(zfs_cmd_t *zc)
4353168404Spjd{
4354168404Spjd	spa_t *spa;
4355168404Spjd	int error;
4356168404Spjd	size_t count = (size_t)zc->zc_nvlist_dst_size;
4357168404Spjd
4358168404Spjd	if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
4359168404Spjd		return (error);
4360168404Spjd
4361168404Spjd	error = spa_get_errlog(spa, (void *)(uintptr_t)zc->zc_nvlist_dst,
4362168404Spjd	    &count);
4363168404Spjd	if (error == 0)
4364168404Spjd		zc->zc_nvlist_dst_size = count;
4365168404Spjd	else
4366168404Spjd		zc->zc_nvlist_dst_size = spa_get_errlog_size(spa);
4367168404Spjd
4368168404Spjd	spa_close(spa, FTAG);
4369168404Spjd
4370168404Spjd	return (error);
4371168404Spjd}
4372168404Spjd
4373168404Spjdstatic int
4374168404Spjdzfs_ioc_clear(zfs_cmd_t *zc)
4375168404Spjd{
4376168404Spjd	spa_t *spa;
4377168404Spjd	vdev_t *vd;
4378168404Spjd	int error;
4379168404Spjd
4380185029Spjd	/*
4381185029Spjd	 * On zpool clear we also fix up missing slogs
4382185029Spjd	 */
4383185029Spjd	mutex_enter(&spa_namespace_lock);
4384185029Spjd	spa = spa_lookup(zc->zc_name);
4385185029Spjd	if (spa == NULL) {
4386185029Spjd		mutex_exit(&spa_namespace_lock);
4387249195Smm		return (SET_ERROR(EIO));
4388185029Spjd	}
4389219089Spjd	if (spa_get_log_state(spa) == SPA_LOG_MISSING) {
4390185029Spjd		/* we need to let spa_open/spa_load clear the chains */
4391219089Spjd		spa_set_log_state(spa, SPA_LOG_CLEAR);
4392185029Spjd	}
4393219089Spjd	spa->spa_last_open_failed = 0;
4394185029Spjd	mutex_exit(&spa_namespace_lock);
4395185029Spjd
4396219089Spjd	if (zc->zc_cookie & ZPOOL_NO_REWIND) {
4397219089Spjd		error = spa_open(zc->zc_name, &spa, FTAG);
4398219089Spjd	} else {
4399219089Spjd		nvlist_t *policy;
4400219089Spjd		nvlist_t *config = NULL;
4401219089Spjd
4402219089Spjd		if (zc->zc_nvlist_src == 0)
4403249195Smm			return (SET_ERROR(EINVAL));
4404219089Spjd
4405219089Spjd		if ((error = get_nvlist(zc->zc_nvlist_src,
4406219089Spjd		    zc->zc_nvlist_src_size, zc->zc_iflags, &policy)) == 0) {
4407219089Spjd			error = spa_open_rewind(zc->zc_name, &spa, FTAG,
4408219089Spjd			    policy, &config);
4409219089Spjd			if (config != NULL) {
4410219089Spjd				int err;
4411219089Spjd
4412219089Spjd				if ((err = put_nvlist(zc, config)) != 0)
4413219089Spjd					error = err;
4414219089Spjd				nvlist_free(config);
4415219089Spjd			}
4416219089Spjd			nvlist_free(policy);
4417219089Spjd		}
4418219089Spjd	}
4419219089Spjd
4420248571Smm	if (error != 0)
4421168404Spjd		return (error);
4422168404Spjd
4423219089Spjd	spa_vdev_state_enter(spa, SCL_NONE);
4424168404Spjd
4425168404Spjd	if (zc->zc_guid == 0) {
4426168404Spjd		vd = NULL;
4427185029Spjd	} else {
4428185029Spjd		vd = spa_lookup_by_guid(spa, zc->zc_guid, B_TRUE);
4429185029Spjd		if (vd == NULL) {
4430185029Spjd			(void) spa_vdev_state_exit(spa, NULL, ENODEV);
4431185029Spjd			spa_close(spa, FTAG);
4432249195Smm			return (SET_ERROR(ENODEV));
4433185029Spjd		}
4434168404Spjd	}
4435168404Spjd
4436168404Spjd	vdev_clear(spa, vd);
4437168404Spjd
4438185029Spjd	(void) spa_vdev_state_exit(spa, NULL, 0);
4439168404Spjd
4440185029Spjd	/*
4441185029Spjd	 * Resume any suspended I/Os.
4442185029Spjd	 */
4443209962Smm	if (zio_resume(spa) != 0)
4444249195Smm		error = SET_ERROR(EIO);
4445185029Spjd
4446168404Spjd	spa_close(spa, FTAG);
4447168404Spjd
4448209962Smm	return (error);
4449168404Spjd}
4450168404Spjd
4451236155Smmstatic int
4452236155Smmzfs_ioc_pool_reopen(zfs_cmd_t *zc)
4453236155Smm{
4454236155Smm	spa_t *spa;
4455236155Smm	int error;
4456236155Smm
4457236155Smm	error = spa_open(zc->zc_name, &spa, FTAG);
4458248571Smm	if (error != 0)
4459236155Smm		return (error);
4460236155Smm
4461236155Smm	spa_vdev_state_enter(spa, SCL_NONE);
4462240133Smm
4463240133Smm	/*
4464240133Smm	 * If a resilver is already in progress then set the
4465240133Smm	 * spa_scrub_reopen flag to B_TRUE so that we don't restart
4466240133Smm	 * the scan as a side effect of the reopen. Otherwise, let
4467240133Smm	 * vdev_open() decided if a resilver is required.
4468240133Smm	 */
4469240133Smm	spa->spa_scrub_reopen = dsl_scan_resilvering(spa->spa_dsl_pool);
4470236155Smm	vdev_reopen(spa->spa_root_vdev);
4471240133Smm	spa->spa_scrub_reopen = B_FALSE;
4472240133Smm
4473236155Smm	(void) spa_vdev_state_exit(spa, NULL, 0);
4474236155Smm	spa_close(spa, FTAG);
4475236155Smm	return (0);
4476236155Smm}
4477185029Spjd/*
4478185029Spjd * inputs:
4479185029Spjd * zc_name	name of filesystem
4480185029Spjd * zc_value	name of origin snapshot
4481185029Spjd *
4482219089Spjd * outputs:
4483219089Spjd * zc_string	name of conflicting snapshot, if there is one
4484185029Spjd */
4485168404Spjdstatic int
4486168404Spjdzfs_ioc_promote(zfs_cmd_t *zc)
4487168404Spjd{
4488168404Spjd	char *cp;
4489168404Spjd
4490168404Spjd	/*
4491168404Spjd	 * We don't need to unmount *all* the origin fs's snapshots, but
4492168404Spjd	 * it's easier.
4493168404Spjd	 */
4494168404Spjd	cp = strchr(zc->zc_value, '@');
4495168404Spjd	if (cp)
4496168404Spjd		*cp = '\0';
4497168404Spjd	(void) dmu_objset_find(zc->zc_value,
4498248571Smm	    zfs_unmount_snap_cb, NULL, DS_FIND_SNAPSHOTS);
4499219089Spjd	return (dsl_dataset_promote(zc->zc_name, zc->zc_string));
4500168404Spjd}
4501168404Spjd
4502185029Spjd/*
4503209962Smm * Retrieve a single {user|group}{used|quota}@... property.
4504209962Smm *
4505209962Smm * inputs:
4506209962Smm * zc_name	name of filesystem
4507209962Smm * zc_objset_type zfs_userquota_prop_t
4508209962Smm * zc_value	domain name (eg. "S-1-234-567-89")
4509209962Smm * zc_guid	RID/UID/GID
4510209962Smm *
4511209962Smm * outputs:
4512209962Smm * zc_cookie	property value
4513209962Smm */
4514209962Smmstatic int
4515209962Smmzfs_ioc_userspace_one(zfs_cmd_t *zc)
4516209962Smm{
4517209962Smm	zfsvfs_t *zfsvfs;
4518209962Smm	int error;
4519209962Smm
4520209962Smm	if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
4521249195Smm		return (SET_ERROR(EINVAL));
4522209962Smm
4523219089Spjd	error = zfsvfs_hold(zc->zc_name, FTAG, &zfsvfs, B_FALSE);
4524248571Smm	if (error != 0)
4525209962Smm		return (error);
4526209962Smm
4527209962Smm	error = zfs_userspace_one(zfsvfs,
4528209962Smm	    zc->zc_objset_type, zc->zc_value, zc->zc_guid, &zc->zc_cookie);
4529209962Smm	zfsvfs_rele(zfsvfs, FTAG);
4530209962Smm
4531209962Smm	return (error);
4532209962Smm}
4533209962Smm
4534209962Smm/*
4535209962Smm * inputs:
4536209962Smm * zc_name		name of filesystem
4537209962Smm * zc_cookie		zap cursor
4538209962Smm * zc_objset_type	zfs_userquota_prop_t
4539209962Smm * zc_nvlist_dst[_size] buffer to fill (not really an nvlist)
4540209962Smm *
4541209962Smm * outputs:
4542209962Smm * zc_nvlist_dst[_size]	data buffer (array of zfs_useracct_t)
4543209962Smm * zc_cookie	zap cursor
4544209962Smm */
4545209962Smmstatic int
4546209962Smmzfs_ioc_userspace_many(zfs_cmd_t *zc)
4547209962Smm{
4548209962Smm	zfsvfs_t *zfsvfs;
4549219089Spjd	int bufsize = zc->zc_nvlist_dst_size;
4550209962Smm
4551219089Spjd	if (bufsize <= 0)
4552249195Smm		return (SET_ERROR(ENOMEM));
4553219089Spjd
4554219089Spjd	int error = zfsvfs_hold(zc->zc_name, FTAG, &zfsvfs, B_FALSE);
4555248571Smm	if (error != 0)
4556209962Smm		return (error);
4557209962Smm
4558209962Smm	void *buf = kmem_alloc(bufsize, KM_SLEEP);
4559209962Smm
4560209962Smm	error = zfs_userspace_many(zfsvfs, zc->zc_objset_type, &zc->zc_cookie,
4561209962Smm	    buf, &zc->zc_nvlist_dst_size);
4562209962Smm
4563209962Smm	if (error == 0) {
4564221409Smarius		error = ddi_copyout(buf,
4565209962Smm		    (void *)(uintptr_t)zc->zc_nvlist_dst,
4566221409Smarius		    zc->zc_nvlist_dst_size, zc->zc_iflags);
4567209962Smm	}
4568209962Smm	kmem_free(buf, bufsize);
4569209962Smm	zfsvfs_rele(zfsvfs, FTAG);
4570209962Smm
4571209962Smm	return (error);
4572209962Smm}
4573209962Smm
4574209962Smm/*
4575209962Smm * inputs:
4576209962Smm * zc_name		name of filesystem
4577209962Smm *
4578209962Smm * outputs:
4579209962Smm * none
4580209962Smm */
4581209962Smmstatic int
4582209962Smmzfs_ioc_userspace_upgrade(zfs_cmd_t *zc)
4583209962Smm{
4584209962Smm	objset_t *os;
4585219089Spjd	int error = 0;
4586209962Smm	zfsvfs_t *zfsvfs;
4587209962Smm
4588209962Smm	if (getzfsvfs(zc->zc_name, &zfsvfs) == 0) {
4589219089Spjd		if (!dmu_objset_userused_enabled(zfsvfs->z_os)) {
4590209962Smm			/*
4591209962Smm			 * If userused is not enabled, it may be because the
4592209962Smm			 * objset needs to be closed & reopened (to grow the
4593209962Smm			 * objset_phys_t).  Suspend/resume the fs will do that.
4594209962Smm			 */
4595219089Spjd			error = zfs_suspend_fs(zfsvfs);
4596219089Spjd			if (error == 0)
4597219089Spjd				error = zfs_resume_fs(zfsvfs, zc->zc_name);
4598209962Smm		}
4599209962Smm		if (error == 0)
4600209962Smm			error = dmu_objset_userspace_upgrade(zfsvfs->z_os);
4601209962Smm		VFS_RELE(zfsvfs->z_vfs);
4602209962Smm	} else {
4603219089Spjd		/* XXX kind of reading contents without owning */
4604219089Spjd		error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4605248571Smm		if (error != 0)
4606209962Smm			return (error);
4607209962Smm
4608209962Smm		error = dmu_objset_userspace_upgrade(os);
4609219089Spjd		dmu_objset_rele(os, FTAG);
4610209962Smm	}
4611209962Smm
4612209962Smm	return (error);
4613209962Smm}
4614209962Smm
#ifdef sun
/*
 * We don't want a hard dependency on a few special symbols in the
 * sharefs, nfs, and smbsrv modules.  They are resolved on demand, when
 * the first file system is shared, and cached in the function pointers
 * and module handles below.
 * None of sharefs, nfs, or smbsrv is an unloadable module.
 */
int (*znfsexport_fs)(void *arg);
int (*zshare_fs)(enum sharefs_sys_op, share_t *, uint32_t);
int (*zsmbexport_fs)(void *arg, boolean_t add_share);

/* Set to 1 once the NFS / SMB symbols above have been resolved. */
int zfs_nfsshare_inited;
int zfs_smbshare_inited;

/* Module handles; NULL until the module has been opened. */
ddi_modhandle_t nfs_mod;
ddi_modhandle_t sharefs_mod;
ddi_modhandle_t smbsrv_mod;
#endif	/* sun */
/* Held while the share modules and symbols above are being resolved. */
kmutex_t zfs_share_lock;
4635185029Spjd
4636209962Smm#ifdef sun
4637168404Spjdstatic int
4638185029Spjdzfs_init_sharefs()
4639185029Spjd{
4640185029Spjd	int error;
4641185029Spjd
4642185029Spjd	ASSERT(MUTEX_HELD(&zfs_share_lock));
4643185029Spjd	/* Both NFS and SMB shares also require sharetab support. */
4644185029Spjd	if (sharefs_mod == NULL && ((sharefs_mod =
4645185029Spjd	    ddi_modopen("fs/sharefs",
4646185029Spjd	    KRTLD_MODE_FIRST, &error)) == NULL)) {
4647249195Smm		return (SET_ERROR(ENOSYS));
4648185029Spjd	}
4649185029Spjd	if (zshare_fs == NULL && ((zshare_fs =
4650185029Spjd	    (int (*)(enum sharefs_sys_op, share_t *, uint32_t))
4651185029Spjd	    ddi_modsym(sharefs_mod, "sharefs_impl", &error)) == NULL)) {
4652249195Smm		return (SET_ERROR(ENOSYS));
4653185029Spjd	}
4654185029Spjd	return (0);
4655185029Spjd}
4656219089Spjd#endif	/* sun */
4657185029Spjd
4658185029Spjdstatic int
4659185029Spjdzfs_ioc_share(zfs_cmd_t *zc)
4660185029Spjd{
4661209962Smm#ifdef sun
4662185029Spjd	int error;
4663185029Spjd	int opcode;
4664185029Spjd
4665185029Spjd	switch (zc->zc_share.z_sharetype) {
4666185029Spjd	case ZFS_SHARE_NFS:
4667185029Spjd	case ZFS_UNSHARE_NFS:
4668185029Spjd		if (zfs_nfsshare_inited == 0) {
4669185029Spjd			mutex_enter(&zfs_share_lock);
4670185029Spjd			if (nfs_mod == NULL && ((nfs_mod = ddi_modopen("fs/nfs",
4671185029Spjd			    KRTLD_MODE_FIRST, &error)) == NULL)) {
4672185029Spjd				mutex_exit(&zfs_share_lock);
4673249195Smm				return (SET_ERROR(ENOSYS));
4674185029Spjd			}
4675185029Spjd			if (znfsexport_fs == NULL &&
4676185029Spjd			    ((znfsexport_fs = (int (*)(void *))
4677185029Spjd			    ddi_modsym(nfs_mod,
4678185029Spjd			    "nfs_export", &error)) == NULL)) {
4679185029Spjd				mutex_exit(&zfs_share_lock);
4680249195Smm				return (SET_ERROR(ENOSYS));
4681185029Spjd			}
4682185029Spjd			error = zfs_init_sharefs();
4683248571Smm			if (error != 0) {
4684185029Spjd				mutex_exit(&zfs_share_lock);
4685249195Smm				return (SET_ERROR(ENOSYS));
4686185029Spjd			}
4687185029Spjd			zfs_nfsshare_inited = 1;
4688185029Spjd			mutex_exit(&zfs_share_lock);
4689185029Spjd		}
4690185029Spjd		break;
4691185029Spjd	case ZFS_SHARE_SMB:
4692185029Spjd	case ZFS_UNSHARE_SMB:
4693185029Spjd		if (zfs_smbshare_inited == 0) {
4694185029Spjd			mutex_enter(&zfs_share_lock);
4695185029Spjd			if (smbsrv_mod == NULL && ((smbsrv_mod =
4696185029Spjd			    ddi_modopen("drv/smbsrv",
4697185029Spjd			    KRTLD_MODE_FIRST, &error)) == NULL)) {
4698185029Spjd				mutex_exit(&zfs_share_lock);
4699249195Smm				return (SET_ERROR(ENOSYS));
4700185029Spjd			}
4701185029Spjd			if (zsmbexport_fs == NULL && ((zsmbexport_fs =
4702185029Spjd			    (int (*)(void *, boolean_t))ddi_modsym(smbsrv_mod,
4703185029Spjd			    "smb_server_share", &error)) == NULL)) {
4704185029Spjd				mutex_exit(&zfs_share_lock);
4705249195Smm				return (SET_ERROR(ENOSYS));
4706185029Spjd			}
4707185029Spjd			error = zfs_init_sharefs();
4708248571Smm			if (error != 0) {
4709185029Spjd				mutex_exit(&zfs_share_lock);
4710249195Smm				return (SET_ERROR(ENOSYS));
4711185029Spjd			}
4712185029Spjd			zfs_smbshare_inited = 1;
4713185029Spjd			mutex_exit(&zfs_share_lock);
4714185029Spjd		}
4715185029Spjd		break;
4716185029Spjd	default:
4717249195Smm		return (SET_ERROR(EINVAL));
4718185029Spjd	}
4719185029Spjd
4720185029Spjd	switch (zc->zc_share.z_sharetype) {
4721185029Spjd	case ZFS_SHARE_NFS:
4722185029Spjd	case ZFS_UNSHARE_NFS:
4723185029Spjd		if (error =
4724185029Spjd		    znfsexport_fs((void *)
4725185029Spjd		    (uintptr_t)zc->zc_share.z_exportdata))
4726185029Spjd			return (error);
4727185029Spjd		break;
4728185029Spjd	case ZFS_SHARE_SMB:
4729185029Spjd	case ZFS_UNSHARE_SMB:
4730185029Spjd		if (error = zsmbexport_fs((void *)
4731185029Spjd		    (uintptr_t)zc->zc_share.z_exportdata,
4732185029Spjd		    zc->zc_share.z_sharetype == ZFS_SHARE_SMB ?
4733209962Smm		    B_TRUE: B_FALSE)) {
4734185029Spjd			return (error);
4735185029Spjd		}
4736185029Spjd		break;
4737185029Spjd	}
4738185029Spjd
4739185029Spjd	opcode = (zc->zc_share.z_sharetype == ZFS_SHARE_NFS ||
4740185029Spjd	    zc->zc_share.z_sharetype == ZFS_SHARE_SMB) ?
4741185029Spjd	    SHAREFS_ADD : SHAREFS_REMOVE;
4742185029Spjd
4743185029Spjd	/*
4744185029Spjd	 * Add or remove share from sharetab
4745185029Spjd	 */
4746185029Spjd	error = zshare_fs(opcode,
4747185029Spjd	    (void *)(uintptr_t)zc->zc_share.z_sharedata,
4748185029Spjd	    zc->zc_share.z_sharemax);
4749185029Spjd
4750185029Spjd	return (error);
4751219089Spjd
4752219089Spjd#else	/* !sun */
4753185029Spjd	return (ENOSYS);
4754219089Spjd#endif	/* !sun */
4755185029Spjd}
4756185029Spjd
/*
 * Single-entry ACL (ACE_EVERYONE with ACE_ALL_PERMS) that zfs_ioc_smb_acl()
 * attaches to the share resource files it creates for ZFS_SMB_ACL_ADD.
 */
ace_t full_access[] = {
	{(uid_t)-1, ACE_ALL_PERMS, ACE_EVERYONE, 0}
};
4760209962Smm
4761219089Spjd/*
4762219089Spjd * inputs:
4763219089Spjd * zc_name		name of containing filesystem
4764219089Spjd * zc_obj		object # beyond which we want next in-use object #
4765219089Spjd *
4766219089Spjd * outputs:
4767219089Spjd * zc_obj		next in-use object #
4768219089Spjd */
4769219089Spjdstatic int
4770219089Spjdzfs_ioc_next_obj(zfs_cmd_t *zc)
4771219089Spjd{
4772219089Spjd	objset_t *os = NULL;
4773219089Spjd	int error;
4774219089Spjd
4775219089Spjd	error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4776248571Smm	if (error != 0)
4777219089Spjd		return (error);
4778219089Spjd
4779219089Spjd	error = dmu_object_next(os, &zc->zc_obj, B_FALSE,
4780219089Spjd	    os->os_dsl_dataset->ds_phys->ds_prev_snap_txg);
4781219089Spjd
4782219089Spjd	dmu_objset_rele(os, FTAG);
4783219089Spjd	return (error);
4784219089Spjd}
4785219089Spjd
4786219089Spjd/*
4787219089Spjd * inputs:
4788219089Spjd * zc_name		name of filesystem
4789219089Spjd * zc_value		prefix name for snapshot
4790219089Spjd * zc_cleanup_fd	cleanup-on-exit file descriptor for calling process
4791219089Spjd *
4792219089Spjd * outputs:
4793248571Smm * zc_value		short name of new snapshot
4794219089Spjd */
4795219089Spjdstatic int
4796219089Spjdzfs_ioc_tmp_snapshot(zfs_cmd_t *zc)
4797219089Spjd{
4798219089Spjd	char *snap_name;
4799248571Smm	char *hold_name;
4800219089Spjd	int error;
4801248571Smm	minor_t minor;
4802219089Spjd
4803248571Smm	error = zfs_onexit_fd_hold(zc->zc_cleanup_fd, &minor);
4804248571Smm	if (error != 0)
4805248571Smm		return (error);
4806248571Smm
4807219089Spjd	snap_name = kmem_asprintf("%s-%016llx", zc->zc_value,
4808219089Spjd	    (u_longlong_t)ddi_get_lbolt64());
4809248571Smm	hold_name = kmem_asprintf("%%%s", zc->zc_value);
4810219089Spjd
4811248571Smm	error = dsl_dataset_snapshot_tmp(zc->zc_name, snap_name, minor,
4812248571Smm	    hold_name);
4813248571Smm	if (error == 0)
4814248571Smm		(void) strcpy(zc->zc_value, snap_name);
4815219089Spjd	strfree(snap_name);
4816248571Smm	strfree(hold_name);
4817248571Smm	zfs_onexit_fd_rele(zc->zc_cleanup_fd);
4818248571Smm	return (error);
4819219089Spjd}
4820219089Spjd
4821219089Spjd/*
4822219089Spjd * inputs:
4823219089Spjd * zc_name		name of "to" snapshot
4824219089Spjd * zc_value		name of "from" snapshot
4825219089Spjd * zc_cookie		file descriptor to write diff data on
4826219089Spjd *
4827219089Spjd * outputs:
4828219089Spjd * dmu_diff_record_t's to the file descriptor
4829219089Spjd */
4830219089Spjdstatic int
4831219089Spjdzfs_ioc_diff(zfs_cmd_t *zc)
4832219089Spjd{
4833219089Spjd	file_t *fp;
4834219089Spjd	offset_t off;
4835219089Spjd	int error;
4836219089Spjd
4837247602Spjd	fp = getf(zc->zc_cookie, CAP_WRITE);
4838248571Smm	if (fp == NULL)
4839249195Smm		return (SET_ERROR(EBADF));
4840219089Spjd
4841219089Spjd	off = fp->f_offset;
4842219089Spjd
4843248571Smm#ifdef illumos
4844248571Smm	error = dmu_diff(zc->zc_name, zc->zc_value, fp->f_vnode, &off);
4845248571Smm#else
4846248571Smm	error = dmu_diff(zc->zc_name, zc->zc_value, fp, &off);
4847248571Smm#endif
4848219089Spjd
4849219089Spjd	if (off >= 0 && off <= MAXOFFSET_T)
4850219089Spjd		fp->f_offset = off;
4851219089Spjd	releasef(zc->zc_cookie);
4852219089Spjd
4853219089Spjd	return (error);
4854219089Spjd}
4855219089Spjd
4856209962Smm#ifdef sun
4857185029Spjd/*
4858209962Smm * Remove all ACL files in shares dir
4859209962Smm */
4860209962Smmstatic int
4861209962Smmzfs_smb_acl_purge(znode_t *dzp)
4862209962Smm{
4863209962Smm	zap_cursor_t	zc;
4864209962Smm	zap_attribute_t	zap;
4865209962Smm	zfsvfs_t *zfsvfs = dzp->z_zfsvfs;
4866209962Smm	int error;
4867209962Smm
4868209962Smm	for (zap_cursor_init(&zc, zfsvfs->z_os, dzp->z_id);
4869209962Smm	    (error = zap_cursor_retrieve(&zc, &zap)) == 0;
4870209962Smm	    zap_cursor_advance(&zc)) {
4871209962Smm		if ((error = VOP_REMOVE(ZTOV(dzp), zap.za_name, kcred,
4872209962Smm		    NULL, 0)) != 0)
4873209962Smm			break;
4874209962Smm	}
4875209962Smm	zap_cursor_fini(&zc);
4876209962Smm	return (error);
4877209962Smm}
4878209962Smm#endif	/* sun */
4879209962Smm
4880209962Smmstatic int
4881209962Smmzfs_ioc_smb_acl(zfs_cmd_t *zc)
4882209962Smm{
4883209962Smm#ifdef sun
4884209962Smm	vnode_t *vp;
4885209962Smm	znode_t *dzp;
4886209962Smm	vnode_t *resourcevp = NULL;
4887209962Smm	znode_t *sharedir;
4888209962Smm	zfsvfs_t *zfsvfs;
4889209962Smm	nvlist_t *nvlist;
4890209962Smm	char *src, *target;
4891209962Smm	vattr_t vattr;
4892209962Smm	vsecattr_t vsec;
4893209962Smm	int error = 0;
4894209962Smm
4895209962Smm	if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
4896209962Smm	    NO_FOLLOW, NULL, &vp)) != 0)
4897209962Smm		return (error);
4898209962Smm
4899209962Smm	/* Now make sure mntpnt and dataset are ZFS */
4900209962Smm
4901219089Spjd	if (strcmp(vp->v_vfsp->mnt_stat.f_fstypename, "zfs") != 0 ||
4902209962Smm	    (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
4903209962Smm	    zc->zc_name) != 0)) {
4904209962Smm		VN_RELE(vp);
4905249195Smm		return (SET_ERROR(EINVAL));
4906209962Smm	}
4907209962Smm
4908209962Smm	dzp = VTOZ(vp);
4909209962Smm	zfsvfs = dzp->z_zfsvfs;
4910209962Smm	ZFS_ENTER(zfsvfs);
4911209962Smm
4912209962Smm	/*
4913209962Smm	 * Create share dir if its missing.
4914209962Smm	 */
4915209962Smm	mutex_enter(&zfsvfs->z_lock);
4916209962Smm	if (zfsvfs->z_shares_dir == 0) {
4917209962Smm		dmu_tx_t *tx;
4918209962Smm
4919209962Smm		tx = dmu_tx_create(zfsvfs->z_os);
4920209962Smm		dmu_tx_hold_zap(tx, MASTER_NODE_OBJ, TRUE,
4921209962Smm		    ZFS_SHARES_DIR);
4922209962Smm		dmu_tx_hold_zap(tx, DMU_NEW_OBJECT, FALSE, NULL);
4923209962Smm		error = dmu_tx_assign(tx, TXG_WAIT);
4924248571Smm		if (error != 0) {
4925209962Smm			dmu_tx_abort(tx);
4926209962Smm		} else {
4927209962Smm			error = zfs_create_share_dir(zfsvfs, tx);
4928209962Smm			dmu_tx_commit(tx);
4929209962Smm		}
4930248571Smm		if (error != 0) {
4931209962Smm			mutex_exit(&zfsvfs->z_lock);
4932209962Smm			VN_RELE(vp);
4933209962Smm			ZFS_EXIT(zfsvfs);
4934209962Smm			return (error);
4935209962Smm		}
4936209962Smm	}
4937209962Smm	mutex_exit(&zfsvfs->z_lock);
4938209962Smm
4939209962Smm	ASSERT(zfsvfs->z_shares_dir);
4940209962Smm	if ((error = zfs_zget(zfsvfs, zfsvfs->z_shares_dir, &sharedir)) != 0) {
4941209962Smm		VN_RELE(vp);
4942209962Smm		ZFS_EXIT(zfsvfs);
4943209962Smm		return (error);
4944209962Smm	}
4945209962Smm
4946209962Smm	switch (zc->zc_cookie) {
4947209962Smm	case ZFS_SMB_ACL_ADD:
4948209962Smm		vattr.va_mask = AT_MODE|AT_UID|AT_GID|AT_TYPE;
4949209962Smm		vattr.va_type = VREG;
4950209962Smm		vattr.va_mode = S_IFREG|0777;
4951209962Smm		vattr.va_uid = 0;
4952209962Smm		vattr.va_gid = 0;
4953209962Smm
4954209962Smm		vsec.vsa_mask = VSA_ACE;
4955209962Smm		vsec.vsa_aclentp = &full_access;
4956209962Smm		vsec.vsa_aclentsz = sizeof (full_access);
4957209962Smm		vsec.vsa_aclcnt = 1;
4958209962Smm
4959209962Smm		error = VOP_CREATE(ZTOV(sharedir), zc->zc_string,
4960209962Smm		    &vattr, EXCL, 0, &resourcevp, kcred, 0, NULL, &vsec);
4961209962Smm		if (resourcevp)
4962209962Smm			VN_RELE(resourcevp);
4963209962Smm		break;
4964209962Smm
4965209962Smm	case ZFS_SMB_ACL_REMOVE:
4966209962Smm		error = VOP_REMOVE(ZTOV(sharedir), zc->zc_string, kcred,
4967209962Smm		    NULL, 0);
4968209962Smm		break;
4969209962Smm
4970209962Smm	case ZFS_SMB_ACL_RENAME:
4971209962Smm		if ((error = get_nvlist(zc->zc_nvlist_src,
4972219089Spjd		    zc->zc_nvlist_src_size, zc->zc_iflags, &nvlist)) != 0) {
4973209962Smm			VN_RELE(vp);
4974209962Smm			ZFS_EXIT(zfsvfs);
4975209962Smm			return (error);
4976209962Smm		}
4977209962Smm		if (nvlist_lookup_string(nvlist, ZFS_SMB_ACL_SRC, &src) ||
4978209962Smm		    nvlist_lookup_string(nvlist, ZFS_SMB_ACL_TARGET,
4979209962Smm		    &target)) {
4980209962Smm			VN_RELE(vp);
4981209962Smm			VN_RELE(ZTOV(sharedir));
4982209962Smm			ZFS_EXIT(zfsvfs);
4983219089Spjd			nvlist_free(nvlist);
4984209962Smm			return (error);
4985209962Smm		}
4986209962Smm		error = VOP_RENAME(ZTOV(sharedir), src, ZTOV(sharedir), target,
4987209962Smm		    kcred, NULL, 0);
4988209962Smm		nvlist_free(nvlist);
4989209962Smm		break;
4990209962Smm
4991209962Smm	case ZFS_SMB_ACL_PURGE:
4992209962Smm		error = zfs_smb_acl_purge(sharedir);
4993209962Smm		break;
4994209962Smm
4995209962Smm	default:
4996249195Smm		error = SET_ERROR(EINVAL);
4997209962Smm		break;
4998209962Smm	}
4999209962Smm
5000209962Smm	VN_RELE(vp);
5001209962Smm	VN_RELE(ZTOV(sharedir));
5002209962Smm
5003209962Smm	ZFS_EXIT(zfsvfs);
5004209962Smm
5005209962Smm	return (error);
5006209962Smm#else	/* !sun */
5007209962Smm	return (EOPNOTSUPP);
5008209962Smm#endif	/* !sun */
5009209962Smm}
5010209962Smm
5011209962Smm/*
5012248571Smm * innvl: {
5013248571Smm *     "holds" -> { snapname -> holdname (string), ... }
5014248571Smm *     (optional) "cleanup_fd" -> fd (int32)
5015248571Smm * }
5016219089Spjd *
5017248571Smm * outnvl: {
5018248571Smm *     snapname -> error value (int32)
5019248571Smm *     ...
5020248571Smm * }
5021219089Spjd */
5022248571Smm/* ARGSUSED */
5023219089Spjdstatic int
5024248571Smmzfs_ioc_hold(const char *pool, nvlist_t *args, nvlist_t *errlist)
5025219089Spjd{
5026248571Smm	nvlist_t *holds;
5027248571Smm	int cleanup_fd = -1;
5028219089Spjd	int error;
5029219089Spjd	minor_t minor = 0;
5030219089Spjd
5031248571Smm	error = nvlist_lookup_nvlist(args, "holds", &holds);
5032248571Smm	if (error != 0)
5033249195Smm		return (SET_ERROR(EINVAL));
5034219089Spjd
5035248571Smm	if (nvlist_lookup_int32(args, "cleanup_fd", &cleanup_fd) == 0) {
5036248571Smm		error = zfs_onexit_fd_hold(cleanup_fd, &minor);
5037248571Smm		if (error != 0)
5038219089Spjd			return (error);
5039219089Spjd	}
5040219089Spjd
5041248571Smm	error = dsl_dataset_user_hold(holds, minor, errlist);
5042248571Smm	if (minor != 0)
5043248571Smm		zfs_onexit_fd_rele(cleanup_fd);
5044219089Spjd	return (error);
5045219089Spjd}
5046219089Spjd
5047219089Spjd/*
5048248571Smm * innvl is not used.
5049219089Spjd *
5050248571Smm * outnvl: {
5051248571Smm *    holdname -> time added (uint64 seconds since epoch)
5052248571Smm *    ...
5053248571Smm * }
5054219089Spjd */
5055248571Smm/* ARGSUSED */
5056219089Spjdstatic int
5057248571Smmzfs_ioc_get_holds(const char *snapname, nvlist_t *args, nvlist_t *outnvl)
5058219089Spjd{
5059248571Smm	return (dsl_dataset_get_holds(snapname, outnvl));
5060219089Spjd}
5061219089Spjd
5062219089Spjd/*
5063248571Smm * innvl: {
5064248571Smm *     snapname -> { holdname, ... }
5065248571Smm *     ...
5066248571Smm * }
5067219089Spjd *
5068248571Smm * outnvl: {
5069248571Smm *     snapname -> error value (int32)
5070248571Smm *     ...
5071248571Smm * }
5072219089Spjd */
5073248571Smm/* ARGSUSED */
5074219089Spjdstatic int
5075248571Smmzfs_ioc_release(const char *pool, nvlist_t *holds, nvlist_t *errlist)
5076219089Spjd{
5077248571Smm	nvpair_t *pair;
5078219089Spjd
5079248571Smm	/*
5080248571Smm	 * The release may cause the snapshot to be destroyed; make sure it
5081248571Smm	 * is not mounted.
5082248571Smm	 */
5083248571Smm	for (pair = nvlist_next_nvpair(holds, NULL); pair != NULL;
5084248571Smm	    pair = nvlist_next_nvpair(holds, pair))
5085248571Smm		zfs_unmount_snap(nvpair_name(pair));
5086219089Spjd
5087248571Smm	return (dsl_dataset_user_release(holds, errlist));
5088219089Spjd}
5089219089Spjd
5090219089Spjd/*
5091228103Smm * inputs:
5092228103Smm * zc_name		name of new filesystem or snapshot
5093228103Smm * zc_value		full name of old snapshot
5094228103Smm *
5095228103Smm * outputs:
5096228103Smm * zc_cookie		space in bytes
5097228103Smm * zc_objset_type	compressed space in bytes
5098228103Smm * zc_perm_action	uncompressed space in bytes
5099228103Smm */
5100228103Smmstatic int
5101228103Smmzfs_ioc_space_written(zfs_cmd_t *zc)
5102228103Smm{
5103228103Smm	int error;
5104248571Smm	dsl_pool_t *dp;
5105228103Smm	dsl_dataset_t *new, *old;
5106228103Smm
5107248571Smm	error = dsl_pool_hold(zc->zc_name, FTAG, &dp);
5108228103Smm	if (error != 0)
5109228103Smm		return (error);
5110248571Smm	error = dsl_dataset_hold(dp, zc->zc_name, FTAG, &new);
5111228103Smm	if (error != 0) {
5112248571Smm		dsl_pool_rele(dp, FTAG);
5113248571Smm		return (error);
5114248571Smm	}
5115248571Smm	error = dsl_dataset_hold(dp, zc->zc_value, FTAG, &old);
5116248571Smm	if (error != 0) {
5117228103Smm		dsl_dataset_rele(new, FTAG);
5118248571Smm		dsl_pool_rele(dp, FTAG);
5119228103Smm		return (error);
5120228103Smm	}
5121228103Smm
5122228103Smm	error = dsl_dataset_space_written(old, new, &zc->zc_cookie,
5123228103Smm	    &zc->zc_objset_type, &zc->zc_perm_action);
5124228103Smm	dsl_dataset_rele(old, FTAG);
5125228103Smm	dsl_dataset_rele(new, FTAG);
5126248571Smm	dsl_pool_rele(dp, FTAG);
5127228103Smm	return (error);
5128228103Smm}
5129228103Smm
5130228103Smm/*
5131248571Smm * innvl: {
5132248571Smm *     "firstsnap" -> snapshot name
5133248571Smm * }
5134228103Smm *
5135248571Smm * outnvl: {
5136248571Smm *     "used" -> space in bytes
5137248571Smm *     "compressed" -> compressed space in bytes
5138248571Smm *     "uncompressed" -> uncompressed space in bytes
5139248571Smm * }
5140228103Smm */
5141228103Smmstatic int
5142248571Smmzfs_ioc_space_snaps(const char *lastsnap, nvlist_t *innvl, nvlist_t *outnvl)
5143228103Smm{
5144228103Smm	int error;
5145248571Smm	dsl_pool_t *dp;
5146228103Smm	dsl_dataset_t *new, *old;
5147248571Smm	char *firstsnap;
5148248571Smm	uint64_t used, comp, uncomp;
5149228103Smm
5150248571Smm	if (nvlist_lookup_string(innvl, "firstsnap", &firstsnap) != 0)
5151249195Smm		return (SET_ERROR(EINVAL));
5152248571Smm
5153248571Smm	error = dsl_pool_hold(lastsnap, FTAG, &dp);
5154228103Smm	if (error != 0)
5155228103Smm		return (error);
5156248571Smm
5157248571Smm	error = dsl_dataset_hold(dp, lastsnap, FTAG, &new);
5158228103Smm	if (error != 0) {
5159248571Smm		dsl_pool_rele(dp, FTAG);
5160248571Smm		return (error);
5161248571Smm	}
5162248571Smm	error = dsl_dataset_hold(dp, firstsnap, FTAG, &old);
5163248571Smm	if (error != 0) {
5164228103Smm		dsl_dataset_rele(new, FTAG);
5165248571Smm		dsl_pool_rele(dp, FTAG);
5166228103Smm		return (error);
5167228103Smm	}
5168228103Smm
5169248571Smm	error = dsl_dataset_space_wouldfree(old, new, &used, &comp, &uncomp);
5170228103Smm	dsl_dataset_rele(old, FTAG);
5171228103Smm	dsl_dataset_rele(new, FTAG);
5172248571Smm	dsl_pool_rele(dp, FTAG);
5173248571Smm	fnvlist_add_uint64(outnvl, "used", used);
5174248571Smm	fnvlist_add_uint64(outnvl, "compressed", comp);
5175248571Smm	fnvlist_add_uint64(outnvl, "uncompressed", uncomp);
5176228103Smm	return (error);
5177228103Smm}
5178228103Smm
5179185029Spjdstatic int
5180168404Spjdzfs_ioc_jail(zfs_cmd_t *zc)
5181168404Spjd{
5182168404Spjd
5183185029Spjd	return (zone_dataset_attach(curthread->td_ucred, zc->zc_name,
5184185029Spjd	    (int)zc->zc_jailid));
5185168404Spjd}
5186168404Spjd
5187168404Spjdstatic int
5188168404Spjdzfs_ioc_unjail(zfs_cmd_t *zc)
5189168404Spjd{
5190168404Spjd
5191185029Spjd	return (zone_dataset_detach(curthread->td_ucred, zc->zc_name,
5192185029Spjd	    (int)zc->zc_jailid));
5193168404Spjd}
5194168404Spjd
5195248571Smm/*
5196248571Smm * innvl: {
5197248571Smm *     "fd" -> file descriptor to write stream to (int32)
5198248571Smm *     (optional) "fromsnap" -> full snap name to send an incremental from
5199248571Smm * }
5200248571Smm *
5201248571Smm * outnvl is unused
5202248571Smm */
5203248571Smm/* ARGSUSED */
5204248571Smmstatic int
5205248571Smmzfs_ioc_send_new(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
5206248571Smm{
5207248571Smm	int error;
5208248571Smm	offset_t off;
5209248571Smm	char *fromname = NULL;
5210248571Smm	int fd;
5211168404Spjd
5212248571Smm	error = nvlist_lookup_int32(innvl, "fd", &fd);
5213248571Smm	if (error != 0)
5214249195Smm		return (SET_ERROR(EINVAL));
5215248571Smm
5216248571Smm	(void) nvlist_lookup_string(innvl, "fromsnap", &fromname);
5217248571Smm
5218248571Smm	file_t *fp = getf(fd, CAP_READ);
5219248571Smm	if (fp == NULL)
5220249195Smm		return (SET_ERROR(EBADF));
5221248571Smm
5222248571Smm	off = fp->f_offset;
5223248571Smm#ifdef illumos
5224248571Smm	error = dmu_send(snapname, fromname, fd, fp->f_vnode, &off);
5225248571Smm#else
5226248571Smm	error = dmu_send(snapname, fromname, fd, fp, &off);
5227248571Smm#endif
5228248571Smm
5229248571Smm#ifdef illumos
5230248571Smm	if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
5231248571Smm		fp->f_offset = off;
5232248571Smm#else
5233248571Smm	fp->f_offset = off;
5234248571Smm#endif
5235248571Smm
5236248571Smm	releasef(fd);
5237248571Smm	return (error);
5238248571Smm}
5239248571Smm
5240248571Smm/*
5241248571Smm * Determine approximately how large a zfs send stream will be -- the number
5242248571Smm * of bytes that will be written to the fd supplied to zfs_ioc_send_new().
5243248571Smm *
5244248571Smm * innvl: {
5245248571Smm *     (optional) "fromsnap" -> full snap name to send an incremental from
5246248571Smm * }
5247248571Smm *
5248248571Smm * outnvl: {
5249248571Smm *     "space" -> bytes of space (uint64)
5250248571Smm * }
5251248571Smm */
5252248571Smmstatic int
5253248571Smmzfs_ioc_send_space(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
5254248571Smm{
5255248571Smm	dsl_pool_t *dp;
5256248571Smm	dsl_dataset_t *fromsnap = NULL;
5257248571Smm	dsl_dataset_t *tosnap;
5258248571Smm	int error;
5259248571Smm	char *fromname;
5260248571Smm	uint64_t space;
5261248571Smm
5262248571Smm	error = dsl_pool_hold(snapname, FTAG, &dp);
5263248571Smm	if (error != 0)
5264248571Smm		return (error);
5265248571Smm
5266248571Smm	error = dsl_dataset_hold(dp, snapname, FTAG, &tosnap);
5267248571Smm	if (error != 0) {
5268248571Smm		dsl_pool_rele(dp, FTAG);
5269248571Smm		return (error);
5270248571Smm	}
5271248571Smm
5272248571Smm	error = nvlist_lookup_string(innvl, "fromsnap", &fromname);
5273248571Smm	if (error == 0) {
5274248571Smm		error = dsl_dataset_hold(dp, fromname, FTAG, &fromsnap);
5275248571Smm		if (error != 0) {
5276248571Smm			dsl_dataset_rele(tosnap, FTAG);
5277248571Smm			dsl_pool_rele(dp, FTAG);
5278248571Smm			return (error);
5279248571Smm		}
5280248571Smm	}
5281248571Smm
5282248571Smm	error = dmu_send_estimate(tosnap, fromsnap, &space);
5283248571Smm	fnvlist_add_uint64(outnvl, "space", space);
5284248571Smm
5285248571Smm	if (fromsnap != NULL)
5286248571Smm		dsl_dataset_rele(fromsnap, FTAG);
5287248571Smm	dsl_dataset_rele(tosnap, FTAG);
5288248571Smm	dsl_pool_rele(dp, FTAG);
5289248571Smm	return (error);
5290248571Smm}
5291248571Smm
5292248571Smm
/*
 * Table of registered ioctl handlers.  The registration helpers in this
 * file index it with (ioc - ZFS_IOC_FIRST).
 */
static zfs_ioc_vec_t zfs_ioc_vec[ZFS_IOC_LAST - ZFS_IOC_FIRST];
5294248571Smm
5295248571Smmstatic void
5296248571Smmzfs_ioctl_register_legacy(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5297248571Smm    zfs_secpolicy_func_t *secpolicy, zfs_ioc_namecheck_t namecheck,
5298248571Smm    boolean_t log_history, zfs_ioc_poolcheck_t pool_check)
5299248571Smm{
5300248571Smm	zfs_ioc_vec_t *vec = &zfs_ioc_vec[ioc - ZFS_IOC_FIRST];
5301248571Smm
5302248571Smm	ASSERT3U(ioc, >=, ZFS_IOC_FIRST);
5303248571Smm	ASSERT3U(ioc, <, ZFS_IOC_LAST);
5304248571Smm	ASSERT3P(vec->zvec_legacy_func, ==, NULL);
5305248571Smm	ASSERT3P(vec->zvec_func, ==, NULL);
5306248571Smm
5307248571Smm	vec->zvec_legacy_func = func;
5308248571Smm	vec->zvec_secpolicy = secpolicy;
5309248571Smm	vec->zvec_namecheck = namecheck;
5310248571Smm	vec->zvec_allow_log = log_history;
5311248571Smm	vec->zvec_pool_check = pool_check;
5312248571Smm}
5313248571Smm
5314248571Smm/*
5315248571Smm * See the block comment at the beginning of this file for details on
5316248571Smm * each argument to this function.
5317248571Smm */
5318248571Smmstatic void
5319248571Smmzfs_ioctl_register(const char *name, zfs_ioc_t ioc, zfs_ioc_func_t *func,
5320248571Smm    zfs_secpolicy_func_t *secpolicy, zfs_ioc_namecheck_t namecheck,
5321248571Smm    zfs_ioc_poolcheck_t pool_check, boolean_t smush_outnvlist,
5322248571Smm    boolean_t allow_log)
5323248571Smm{
5324248571Smm	zfs_ioc_vec_t *vec = &zfs_ioc_vec[ioc - ZFS_IOC_FIRST];
5325248571Smm
5326248571Smm	ASSERT3U(ioc, >=, ZFS_IOC_FIRST);
5327248571Smm	ASSERT3U(ioc, <, ZFS_IOC_LAST);
5328248571Smm	ASSERT3P(vec->zvec_legacy_func, ==, NULL);
5329248571Smm	ASSERT3P(vec->zvec_func, ==, NULL);
5330248571Smm
5331248571Smm	/* if we are logging, the name must be valid */
5332248571Smm	ASSERT(!allow_log || namecheck != NO_NAME);
5333248571Smm
5334248571Smm	vec->zvec_name = name;
5335248571Smm	vec->zvec_func = func;
5336248571Smm	vec->zvec_secpolicy = secpolicy;
5337248571Smm	vec->zvec_namecheck = namecheck;
5338248571Smm	vec->zvec_pool_check = pool_check;
5339248571Smm	vec->zvec_smush_outnvlist = smush_outnvlist;
5340248571Smm	vec->zvec_allow_log = allow_log;
5341248571Smm}
5342248571Smm
5343248571Smmstatic void
5344248571Smmzfs_ioctl_register_pool(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5345248571Smm    zfs_secpolicy_func_t *secpolicy, boolean_t log_history,
5346248571Smm    zfs_ioc_poolcheck_t pool_check)
5347248571Smm{
5348248571Smm	zfs_ioctl_register_legacy(ioc, func, secpolicy,
5349248571Smm	    POOL_NAME, log_history, pool_check);
5350248571Smm}
5351248571Smm
5352248571Smmstatic void
5353248571Smmzfs_ioctl_register_dataset_nolog(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5354248571Smm    zfs_secpolicy_func_t *secpolicy, zfs_ioc_poolcheck_t pool_check)
5355248571Smm{
5356248571Smm	zfs_ioctl_register_legacy(ioc, func, secpolicy,
5357248571Smm	    DATASET_NAME, B_FALSE, pool_check);
5358248571Smm}
5359248571Smm
5360248571Smmstatic void
5361248571Smmzfs_ioctl_register_pool_modify(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func)
5362248571Smm{
5363248571Smm	zfs_ioctl_register_legacy(ioc, func, zfs_secpolicy_config,
5364248571Smm	    POOL_NAME, B_TRUE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5365248571Smm}
5366248571Smm
5367248571Smmstatic void
5368248571Smmzfs_ioctl_register_pool_meta(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5369248571Smm    zfs_secpolicy_func_t *secpolicy)
5370248571Smm{
5371248571Smm	zfs_ioctl_register_legacy(ioc, func, secpolicy,
5372248571Smm	    NO_NAME, B_FALSE, POOL_CHECK_NONE);
5373248571Smm}
5374248571Smm
5375248571Smmstatic void
5376248571Smmzfs_ioctl_register_dataset_read_secpolicy(zfs_ioc_t ioc,
5377248571Smm    zfs_ioc_legacy_func_t *func, zfs_secpolicy_func_t *secpolicy)
5378248571Smm{
5379248571Smm	zfs_ioctl_register_legacy(ioc, func, secpolicy,
5380248571Smm	    DATASET_NAME, B_FALSE, POOL_CHECK_SUSPENDED);
5381248571Smm}
5382248571Smm
5383248571Smmstatic void
5384248571Smmzfs_ioctl_register_dataset_read(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func)
5385248571Smm{
5386248571Smm	zfs_ioctl_register_dataset_read_secpolicy(ioc, func,
5387248571Smm	    zfs_secpolicy_read);
5388248571Smm}
5389248571Smm
5390248571Smmstatic void
5391248571Smmzfs_ioctl_register_dataset_modify(zfs_ioc_t ioc, zfs_ioc_legacy_func_t *func,
5392248571Smm	zfs_secpolicy_func_t *secpolicy)
5393248571Smm{
5394248571Smm	zfs_ioctl_register_legacy(ioc, func, secpolicy,
5395248571Smm	    DATASET_NAME, B_TRUE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5396248571Smm}
5397248571Smm
5398248571Smmstatic void
5399248571Smmzfs_ioctl_init(void)
5400248571Smm{
5401248571Smm	zfs_ioctl_register("snapshot", ZFS_IOC_SNAPSHOT,
5402248571Smm	    zfs_ioc_snapshot, zfs_secpolicy_snapshot, POOL_NAME,
5403248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5404248571Smm
5405248571Smm	zfs_ioctl_register("log_history", ZFS_IOC_LOG_HISTORY,
5406248571Smm	    zfs_ioc_log_history, zfs_secpolicy_log_history, NO_NAME,
5407248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_FALSE, B_FALSE);
5408248571Smm
5409248571Smm	zfs_ioctl_register("space_snaps", ZFS_IOC_SPACE_SNAPS,
5410248571Smm	    zfs_ioc_space_snaps, zfs_secpolicy_read, DATASET_NAME,
5411248571Smm	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5412248571Smm
5413248571Smm	zfs_ioctl_register("send", ZFS_IOC_SEND_NEW,
5414248571Smm	    zfs_ioc_send_new, zfs_secpolicy_send_new, DATASET_NAME,
5415248571Smm	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5416248571Smm
5417248571Smm	zfs_ioctl_register("send_space", ZFS_IOC_SEND_SPACE,
5418248571Smm	    zfs_ioc_send_space, zfs_secpolicy_read, DATASET_NAME,
5419248571Smm	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5420248571Smm
5421248571Smm	zfs_ioctl_register("create", ZFS_IOC_CREATE,
5422248571Smm	    zfs_ioc_create, zfs_secpolicy_create_clone, DATASET_NAME,
5423248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5424248571Smm
5425248571Smm	zfs_ioctl_register("clone", ZFS_IOC_CLONE,
5426248571Smm	    zfs_ioc_clone, zfs_secpolicy_create_clone, DATASET_NAME,
5427248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5428248571Smm
5429248571Smm	zfs_ioctl_register("destroy_snaps", ZFS_IOC_DESTROY_SNAPS,
5430248571Smm	    zfs_ioc_destroy_snaps, zfs_secpolicy_destroy_snaps, POOL_NAME,
5431248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5432248571Smm
5433248571Smm	zfs_ioctl_register("hold", ZFS_IOC_HOLD,
5434248571Smm	    zfs_ioc_hold, zfs_secpolicy_hold, POOL_NAME,
5435248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5436248571Smm	zfs_ioctl_register("release", ZFS_IOC_RELEASE,
5437248571Smm	    zfs_ioc_release, zfs_secpolicy_release, POOL_NAME,
5438248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY, B_TRUE, B_TRUE);
5439248571Smm
5440248571Smm	zfs_ioctl_register("get_holds", ZFS_IOC_GET_HOLDS,
5441248571Smm	    zfs_ioc_get_holds, zfs_secpolicy_read, DATASET_NAME,
5442248571Smm	    POOL_CHECK_SUSPENDED, B_FALSE, B_FALSE);
5443248571Smm
5444248571Smm	/* IOCTLS that use the legacy function signature */
5445248571Smm
5446248571Smm	zfs_ioctl_register_legacy(ZFS_IOC_POOL_FREEZE, zfs_ioc_pool_freeze,
5447248571Smm	    zfs_secpolicy_config, NO_NAME, B_FALSE, POOL_CHECK_READONLY);
5448248571Smm
5449248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_CREATE, zfs_ioc_pool_create,
5450248571Smm	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);
5451248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_SCAN,
5452248571Smm	    zfs_ioc_pool_scan);
5453248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_UPGRADE,
5454248571Smm	    zfs_ioc_pool_upgrade);
5455248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_ADD,
5456248571Smm	    zfs_ioc_vdev_add);
5457248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_REMOVE,
5458248571Smm	    zfs_ioc_vdev_remove);
5459248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SET_STATE,
5460248571Smm	    zfs_ioc_vdev_set_state);
5461248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_ATTACH,
5462248571Smm	    zfs_ioc_vdev_attach);
5463248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_DETACH,
5464248571Smm	    zfs_ioc_vdev_detach);
5465248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SETPATH,
5466248571Smm	    zfs_ioc_vdev_setpath);
5467248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SETFRU,
5468248571Smm	    zfs_ioc_vdev_setfru);
5469248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_SET_PROPS,
5470248571Smm	    zfs_ioc_pool_set_props);
5471248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_VDEV_SPLIT,
5472248571Smm	    zfs_ioc_vdev_split);
5473248571Smm	zfs_ioctl_register_pool_modify(ZFS_IOC_POOL_REGUID,
5474248571Smm	    zfs_ioc_pool_reguid);
5475248571Smm
5476248571Smm	zfs_ioctl_register_pool_meta(ZFS_IOC_POOL_CONFIGS,
5477248571Smm	    zfs_ioc_pool_configs, zfs_secpolicy_none);
5478248571Smm	zfs_ioctl_register_pool_meta(ZFS_IOC_POOL_TRYIMPORT,
5479248571Smm	    zfs_ioc_pool_tryimport, zfs_secpolicy_config);
5480248571Smm	zfs_ioctl_register_pool_meta(ZFS_IOC_INJECT_FAULT,
5481248571Smm	    zfs_ioc_inject_fault, zfs_secpolicy_inject);
5482248571Smm	zfs_ioctl_register_pool_meta(ZFS_IOC_CLEAR_FAULT,
5483248571Smm	    zfs_ioc_clear_fault, zfs_secpolicy_inject);
5484248571Smm	zfs_ioctl_register_pool_meta(ZFS_IOC_INJECT_LIST_NEXT,
5485248571Smm	    zfs_ioc_inject_list_next, zfs_secpolicy_inject);
5486248571Smm
5487248571Smm	/*
5488248571Smm	 * pool destroy, and export don't log the history as part of
5489248571Smm	 * zfsdev_ioctl, but rather zfs_ioc_pool_export
5490248571Smm	 * does the logging of those commands.
5491248571Smm	 */
5492248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_DESTROY, zfs_ioc_pool_destroy,
5493248571Smm	    zfs_secpolicy_config, B_FALSE, POOL_CHECK_NONE);
5494248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_EXPORT, zfs_ioc_pool_export,
5495248571Smm	    zfs_secpolicy_config, B_FALSE, POOL_CHECK_NONE);
5496248571Smm
5497248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_STATS, zfs_ioc_pool_stats,
5498248571Smm	    zfs_secpolicy_read, B_FALSE, POOL_CHECK_NONE);
5499248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_GET_PROPS, zfs_ioc_pool_get_props,
5500248571Smm	    zfs_secpolicy_read, B_FALSE, POOL_CHECK_NONE);
5501248571Smm
5502248571Smm	zfs_ioctl_register_pool(ZFS_IOC_ERROR_LOG, zfs_ioc_error_log,
5503248571Smm	    zfs_secpolicy_inject, B_FALSE, POOL_CHECK_SUSPENDED);
5504248571Smm	zfs_ioctl_register_pool(ZFS_IOC_DSOBJ_TO_DSNAME,
5505248571Smm	    zfs_ioc_dsobj_to_dsname,
5506248571Smm	    zfs_secpolicy_diff, B_FALSE, POOL_CHECK_SUSPENDED);
5507248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_GET_HISTORY,
5508248571Smm	    zfs_ioc_pool_get_history,
5509248571Smm	    zfs_secpolicy_config, B_FALSE, POOL_CHECK_SUSPENDED);
5510248571Smm
5511248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_IMPORT, zfs_ioc_pool_import,
5512248571Smm	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_NONE);
5513248571Smm
5514248571Smm	zfs_ioctl_register_pool(ZFS_IOC_CLEAR, zfs_ioc_clear,
5515248571Smm	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_SUSPENDED);
5516248571Smm	zfs_ioctl_register_pool(ZFS_IOC_POOL_REOPEN, zfs_ioc_pool_reopen,
5517248571Smm	    zfs_secpolicy_config, B_TRUE, POOL_CHECK_SUSPENDED);
5518248571Smm
5519248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_SPACE_WRITTEN,
5520248571Smm	    zfs_ioc_space_written);
5521248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_RECVD_PROPS,
5522248571Smm	    zfs_ioc_objset_recvd_props);
5523248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_NEXT_OBJ,
5524248571Smm	    zfs_ioc_next_obj);
5525248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_GET_FSACL,
5526248571Smm	    zfs_ioc_get_fsacl);
5527248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_STATS,
5528248571Smm	    zfs_ioc_objset_stats);
5529248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_OBJSET_ZPLPROPS,
5530248571Smm	    zfs_ioc_objset_zplprops);
5531248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_DATASET_LIST_NEXT,
5532248571Smm	    zfs_ioc_dataset_list_next);
5533248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_SNAPSHOT_LIST_NEXT,
5534248571Smm	    zfs_ioc_snapshot_list_next);
5535248571Smm	zfs_ioctl_register_dataset_read(ZFS_IOC_SEND_PROGRESS,
5536248571Smm	    zfs_ioc_send_progress);
5537248571Smm
5538248571Smm	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_DIFF,
5539248571Smm	    zfs_ioc_diff, zfs_secpolicy_diff);
5540248571Smm	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_OBJ_TO_STATS,
5541248571Smm	    zfs_ioc_obj_to_stats, zfs_secpolicy_diff);
5542248571Smm	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_OBJ_TO_PATH,
5543248571Smm	    zfs_ioc_obj_to_path, zfs_secpolicy_diff);
5544248571Smm	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_USERSPACE_ONE,
5545248571Smm	    zfs_ioc_userspace_one, zfs_secpolicy_userspace_one);
5546248571Smm	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_USERSPACE_MANY,
5547248571Smm	    zfs_ioc_userspace_many, zfs_secpolicy_userspace_many);
5548248571Smm	zfs_ioctl_register_dataset_read_secpolicy(ZFS_IOC_SEND,
5549248571Smm	    zfs_ioc_send, zfs_secpolicy_send);
5550248571Smm
5551248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_SET_PROP, zfs_ioc_set_prop,
5552248571Smm	    zfs_secpolicy_none);
5553248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_DESTROY, zfs_ioc_destroy,
5554248571Smm	    zfs_secpolicy_destroy);
5555248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_ROLLBACK, zfs_ioc_rollback,
5556248571Smm	    zfs_secpolicy_rollback);
5557248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_RENAME, zfs_ioc_rename,
5558248571Smm	    zfs_secpolicy_rename);
5559248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_RECV, zfs_ioc_recv,
5560248571Smm	    zfs_secpolicy_recv);
5561248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_PROMOTE, zfs_ioc_promote,
5562248571Smm	    zfs_secpolicy_promote);
5563248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_INHERIT_PROP,
5564248571Smm	    zfs_ioc_inherit_prop, zfs_secpolicy_inherit_prop);
5565248571Smm	zfs_ioctl_register_dataset_modify(ZFS_IOC_SET_FSACL, zfs_ioc_set_fsacl,
5566248571Smm	    zfs_secpolicy_set_fsacl);
5567248571Smm
5568248571Smm	zfs_ioctl_register_dataset_nolog(ZFS_IOC_SHARE, zfs_ioc_share,
5569248571Smm	    zfs_secpolicy_share, POOL_CHECK_NONE);
5570248571Smm	zfs_ioctl_register_dataset_nolog(ZFS_IOC_SMB_ACL, zfs_ioc_smb_acl,
5571248571Smm	    zfs_secpolicy_smb_acl, POOL_CHECK_NONE);
5572248571Smm	zfs_ioctl_register_dataset_nolog(ZFS_IOC_USERSPACE_UPGRADE,
5573248571Smm	    zfs_ioc_userspace_upgrade, zfs_secpolicy_userspace_upgrade,
5574248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5575248571Smm	zfs_ioctl_register_dataset_nolog(ZFS_IOC_TMP_SNAPSHOT,
5576248571Smm	    zfs_ioc_tmp_snapshot, zfs_secpolicy_tmp_snapshot,
5577248571Smm	    POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY);
5578248571Smm}
5579248571Smm
5580209962Smmint
5581246688Smmpool_status_check(const char *name, zfs_ioc_namecheck_t type,
5582246688Smm    zfs_ioc_poolcheck_t check)
5583209962Smm{
5584209962Smm	spa_t *spa;
5585209962Smm	int error;
5586209962Smm
5587209962Smm	ASSERT(type == POOL_NAME || type == DATASET_NAME);
5588209962Smm
5589246688Smm	if (check & POOL_CHECK_NONE)
5590246688Smm		return (0);
5591246688Smm
5592209962Smm	error = spa_open(name, &spa, FTAG);
5593209962Smm	if (error == 0) {
5594246688Smm		if ((check & POOL_CHECK_SUSPENDED) && spa_suspended(spa))
5595249195Smm			error = SET_ERROR(EAGAIN);
5596246688Smm		else if ((check & POOL_CHECK_READONLY) && !spa_writeable(spa))
5597249195Smm			error = SET_ERROR(EROFS);
5598209962Smm		spa_close(spa, FTAG);
5599209962Smm	}
5600209962Smm	return (error);
5601209962Smm}
5602209962Smm
5603219089Spjd/*
5604219089Spjd * Find a free minor number.
5605219089Spjd */
5606219089Spjdminor_t
5607219089Spjdzfsdev_minor_alloc(void)
5608219089Spjd{
5609219089Spjd	static minor_t last_minor;
5610219089Spjd	minor_t m;
5611219089Spjd
5612224791Spjd	ASSERT(MUTEX_HELD(&spa_namespace_lock));
5613219089Spjd
5614219089Spjd	for (m = last_minor + 1; m != last_minor; m++) {
5615219089Spjd		if (m > ZFSDEV_MAX_MINOR)
5616219089Spjd			m = 1;
5617219089Spjd		if (ddi_get_soft_state(zfsdev_state, m) == NULL) {
5618219089Spjd			last_minor = m;
5619219089Spjd			return (m);
5620219089Spjd		}
5621219089Spjd	}
5622219089Spjd
5623219089Spjd	return (0);
5624219089Spjd}
5625219089Spjd
5626168404Spjdstatic int
5627219089Spjdzfs_ctldev_init(struct cdev *devp)
5628219089Spjd{
5629219089Spjd	minor_t minor;
5630219089Spjd	zfs_soft_state_t *zs;
5631219089Spjd
5632224791Spjd	ASSERT(MUTEX_HELD(&spa_namespace_lock));
5633219089Spjd
5634219089Spjd	minor = zfsdev_minor_alloc();
5635219089Spjd	if (minor == 0)
5636249195Smm		return (SET_ERROR(ENXIO));
5637219089Spjd
5638219089Spjd	if (ddi_soft_state_zalloc(zfsdev_state, minor) != DDI_SUCCESS)
5639249195Smm		return (SET_ERROR(EAGAIN));
5640219089Spjd
5641219089Spjd	devfs_set_cdevpriv((void *)(uintptr_t)minor, zfsdev_close);
5642219089Spjd
5643219089Spjd	zs = ddi_get_soft_state(zfsdev_state, minor);
5644219089Spjd	zs->zss_type = ZSST_CTLDEV;
5645219089Spjd	zfs_onexit_init((zfs_onexit_t **)&zs->zss_data);
5646219089Spjd
5647219089Spjd	return (0);
5648219089Spjd}
5649219089Spjd
5650219089Spjdstatic void
5651219089Spjdzfs_ctldev_destroy(zfs_onexit_t *zo, minor_t minor)
5652219089Spjd{
5653224791Spjd	ASSERT(MUTEX_HELD(&spa_namespace_lock));
5654219089Spjd
5655219089Spjd	zfs_onexit_destroy(zo);
5656219089Spjd	ddi_soft_state_free(zfsdev_state, minor);
5657219089Spjd}
5658219089Spjd
5659219089Spjdvoid *
5660219089Spjdzfsdev_get_soft_state(minor_t minor, enum zfs_soft_state_type which)
5661219089Spjd{
5662219089Spjd	zfs_soft_state_t *zp;
5663219089Spjd
5664219089Spjd	zp = ddi_get_soft_state(zfsdev_state, minor);
5665219089Spjd	if (zp == NULL || zp->zss_type != which)
5666219089Spjd		return (NULL);
5667219089Spjd
5668219089Spjd	return (zp->zss_data);
5669219089Spjd}
5670219089Spjd
5671219089Spjdstatic int
5672219089Spjdzfsdev_open(struct cdev *devp, int flag, int mode, struct thread *td)
5673219089Spjd{
5674219089Spjd	int error = 0;
5675219089Spjd
5676219089Spjd#ifdef sun
5677219089Spjd	if (getminor(*devp) != 0)
5678219089Spjd		return (zvol_open(devp, flag, otyp, cr));
5679219089Spjd#endif
5680219089Spjd
5681219089Spjd	/* This is the control device. Allocate a new minor if requested. */
5682219089Spjd	if (flag & FEXCL) {
5683224791Spjd		mutex_enter(&spa_namespace_lock);
5684219089Spjd		error = zfs_ctldev_init(devp);
5685224791Spjd		mutex_exit(&spa_namespace_lock);
5686219089Spjd	}
5687219089Spjd
5688219089Spjd	return (error);
5689219089Spjd}
5690219089Spjd
5691219089Spjdstatic void
5692219089Spjdzfsdev_close(void *data)
5693219089Spjd{
5694219089Spjd	zfs_onexit_t *zo;
5695219089Spjd	minor_t minor = (minor_t)(uintptr_t)data;
5696219089Spjd
5697219089Spjd	if (minor == 0)
5698219089Spjd		return;
5699219089Spjd
5700224791Spjd	mutex_enter(&spa_namespace_lock);
5701219089Spjd	zo = zfsdev_get_soft_state(minor, ZSST_CTLDEV);
5702219089Spjd	if (zo == NULL) {
5703224791Spjd		mutex_exit(&spa_namespace_lock);
5704219089Spjd		return;
5705219089Spjd	}
5706219089Spjd	zfs_ctldev_destroy(zo, minor);
5707224791Spjd	mutex_exit(&spa_namespace_lock);
5708219089Spjd}
5709219089Spjd
5710219089Spjdstatic int
5711248571Smmzfsdev_ioctl(struct cdev *dev, u_long zcmd, caddr_t arg, int flag,
5712168404Spjd    struct thread *td)
5713168404Spjd{
5714219089Spjd	zfs_cmd_t *zc;
5715248571Smm	uint_t vecnum;
5716249319Smm	int error, rc, len;
5717249004Smm#ifdef illumos
5718248571Smm	minor_t minor = getminor(dev);
5719248571Smm#else
5720249319Smm	zfs_iocparm_t *zc_iocparm;
5721249319Smm	int cflag, cmd, oldvecnum;
5722249319Smm	boolean_t newioc, compat;
5723248571Smm	cred_t *cr = td->td_ucred;
5724248571Smm#endif
5725248571Smm	const zfs_ioc_vec_t *vec;
5726248571Smm	char *saved_poolname = NULL;
5727248571Smm	nvlist_t *innvl = NULL;
5728168404Spjd
5729219089Spjd	cflag = ZFS_CMD_COMPAT_NONE;
5730249319Smm	compat = B_FALSE;
5731249319Smm	newioc = B_TRUE;
5732249319Smm
5733248571Smm	len = IOCPARM_LEN(zcmd);
5734248571Smm	cmd = zcmd & 0xff;
5735219089Spjd
5736214854Sdelphij	/*
5737247540Smm	 * Check if we are talking to supported older binaries
5738247540Smm	 * and translate zfs_cmd if necessary
5739214854Sdelphij	 */
5740249319Smm	if (len != sizeof(zfs_iocparm_t)) {
5741249319Smm		newioc = B_FALSE;
5742249319Smm		if (len == sizeof(zfs_cmd_t)) {
5743249319Smm			cflag = ZFS_CMD_COMPAT_LZC;
5744249319Smm			vecnum = cmd;
5745249319Smm		} else if (len == sizeof(zfs_cmd_deadman_t)) {
5746248571Smm			cflag = ZFS_CMD_COMPAT_DEADMAN;
5747249319Smm			compat = B_TRUE;
5748248571Smm			vecnum = cmd;
5749248571Smm		} else if (len == sizeof(zfs_cmd_v28_t)) {
5750247540Smm			cflag = ZFS_CMD_COMPAT_V28;
5751249319Smm			compat = B_TRUE;
5752248571Smm			vecnum = cmd;
5753247540Smm		} else if (len == sizeof(zfs_cmd_v15_t)) {
5754219089Spjd			cflag = ZFS_CMD_COMPAT_V15;
5755249319Smm			compat = B_TRUE;
5756248571Smm			vecnum = zfs_ioctl_v15_to_v28[cmd];
5757219089Spjd		} else
5758219089Spjd			return (EINVAL);
5759249319Smm	} else
5760248571Smm		vecnum = cmd;
5761214854Sdelphij
5762248571Smm#ifdef illumos
5763248571Smm	vecnum = cmd - ZFS_IOC_FIRST;
5764248571Smm	ASSERT3U(getmajor(dev), ==, ddi_driver_major(zfs_dip));
5765248571Smm#endif
5766248571Smm
5767249319Smm	if (compat) {
5768248571Smm		if (vecnum == ZFS_IOC_COMPAT_PASS)
5769219089Spjd			return (0);
5770248571Smm		else if (vecnum == ZFS_IOC_COMPAT_FAIL)
5771219089Spjd			return (ENOTSUP);
5772219089Spjd	}
5773168404Spjd
5774247540Smm	/*
5775247540Smm	 * Check if we have sufficient kernel memory allocated
5776247540Smm	 * for the zfs_cmd_t request.  Bail out if not so we
5777247540Smm	 * will not access undefined memory region.
5778247540Smm	 */
5779248571Smm	if (vecnum >= sizeof (zfs_ioc_vec) / sizeof (zfs_ioc_vec[0]))
5780249195Smm		return (SET_ERROR(EINVAL));
5781248571Smm	vec = &zfs_ioc_vec[vecnum];
5782168404Spjd
5783248571Smm#ifdef illumos
5784248571Smm	zc = kmem_zalloc(sizeof(zfs_cmd_t), KM_SLEEP);
5785248571Smm	bzero(zc, sizeof(zfs_cmd_t));
5786248571Smm
5787248571Smm	error = ddi_copyin((void *)arg, zc, sizeof (zfs_cmd_t), flag);
5788248571Smm	if (error != 0) {
5789249195Smm		error = SET_ERROR(EFAULT);
5790248571Smm		goto out;
5791248571Smm	}
5792249319Smm#else	/* !illumos */
5793249319Smm	/*
5794249319Smm	 * We don't alloc/free zc only if talking to library ioctl version 2
5795249319Smm	 */
5796249319Smm	if (cflag != ZFS_CMD_COMPAT_LZC) {
5797219089Spjd		zc = kmem_zalloc(sizeof(zfs_cmd_t), KM_SLEEP);
5798219089Spjd		bzero(zc, sizeof(zfs_cmd_t));
5799249319Smm	} else {
5800249319Smm		zc = (void *)arg;
5801249319Smm		error = 0;
5802249319Smm	}
5803249319Smm
5804249319Smm	if (newioc) {
5805249319Smm		zc_iocparm = (void *)arg;
5806249319Smm		if (zc_iocparm->zfs_cmd_size != sizeof(zfs_cmd_t)) {
5807249319Smm			error = SET_ERROR(EFAULT);
5808249319Smm			goto out;
5809249319Smm		}
5810249319Smm		error = ddi_copyin((void *)zc_iocparm->zfs_cmd, zc,
5811249319Smm		    sizeof(zfs_cmd_t), flag);
5812249319Smm		if (error != 0) {
5813249319Smm			error = SET_ERROR(EFAULT);
5814249319Smm			goto out;
5815249319Smm		}
5816249319Smm	}
5817249319Smm
5818249319Smm	if (compat) {
5819248571Smm		zfs_cmd_compat_get(zc, arg, cflag);
5820248571Smm		oldvecnum = vecnum;
5821248571Smm		error = zfs_ioctl_compat_pre(zc, &vecnum, cflag);
5822248571Smm		if (error != 0)
5823248571Smm			goto out;
5824248571Smm		if (oldvecnum != vecnum)
5825248571Smm			vec = &zfs_ioc_vec[vecnum];
5826249319Smm	}
5827249319Smm#endif	/* !illumos */
5828248571Smm
5829248571Smm	zc->zc_iflags = flag & FKIOCTL;
5830248571Smm	if (zc->zc_nvlist_src_size != 0) {
5831248571Smm		error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
5832248571Smm		    zc->zc_iflags, &innvl);
5833248571Smm		if (error != 0)
5834248571Smm			goto out;
5835219089Spjd	}
5836219089Spjd
5837248571Smm	/* rewrite innvl for backwards compatibility */
5838249319Smm	if (compat)
5839248571Smm		innvl = zfs_ioctl_compat_innvl(zc, innvl, vecnum, cflag);
5840168404Spjd
5841168404Spjd	/*
5842168404Spjd	 * Ensure that all pool/dataset names are valid before we pass down to
5843168404Spjd	 * the lower layers.
5844168404Spjd	 */
5845248571Smm	zc->zc_name[sizeof (zc->zc_name) - 1] = '\0';
5846248571Smm	switch (vec->zvec_namecheck) {
5847248571Smm	case POOL_NAME:
5848248571Smm		if (pool_namecheck(zc->zc_name, NULL, NULL) != 0)
5849249195Smm			error = SET_ERROR(EINVAL);
5850248571Smm		else
5851248571Smm			error = pool_status_check(zc->zc_name,
5852248571Smm			    vec->zvec_namecheck, vec->zvec_pool_check);
5853248571Smm		break;
5854168404Spjd
5855248571Smm	case DATASET_NAME:
5856248571Smm		if (dataset_namecheck(zc->zc_name, NULL, NULL) != 0)
5857249195Smm			error = SET_ERROR(EINVAL);
5858248571Smm		else
5859248571Smm			error = pool_status_check(zc->zc_name,
5860248571Smm			    vec->zvec_namecheck, vec->zvec_pool_check);
5861248571Smm		break;
5862168404Spjd
5863248571Smm	case NO_NAME:
5864248571Smm		break;
5865168404Spjd	}
5866168404Spjd
5867248571Smm	if (error == 0 && !(flag & FKIOCTL))
5868248571Smm		error = vec->zvec_secpolicy(zc, innvl, cr);
5869168404Spjd
5870248571Smm	if (error != 0)
5871248571Smm		goto out;
5872248571Smm
5873248571Smm	/* legacy ioctls can modify zc_name */
5874248571Smm	len = strcspn(zc->zc_name, "/@") + 1;
5875248571Smm	saved_poolname = kmem_alloc(len, KM_SLEEP);
5876248571Smm	(void) strlcpy(saved_poolname, zc->zc_name, len);
5877248571Smm
5878248571Smm	if (vec->zvec_func != NULL) {
5879248571Smm		nvlist_t *outnvl;
5880248571Smm		int puterror = 0;
5881248571Smm		spa_t *spa;
5882248571Smm		nvlist_t *lognv = NULL;
5883248571Smm
5884248571Smm		ASSERT(vec->zvec_legacy_func == NULL);
5885248571Smm
5886248571Smm		/*
5887248571Smm		 * Add the innvl to the lognv before calling the func,
5888248571Smm		 * in case the func changes the innvl.
5889248571Smm		 */
5890248571Smm		if (vec->zvec_allow_log) {
5891248571Smm			lognv = fnvlist_alloc();
5892248571Smm			fnvlist_add_string(lognv, ZPOOL_HIST_IOCTL,
5893248571Smm			    vec->zvec_name);
5894248571Smm			if (!nvlist_empty(innvl)) {
5895248571Smm				fnvlist_add_nvlist(lognv, ZPOOL_HIST_INPUT_NVL,
5896248571Smm				    innvl);
5897248571Smm			}
5898248571Smm		}
5899248571Smm
5900248571Smm		outnvl = fnvlist_alloc();
5901248571Smm		error = vec->zvec_func(zc->zc_name, innvl, outnvl);
5902248571Smm
5903248571Smm		if (error == 0 && vec->zvec_allow_log &&
5904248571Smm		    spa_open(zc->zc_name, &spa, FTAG) == 0) {
5905248571Smm			if (!nvlist_empty(outnvl)) {
5906248571Smm				fnvlist_add_nvlist(lognv, ZPOOL_HIST_OUTPUT_NVL,
5907248571Smm				    outnvl);
5908248571Smm			}
5909248571Smm			(void) spa_history_log_nvl(spa, lognv);
5910248571Smm			spa_close(spa, FTAG);
5911248571Smm		}
5912248571Smm		fnvlist_free(lognv);
5913248571Smm
5914248571Smm		/* rewrite outnvl for backwards compatibility */
5915249319Smm		if (cflag != ZFS_CMD_COMPAT_NONE && cflag != ZFS_CMD_COMPAT_LZC)
5916248571Smm			outnvl = zfs_ioctl_compat_outnvl(zc, outnvl, vecnum,
5917248571Smm			    cflag);
5918248571Smm
5919248571Smm		if (!nvlist_empty(outnvl) || zc->zc_nvlist_dst_size != 0) {
5920248571Smm			int smusherror = 0;
5921248571Smm			if (vec->zvec_smush_outnvlist) {
5922248571Smm				smusherror = nvlist_smush(outnvl,
5923248571Smm				    zc->zc_nvlist_dst_size);
5924248571Smm			}
5925248571Smm			if (smusherror == 0)
5926248571Smm				puterror = put_nvlist(zc, outnvl);
5927248571Smm		}
5928248571Smm
5929248571Smm		if (puterror != 0)
5930248571Smm			error = puterror;
5931248571Smm
5932248571Smm		nvlist_free(outnvl);
5933248571Smm	} else {
5934248571Smm		error = vec->zvec_legacy_func(zc);
5935196985Spjd	}
5936185029Spjd
5937248571Smmout:
5938248571Smm	nvlist_free(innvl);
5939249319Smm
5940249319Smm	if (compat) {
5941249319Smm		zfs_ioctl_compat_post(zc, cmd, cflag);
5942249319Smm		zfs_cmd_compat_put(zc, arg, vecnum, cflag);
5943249319Smm	}
5944249319Smm
5945249004Smm#ifdef illumos
5946249004Smm	rc = ddi_copyout(zc, (void *)arg, sizeof (zfs_cmd_t), flag);
5947248571Smm	if (error == 0 && rc != 0)
5948249195Smm		error = SET_ERROR(EFAULT);
5949249319Smm#else
5950249319Smm	if (newioc) {
5951249319Smm		rc = ddi_copyout(zc, (void *)zc_iocparm->zfs_cmd,
5952249319Smm		    sizeof (zfs_cmd_t), flag);
5953249319Smm		if (error == 0 && rc != 0)
5954249319Smm			error = SET_ERROR(EFAULT);
5955249319Smm	}
5956249004Smm#endif
5957248571Smm	if (error == 0 && vec->zvec_allow_log) {
5958248571Smm		char *s = tsd_get(zfs_allow_log_key);
5959248571Smm		if (s != NULL)
5960248571Smm			strfree(s);
5961248571Smm		(void) tsd_set(zfs_allow_log_key, saved_poolname);
5962248571Smm	} else {
5963248571Smm		if (saved_poolname != NULL)
5964248571Smm			strfree(saved_poolname);
5965248571Smm	}
5966248571Smm
5967248571Smm#ifdef illumos
5968248571Smm	kmem_free(zc, sizeof (zfs_cmd_t));
5969249319Smm#else
5970249319Smm	/*
5971249319Smm	 * We don't alloc/free zc only if talking to library ioctl version 2
5972249319Smm	 */
5973249319Smm	if (cflag != ZFS_CMD_COMPAT_LZC)
5974249319Smm		kmem_free(zc, sizeof (zfs_cmd_t));
5975248571Smm#endif
5976168404Spjd	return (error);
5977168404Spjd}
5978168404Spjd
5979219089Spjd#ifdef sun
5980219089Spjdstatic int
5981219089Spjdzfs_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
5982219089Spjd{
5983219089Spjd	if (cmd != DDI_ATTACH)
5984219089Spjd		return (DDI_FAILURE);
5985219089Spjd
5986219089Spjd	if (ddi_create_minor_node(dip, "zfs", S_IFCHR, 0,
5987219089Spjd	    DDI_PSEUDO, 0) == DDI_FAILURE)
5988219089Spjd		return (DDI_FAILURE);
5989219089Spjd
5990219089Spjd	zfs_dip = dip;
5991219089Spjd
5992219089Spjd	ddi_report_dev(dip);
5993219089Spjd
5994219089Spjd	return (DDI_SUCCESS);
5995219089Spjd}
5996219089Spjd
5997219089Spjdstatic int
5998219089Spjdzfs_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
5999219089Spjd{
6000219089Spjd	if (spa_busy() || zfs_busy() || zvol_busy())
6001219089Spjd		return (DDI_FAILURE);
6002219089Spjd
6003219089Spjd	if (cmd != DDI_DETACH)
6004219089Spjd		return (DDI_FAILURE);
6005219089Spjd
6006219089Spjd	zfs_dip = NULL;
6007219089Spjd
6008219089Spjd	ddi_prop_remove_all(dip);
6009219089Spjd	ddi_remove_minor_node(dip, NULL);
6010219089Spjd
6011219089Spjd	return (DDI_SUCCESS);
6012219089Spjd}
6013219089Spjd
6014219089Spjd/*ARGSUSED*/
6015219089Spjdstatic int
6016219089Spjdzfs_info(dev_info_t *dip, ddi_info_cmd_t infocmd, void *arg, void **result)
6017219089Spjd{
6018219089Spjd	switch (infocmd) {
6019219089Spjd	case DDI_INFO_DEVT2DEVINFO:
6020219089Spjd		*result = zfs_dip;
6021219089Spjd		return (DDI_SUCCESS);
6022219089Spjd
6023219089Spjd	case DDI_INFO_DEVT2INSTANCE:
6024219089Spjd		*result = (void *)0;
6025219089Spjd		return (DDI_SUCCESS);
6026219089Spjd	}
6027219089Spjd
6028219089Spjd	return (DDI_FAILURE);
6029219089Spjd}
6030219089Spjd#endif	/* sun */
6031219089Spjd
6032168404Spjd/*
6033168404Spjd * OK, so this is a little weird.
6034168404Spjd *
6035168404Spjd * /dev/zfs is the control node, i.e. minor 0.
6036168404Spjd * /dev/zvol/[r]dsk/pool/dataset are the zvols, minor > 0.
6037168404Spjd *
6038168404Spjd * /dev/zfs has basically nothing to do except serve up ioctls,
6039168404Spjd * so most of the standard driver entry points are in zvol.c.
6040168404Spjd */
6041219089Spjd#ifdef sun
/*
 * Character/block entry points for the zfs driver (only built when "sun"
 * is defined).  open, close and ioctl are served by the zfsdev_* routines;
 * strategy, dump, read and write are the zvol_* routines.  Entry points the
 * driver does not provide are filled with nodev (nochpoll for poll).
 * The initializer is positional, so the order of the entries must not change.
 */
static struct cb_ops zfs_cb_ops = {
	zfsdev_open,	/* open */
	zfsdev_close,	/* close */
	zvol_strategy,	/* strategy */
	nodev,		/* print */
	zvol_dump,	/* dump */
	zvol_read,	/* read */
	zvol_write,	/* write */
	zfsdev_ioctl,	/* ioctl */
	nodev,		/* devmap */
	nodev,		/* mmap */
	nodev,		/* segmap */
	nochpoll,	/* poll */
	ddi_prop_op,	/* prop_op */
	NULL,		/* streamtab */
	D_NEW | D_MP | D_64BIT,		/* Driver compatibility flag */
	CB_REV,		/* version */
	nodev,		/* async read */
	nodev,		/* async write */
};
6062219089Spjd
/*
 * Device operations vector for the zfs driver.  It supplies the
 * zfs_info/zfs_attach/zfs_detach entry points and points at zfs_cb_ops for
 * the character/block operations.  The initializer is positional.
 */
static struct dev_ops zfs_dev_ops = {
	DEVO_REV,	/* version */
	0,		/* refcnt */
	zfs_info,	/* info */
	nulldev,	/* identify */
	nulldev,	/* probe */
	zfs_attach,	/* attach */
	zfs_detach,	/* detach */
	nodev,		/* reset */
	&zfs_cb_ops,	/* driver operations */
	NULL,		/* no bus operations */
	NULL,		/* power */
	ddi_quiesce_not_needed,	/* quiesce */
};
6077219089Spjd
/*
 * Driver linkage record: ties the description string "ZFS storage pool"
 * and zfs_dev_ops to the mod_driverops module operations.
 */
static struct modldrv zfs_modldrv = {
	&mod_driverops,
	"ZFS storage pool",
	&zfs_dev_ops
};
6083219089Spjd
/*
 * Module linkage passed to mod_install(), mod_remove(), mod_info() and
 * ldi_ident_from_mod() by _init(), _fini() and _info().  It lists two
 * linkage records, zfs_modlfs and zfs_modldrv, followed by a NULL
 * terminator.
 */
static struct modlinkage modlinkage = {
	MODREV_1,
	(void *)&zfs_modlfs,
	(void *)&zfs_modldrv,
	NULL
};
6090219089Spjd#endif	/* sun */
6091219089Spjd
6092168404Spjdstatic struct cdevsw zfs_cdevsw = {
6093168404Spjd	.d_version =	D_VERSION,
6094219089Spjd	.d_open =	zfsdev_open,
6095168404Spjd	.d_ioctl =	zfsdev_ioctl,
6096168404Spjd	.d_name =	ZFS_DEV_NAME
6097168404Spjd};
6098168404Spjd
/*
 * Destructor registered with tsd_create() for zfs_allow_log_key.
 * arg is the string stored under that key; it is released with strfree().
 */
static void
zfs_allow_log_destroy(void *arg)
{
	strfree((char *)arg);
}
6105248571Smm
6106248571Smmstatic void
6107168404Spjdzfsdev_init(void)
6108168404Spjd{
6109185029Spjd	zfsdev = make_dev(&zfs_cdevsw, 0x0, UID_ROOT, GID_OPERATOR, 0666,
6110168404Spjd	    ZFS_DEV_NAME);
6111168404Spjd}
6112168404Spjd
6113168404Spjdstatic void
6114168404Spjdzfsdev_fini(void)
6115168404Spjd{
6116168404Spjd	if (zfsdev != NULL)
6117168404Spjd		destroy_dev(zfsdev);
6118168404Spjd}
6119168404Spjd
/*
 * Token obtained from root_mount_hold("ZFS") at MOD_LOAD in zfs_modevent()
 * and handed back to root_mount_rel() once initialization has run.
 */
static struct root_hold_token *zfs_root_token;
/*
 * Not static, so visible to other files; it is not assigned in this part
 * of the file.  NOTE(review): presumably the ZFS kernel process - confirm
 * against the code that sets it.
 */
struct proc *zfsproc;
6122168404Spjd
6123219089Spjd#ifdef sun
6124219089Spjdint
6125219089Spjd_init(void)
6126219089Spjd{
6127219089Spjd	int error;
6128219089Spjd
6129219089Spjd	spa_init(FREAD | FWRITE);
6130219089Spjd	zfs_init();
6131219089Spjd	zvol_init();
6132248571Smm	zfs_ioctl_init();
6133219089Spjd
6134219089Spjd	if ((error = mod_install(&modlinkage)) != 0) {
6135219089Spjd		zvol_fini();
6136219089Spjd		zfs_fini();
6137219089Spjd		spa_fini();
6138219089Spjd		return (error);
6139219089Spjd	}
6140219089Spjd
6141219089Spjd	tsd_create(&zfs_fsyncer_key, NULL);
6142248571Smm	tsd_create(&rrw_tsd_key, rrw_tsd_destroy);
6143248571Smm	tsd_create(&zfs_allow_log_key, zfs_allow_log_destroy);
6144219089Spjd
6145219089Spjd	error = ldi_ident_from_mod(&modlinkage, &zfs_li);
6146219089Spjd	ASSERT(error == 0);
6147219089Spjd	mutex_init(&zfs_share_lock, NULL, MUTEX_DEFAULT, NULL);
6148219089Spjd
6149219089Spjd	return (0);
6150219089Spjd}
6151219089Spjd
6152219089Spjdint
6153219089Spjd_fini(void)
6154219089Spjd{
6155219089Spjd	int error;
6156219089Spjd
6157219089Spjd	if (spa_busy() || zfs_busy() || zvol_busy() || zio_injection_enabled)
6158249195Smm		return (SET_ERROR(EBUSY));
6159219089Spjd
6160219089Spjd	if ((error = mod_remove(&modlinkage)) != 0)
6161219089Spjd		return (error);
6162219089Spjd
6163219089Spjd	zvol_fini();
6164219089Spjd	zfs_fini();
6165219089Spjd	spa_fini();
6166219089Spjd	if (zfs_nfsshare_inited)
6167219089Spjd		(void) ddi_modclose(nfs_mod);
6168219089Spjd	if (zfs_smbshare_inited)
6169219089Spjd		(void) ddi_modclose(smbsrv_mod);
6170219089Spjd	if (zfs_nfsshare_inited || zfs_smbshare_inited)
6171219089Spjd		(void) ddi_modclose(sharefs_mod);
6172219089Spjd
6173219089Spjd	tsd_destroy(&zfs_fsyncer_key);
6174219089Spjd	ldi_ident_release(zfs_li);
6175219089Spjd	zfs_li = NULL;
6176219089Spjd	mutex_destroy(&zfs_share_lock);
6177219089Spjd
6178219089Spjd	return (error);
6179219089Spjd}
6180219089Spjd
6181219089Spjdint
6182219089Spjd_info(struct modinfo *modinfop)
6183219089Spjd{
6184219089Spjd	return (mod_info(&modlinkage, modinfop));
6185219089Spjd}
6186219089Spjd#endif	/* sun */
6187219089Spjd
6188168404Spjdstatic int
6189168404Spjdzfs_modevent(module_t mod, int type, void *unused __unused)
6190168404Spjd{
6191196291Spjd	int error = 0;
6192168404Spjd
6193168404Spjd	switch (type) {
6194168404Spjd	case MOD_LOAD:
6195190878Sthompsa		zfs_root_token = root_mount_hold("ZFS");
6196196291Spjd
6197185029Spjd		mutex_init(&zfs_share_lock, NULL, MUTEX_DEFAULT, NULL);
6198196291Spjd
6199196291Spjd		spa_init(FREAD | FWRITE);
6200196291Spjd		zfs_init();
6201196291Spjd		zvol_init();
6202248571Smm		zfs_ioctl_init();
6203196291Spjd
6204196291Spjd		tsd_create(&zfs_fsyncer_key, NULL);
6205248571Smm		tsd_create(&rrw_tsd_key, rrw_tsd_destroy);
6206248571Smm		tsd_create(&zfs_allow_log_key, zfs_allow_log_destroy);
6207196291Spjd
6208236884Smm		printf("ZFS storage pool version: features support (" SPA_VERSION_STRING ")\n");
6209196291Spjd		root_mount_rel(zfs_root_token);
6210196291Spjd
6211196291Spjd		zfsdev_init();
6212168404Spjd		break;
6213168404Spjd	case MOD_UNLOAD:
6214168775Spjd		if (spa_busy() || zfs_busy() || zvol_busy() ||
6215168404Spjd		    zio_injection_enabled) {
6216168404Spjd			error = EBUSY;
6217168404Spjd			break;
6218168404Spjd		}
6219196291Spjd
6220196291Spjd		zfsdev_fini();
6221168404Spjd		zvol_fini();
6222168404Spjd		zfs_fini();
6223168404Spjd		spa_fini();
6224196291Spjd
6225185029Spjd		tsd_destroy(&zfs_fsyncer_key);
6226185029Spjd		tsd_destroy(&rrw_tsd_key);
6227248571Smm		tsd_destroy(&zfs_allow_log_key);
6228196291Spjd
6229185029Spjd		mutex_destroy(&zfs_share_lock);
6230168404Spjd		break;
6231196291Spjd	default:
6232196291Spjd		error = EOPNOTSUPP;
6233196291Spjd		break;
6234168404Spjd	}
6235168404Spjd	return (error);
6236168404Spjd}
6237168404Spjd
6238168404Spjdstatic moduledata_t zfs_mod = {
6239168404Spjd	"zfsctrl",
6240168404Spjd	zfs_modevent,
6241241394Skevlo	0
6242168404Spjd};
6243169929SpjdDECLARE_MODULE(zfsctrl, zfs_mod, SI_SUB_VFS, SI_ORDER_ANY);
6244246242SavgMODULE_VERSION(zfsctrl, 1);
6245179280SjbMODULE_DEPEND(zfsctrl, opensolaris, 1, 1, 1);
6246193128SkmacyMODULE_DEPEND(zfsctrl, krpc, 1, 1, 1);
6247232938SadrianMODULE_DEPEND(zfsctrl, acl_nfs4, 1, 1, 1);
6248