]> git.proxmox.com Git - mirror_zfs-debian.git/blob - module/zfs/zfs_ioctl.c
Illumos #1948: zpool list should show more detailed pool info
[mirror_zfs-debian.git] / module / zfs / zfs_ioctl.c
1 /*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
7 *
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
12 *
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 *
19 * CDDL HEADER END
20 */
21 /*
22 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
23 * Portions Copyright 2011 Martin Matuska
24 * Portions Copyright 2012 Pawel Jakub Dawidek <pawel@dawidek.net>
25 * Copyright (c) 2012, Joyent, Inc. All rights reserved.
26 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
27 * Copyright (c) 2012 by Delphix. All rights reserved.
28 */
29
30 #include <sys/types.h>
31 #include <sys/param.h>
32 #include <sys/errno.h>
33 #include <sys/uio.h>
34 #include <sys/buf.h>
35 #include <sys/modctl.h>
36 #include <sys/open.h>
37 #include <sys/file.h>
38 #include <sys/kmem.h>
39 #include <sys/conf.h>
40 #include <sys/cmn_err.h>
41 #include <sys/stat.h>
42 #include <sys/zfs_ioctl.h>
43 #include <sys/zfs_vfsops.h>
44 #include <sys/zfs_znode.h>
45 #include <sys/zap.h>
46 #include <sys/spa.h>
47 #include <sys/spa_impl.h>
48 #include <sys/vdev.h>
49 #include <sys/priv_impl.h>
50 #include <sys/dmu.h>
51 #include <sys/dsl_dir.h>
52 #include <sys/dsl_dataset.h>
53 #include <sys/dsl_prop.h>
54 #include <sys/dsl_deleg.h>
55 #include <sys/dmu_objset.h>
56 #include <sys/ddi.h>
57 #include <sys/sunddi.h>
58 #include <sys/sunldi.h>
59 #include <sys/policy.h>
60 #include <sys/zone.h>
61 #include <sys/nvpair.h>
62 #include <sys/pathname.h>
63 #include <sys/mount.h>
64 #include <sys/sdt.h>
65 #include <sys/fs/zfs.h>
66 #include <sys/zfs_ctldir.h>
67 #include <sys/zfs_dir.h>
68 #include <sys/zfs_onexit.h>
69 #include <sys/zvol.h>
70 #include <sys/dsl_scan.h>
71 #include <sharefs/share.h>
72 #include <sys/dmu_objset.h>
73 #include <sys/fm/util.h>
74
75 #include <linux/miscdevice.h>
76
77 #include "zfs_namecheck.h"
78 #include "zfs_prop.h"
79 #include "zfs_deleg.h"
80 #include "zfs_comutil.h"
81
82 kmutex_t zfsdev_state_lock;
83 list_t zfsdev_state_list;
84
85 extern void zfs_init(void);
86 extern void zfs_fini(void);
87
88 typedef int zfs_ioc_func_t(zfs_cmd_t *);
89 typedef int zfs_secpolicy_func_t(zfs_cmd_t *, cred_t *);
90
91 typedef enum {
92 NO_NAME,
93 POOL_NAME,
94 DATASET_NAME
95 } zfs_ioc_namecheck_t;
96
97 typedef enum {
98 POOL_CHECK_NONE = 1 << 0,
99 POOL_CHECK_SUSPENDED = 1 << 1,
100 POOL_CHECK_READONLY = 1 << 2
101 } zfs_ioc_poolcheck_t;
102
103 typedef struct zfs_ioc_vec {
104 zfs_ioc_func_t *zvec_func;
105 zfs_secpolicy_func_t *zvec_secpolicy;
106 zfs_ioc_namecheck_t zvec_namecheck;
107 boolean_t zvec_his_log;
108 zfs_ioc_poolcheck_t zvec_pool_check;
109 } zfs_ioc_vec_t;
110
111 /* This array is indexed by zfs_userquota_prop_t */
112 static const char *userquota_perms[] = {
113 ZFS_DELEG_PERM_USERUSED,
114 ZFS_DELEG_PERM_USERQUOTA,
115 ZFS_DELEG_PERM_GROUPUSED,
116 ZFS_DELEG_PERM_GROUPQUOTA,
117 };
118
119 static int zfs_ioc_userspace_upgrade(zfs_cmd_t *zc);
120 static int zfs_check_settable(const char *name, nvpair_t *property,
121 cred_t *cr);
122 static int zfs_check_clearable(char *dataset, nvlist_t *props,
123 nvlist_t **errors);
124 static int zfs_fill_zplprops_root(uint64_t, nvlist_t *, nvlist_t *,
125 boolean_t *);
126 int zfs_set_prop_nvlist(const char *, zprop_source_t, nvlist_t *, nvlist_t **);
127
128 static void
129 history_str_free(char *buf)
130 {
131 kmem_free(buf, HIS_MAX_RECORD_LEN);
132 }
133
134 static char *
135 history_str_get(zfs_cmd_t *zc)
136 {
137 char *buf;
138
139 if (zc->zc_history == 0)
140 return (NULL);
141
142 buf = kmem_alloc(HIS_MAX_RECORD_LEN, KM_SLEEP | KM_NODEBUG);
143 if (copyinstr((void *)(uintptr_t)zc->zc_history,
144 buf, HIS_MAX_RECORD_LEN, NULL) != 0) {
145 history_str_free(buf);
146 return (NULL);
147 }
148
149 buf[HIS_MAX_RECORD_LEN -1] = '\0';
150
151 return (buf);
152 }
153
154 /*
155 * Check to see if the named dataset is currently defined as bootable
156 */
157 static boolean_t
158 zfs_is_bootfs(const char *name)
159 {
160 objset_t *os;
161
162 if (dmu_objset_hold(name, FTAG, &os) == 0) {
163 boolean_t ret;
164 ret = (dmu_objset_id(os) == spa_bootfs(dmu_objset_spa(os)));
165 dmu_objset_rele(os, FTAG);
166 return (ret);
167 }
168 return (B_FALSE);
169 }
170
171 /*
172 * zfs_earlier_version
173 *
174 * Return non-zero if the spa version is less than requested version.
175 */
176 static int
177 zfs_earlier_version(const char *name, int version)
178 {
179 spa_t *spa;
180
181 if (spa_open(name, &spa, FTAG) == 0) {
182 if (spa_version(spa) < version) {
183 spa_close(spa, FTAG);
184 return (1);
185 }
186 spa_close(spa, FTAG);
187 }
188 return (0);
189 }
190
191 /*
192 * zpl_earlier_version
193 *
194 * Return TRUE if the ZPL version is less than requested version.
195 */
196 static boolean_t
197 zpl_earlier_version(const char *name, int version)
198 {
199 objset_t *os;
200 boolean_t rc = B_TRUE;
201
202 if (dmu_objset_hold(name, FTAG, &os) == 0) {
203 uint64_t zplversion;
204
205 if (dmu_objset_type(os) != DMU_OST_ZFS) {
206 dmu_objset_rele(os, FTAG);
207 return (B_TRUE);
208 }
209 /* XXX reading from non-owned objset */
210 if (zfs_get_zplprop(os, ZFS_PROP_VERSION, &zplversion) == 0)
211 rc = zplversion < version;
212 dmu_objset_rele(os, FTAG);
213 }
214 return (rc);
215 }
216
217 static void
218 zfs_log_history(zfs_cmd_t *zc)
219 {
220 spa_t *spa;
221 char *buf;
222
223 if ((buf = history_str_get(zc)) == NULL)
224 return;
225
226 if (spa_open(zc->zc_name, &spa, FTAG) == 0) {
227 if (spa_version(spa) >= SPA_VERSION_ZPOOL_HISTORY)
228 (void) spa_history_log(spa, buf, LOG_CMD_NORMAL);
229 spa_close(spa, FTAG);
230 }
231 history_str_free(buf);
232 }
233
234 /*
235 * Policy for top-level read operations (list pools). Requires no privileges,
236 * and can be used in the local zone, as there is no associated dataset.
237 */
238 /* ARGSUSED */
239 static int
240 zfs_secpolicy_none(zfs_cmd_t *zc, cred_t *cr)
241 {
242 return (0);
243 }
244
245 /*
246 * Policy for dataset read operations (list children, get statistics). Requires
247 * no privileges, but must be visible in the local zone.
248 */
249 /* ARGSUSED */
250 static int
251 zfs_secpolicy_read(zfs_cmd_t *zc, cred_t *cr)
252 {
253 if (INGLOBALZONE(curproc) ||
254 zone_dataset_visible(zc->zc_name, NULL))
255 return (0);
256
257 return (ENOENT);
258 }
259
260 static int
261 zfs_dozonecheck_impl(const char *dataset, uint64_t zoned, cred_t *cr)
262 {
263 int writable = 1;
264
265 /*
266 * The dataset must be visible by this zone -- check this first
267 * so they don't see EPERM on something they shouldn't know about.
268 */
269 if (!INGLOBALZONE(curproc) &&
270 !zone_dataset_visible(dataset, &writable))
271 return (ENOENT);
272
273 if (INGLOBALZONE(curproc)) {
274 /*
275 * If the fs is zoned, only root can access it from the
276 * global zone.
277 */
278 if (secpolicy_zfs(cr) && zoned)
279 return (EPERM);
280 } else {
281 /*
282 * If we are in a local zone, the 'zoned' property must be set.
283 */
284 if (!zoned)
285 return (EPERM);
286
287 /* must be writable by this zone */
288 if (!writable)
289 return (EPERM);
290 }
291 return (0);
292 }
293
294 static int
295 zfs_dozonecheck(const char *dataset, cred_t *cr)
296 {
297 uint64_t zoned;
298
299 if (dsl_prop_get_integer(dataset, "zoned", &zoned, NULL))
300 return (ENOENT);
301
302 return (zfs_dozonecheck_impl(dataset, zoned, cr));
303 }
304
305 static int
306 zfs_dozonecheck_ds(const char *dataset, dsl_dataset_t *ds, cred_t *cr)
307 {
308 uint64_t zoned;
309
310 rw_enter(&ds->ds_dir->dd_pool->dp_config_rwlock, RW_READER);
311 if (dsl_prop_get_ds(ds, "zoned", 8, 1, &zoned, NULL)) {
312 rw_exit(&ds->ds_dir->dd_pool->dp_config_rwlock);
313 return (ENOENT);
314 }
315 rw_exit(&ds->ds_dir->dd_pool->dp_config_rwlock);
316
317 return (zfs_dozonecheck_impl(dataset, zoned, cr));
318 }
319
320 /*
321 * If name ends in a '@', then require recursive permissions.
322 */
323 int
324 zfs_secpolicy_write_perms(const char *name, const char *perm, cred_t *cr)
325 {
326 int error;
327 boolean_t descendent = B_FALSE;
328 dsl_dataset_t *ds;
329 char *at;
330
331 at = strchr(name, '@');
332 if (at != NULL && at[1] == '\0') {
333 *at = '\0';
334 descendent = B_TRUE;
335 }
336
337 error = dsl_dataset_hold(name, FTAG, &ds);
338 if (at != NULL)
339 *at = '@';
340 if (error != 0)
341 return (error);
342
343 error = zfs_dozonecheck_ds(name, ds, cr);
344 if (error == 0) {
345 error = secpolicy_zfs(cr);
346 if (error)
347 error = dsl_deleg_access_impl(ds, descendent, perm, cr);
348 }
349
350 dsl_dataset_rele(ds, FTAG);
351 return (error);
352 }
353
354 int
355 zfs_secpolicy_write_perms_ds(const char *name, dsl_dataset_t *ds,
356 const char *perm, cred_t *cr)
357 {
358 int error;
359
360 error = zfs_dozonecheck_ds(name, ds, cr);
361 if (error == 0) {
362 error = secpolicy_zfs(cr);
363 if (error)
364 error = dsl_deleg_access_impl(ds, B_FALSE, perm, cr);
365 }
366 return (error);
367 }
368
369 /*
370 * Policy for setting the security label property.
371 *
372 * Returns 0 for success, non-zero for access and other errors.
373 */
374 static int
375 zfs_set_slabel_policy(const char *name, char *strval, cred_t *cr)
376 {
377 #ifdef HAVE_MLSLABEL
378 char ds_hexsl[MAXNAMELEN];
379 bslabel_t ds_sl, new_sl;
380 boolean_t new_default = FALSE;
381 uint64_t zoned;
382 int needed_priv = -1;
383 int error;
384
385 /* First get the existing dataset label. */
386 error = dsl_prop_get(name, zfs_prop_to_name(ZFS_PROP_MLSLABEL),
387 1, sizeof (ds_hexsl), &ds_hexsl, NULL);
388 if (error)
389 return (EPERM);
390
391 if (strcasecmp(strval, ZFS_MLSLABEL_DEFAULT) == 0)
392 new_default = TRUE;
393
394 /* The label must be translatable */
395 if (!new_default && (hexstr_to_label(strval, &new_sl) != 0))
396 return (EINVAL);
397
398 /*
399 * In a non-global zone, disallow attempts to set a label that
400 * doesn't match that of the zone; otherwise no other checks
401 * are needed.
402 */
403 if (!INGLOBALZONE(curproc)) {
404 if (new_default || !blequal(&new_sl, CR_SL(CRED())))
405 return (EPERM);
406 return (0);
407 }
408
409 /*
410 * For global-zone datasets (i.e., those whose zoned property is
411 * "off", verify that the specified new label is valid for the
412 * global zone.
413 */
414 if (dsl_prop_get_integer(name,
415 zfs_prop_to_name(ZFS_PROP_ZONED), &zoned, NULL))
416 return (EPERM);
417 if (!zoned) {
418 if (zfs_check_global_label(name, strval) != 0)
419 return (EPERM);
420 }
421
422 /*
423 * If the existing dataset label is nondefault, check if the
424 * dataset is mounted (label cannot be changed while mounted).
425 * Get the zfs_sb_t; if there isn't one, then the dataset isn't
426 * mounted (or isn't a dataset, doesn't exist, ...).
427 */
428 if (strcasecmp(ds_hexsl, ZFS_MLSLABEL_DEFAULT) != 0) {
429 objset_t *os;
430 static char *setsl_tag = "setsl_tag";
431
432 /*
433 * Try to own the dataset; abort if there is any error,
434 * (e.g., already mounted, in use, or other error).
435 */
436 error = dmu_objset_own(name, DMU_OST_ZFS, B_TRUE,
437 setsl_tag, &os);
438 if (error)
439 return (EPERM);
440
441 dmu_objset_disown(os, setsl_tag);
442
443 if (new_default) {
444 needed_priv = PRIV_FILE_DOWNGRADE_SL;
445 goto out_check;
446 }
447
448 if (hexstr_to_label(strval, &new_sl) != 0)
449 return (EPERM);
450
451 if (blstrictdom(&ds_sl, &new_sl))
452 needed_priv = PRIV_FILE_DOWNGRADE_SL;
453 else if (blstrictdom(&new_sl, &ds_sl))
454 needed_priv = PRIV_FILE_UPGRADE_SL;
455 } else {
456 /* dataset currently has a default label */
457 if (!new_default)
458 needed_priv = PRIV_FILE_UPGRADE_SL;
459 }
460
461 out_check:
462 if (needed_priv != -1)
463 return (PRIV_POLICY(cr, needed_priv, B_FALSE, EPERM, NULL));
464 return (0);
465 #else
466 return ENOTSUP;
467 #endif /* HAVE_MLSLABEL */
468 }
469
470 static int
471 zfs_secpolicy_setprop(const char *dsname, zfs_prop_t prop, nvpair_t *propval,
472 cred_t *cr)
473 {
474 char *strval;
475
476 /*
477 * Check permissions for special properties.
478 */
479 switch (prop) {
480 default:
481 break;
482 case ZFS_PROP_ZONED:
483 /*
484 * Disallow setting of 'zoned' from within a local zone.
485 */
486 if (!INGLOBALZONE(curproc))
487 return (EPERM);
488 break;
489
490 case ZFS_PROP_QUOTA:
491 if (!INGLOBALZONE(curproc)) {
492 uint64_t zoned;
493 char setpoint[MAXNAMELEN];
494 /*
495 * Unprivileged users are allowed to modify the
496 * quota on things *under* (ie. contained by)
497 * the thing they own.
498 */
499 if (dsl_prop_get_integer(dsname, "zoned", &zoned,
500 setpoint))
501 return (EPERM);
502 if (!zoned || strlen(dsname) <= strlen(setpoint))
503 return (EPERM);
504 }
505 break;
506
507 case ZFS_PROP_MLSLABEL:
508 if (!is_system_labeled())
509 return (EPERM);
510
511 if (nvpair_value_string(propval, &strval) == 0) {
512 int err;
513
514 err = zfs_set_slabel_policy(dsname, strval, CRED());
515 if (err != 0)
516 return (err);
517 }
518 break;
519 }
520
521 return (zfs_secpolicy_write_perms(dsname, zfs_prop_to_name(prop), cr));
522 }
523
524 int
525 zfs_secpolicy_fsacl(zfs_cmd_t *zc, cred_t *cr)
526 {
527 int error;
528
529 error = zfs_dozonecheck(zc->zc_name, cr);
530 if (error)
531 return (error);
532
533 /*
534 * permission to set permissions will be evaluated later in
535 * dsl_deleg_can_allow()
536 */
537 return (0);
538 }
539
540 int
541 zfs_secpolicy_rollback(zfs_cmd_t *zc, cred_t *cr)
542 {
543 return (zfs_secpolicy_write_perms(zc->zc_name,
544 ZFS_DELEG_PERM_ROLLBACK, cr));
545 }
546
547 int
548 zfs_secpolicy_send(zfs_cmd_t *zc, cred_t *cr)
549 {
550 spa_t *spa;
551 dsl_pool_t *dp;
552 dsl_dataset_t *ds;
553 char *cp;
554 int error;
555
556 /*
557 * Generate the current snapshot name from the given objsetid, then
558 * use that name for the secpolicy/zone checks.
559 */
560 cp = strchr(zc->zc_name, '@');
561 if (cp == NULL)
562 return (EINVAL);
563 error = spa_open(zc->zc_name, &spa, FTAG);
564 if (error)
565 return (error);
566
567 dp = spa_get_dsl(spa);
568 rw_enter(&dp->dp_config_rwlock, RW_READER);
569 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &ds);
570 rw_exit(&dp->dp_config_rwlock);
571 spa_close(spa, FTAG);
572 if (error)
573 return (error);
574
575 dsl_dataset_name(ds, zc->zc_name);
576
577 error = zfs_secpolicy_write_perms_ds(zc->zc_name, ds,
578 ZFS_DELEG_PERM_SEND, cr);
579 dsl_dataset_rele(ds, FTAG);
580
581 return (error);
582 }
583
584 #ifdef HAVE_SMB_SHARE
585 static int
586 zfs_secpolicy_deleg_share(zfs_cmd_t *zc, cred_t *cr)
587 {
588 vnode_t *vp;
589 int error;
590
591 if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
592 NO_FOLLOW, NULL, &vp)) != 0)
593 return (error);
594
595 /* Now make sure mntpnt and dataset are ZFS */
596
597 if (vp->v_vfsp->vfs_fstype != zfsfstype ||
598 (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
599 zc->zc_name) != 0)) {
600 VN_RELE(vp);
601 return (EPERM);
602 }
603
604 VN_RELE(vp);
605 return (dsl_deleg_access(zc->zc_name,
606 ZFS_DELEG_PERM_SHARE, cr));
607 }
608 #endif /* HAVE_SMB_SHARE */
609
610 int
611 zfs_secpolicy_share(zfs_cmd_t *zc, cred_t *cr)
612 {
613 #ifdef HAVE_SMB_SHARE
614 if (!INGLOBALZONE(curproc))
615 return (EPERM);
616
617 if (secpolicy_nfs(cr) == 0) {
618 return (0);
619 } else {
620 return (zfs_secpolicy_deleg_share(zc, cr));
621 }
622 #else
623 return (ENOTSUP);
624 #endif /* HAVE_SMB_SHARE */
625 }
626
627 int
628 zfs_secpolicy_smb_acl(zfs_cmd_t *zc, cred_t *cr)
629 {
630 #ifdef HAVE_SMB_SHARE
631 if (!INGLOBALZONE(curproc))
632 return (EPERM);
633
634 if (secpolicy_smb(cr) == 0) {
635 return (0);
636 } else {
637 return (zfs_secpolicy_deleg_share(zc, cr));
638 }
639 #else
640 return (ENOTSUP);
641 #endif /* HAVE_SMB_SHARE */
642 }
643
644 static int
645 zfs_get_parent(const char *datasetname, char *parent, int parentsize)
646 {
647 char *cp;
648
649 /*
650 * Remove the @bla or /bla from the end of the name to get the parent.
651 */
652 (void) strncpy(parent, datasetname, parentsize);
653 cp = strrchr(parent, '@');
654 if (cp != NULL) {
655 cp[0] = '\0';
656 } else {
657 cp = strrchr(parent, '/');
658 if (cp == NULL)
659 return (ENOENT);
660 cp[0] = '\0';
661 }
662
663 return (0);
664 }
665
666 int
667 zfs_secpolicy_destroy_perms(const char *name, cred_t *cr)
668 {
669 int error;
670
671 if ((error = zfs_secpolicy_write_perms(name,
672 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
673 return (error);
674
675 return (zfs_secpolicy_write_perms(name, ZFS_DELEG_PERM_DESTROY, cr));
676 }
677
678 static int
679 zfs_secpolicy_destroy(zfs_cmd_t *zc, cred_t *cr)
680 {
681 return (zfs_secpolicy_destroy_perms(zc->zc_name, cr));
682 }
683
684 /*
685 * Destroying snapshots with delegated permissions requires
686 * descendent mount and destroy permissions.
687 */
688 static int
689 zfs_secpolicy_destroy_recursive(zfs_cmd_t *zc, cred_t *cr)
690 {
691 int error;
692 char *dsname;
693
694 dsname = kmem_asprintf("%s@", zc->zc_name);
695
696 error = zfs_secpolicy_destroy_perms(dsname, cr);
697 if (error == ENOENT)
698 error = zfs_secpolicy_destroy_perms(zc->zc_name, cr);
699
700 strfree(dsname);
701 return (error);
702 }
703
704 int
705 zfs_secpolicy_rename_perms(const char *from, const char *to, cred_t *cr)
706 {
707 char parentname[MAXNAMELEN];
708 int error;
709
710 if ((error = zfs_secpolicy_write_perms(from,
711 ZFS_DELEG_PERM_RENAME, cr)) != 0)
712 return (error);
713
714 if ((error = zfs_secpolicy_write_perms(from,
715 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
716 return (error);
717
718 if ((error = zfs_get_parent(to, parentname,
719 sizeof (parentname))) != 0)
720 return (error);
721
722 if ((error = zfs_secpolicy_write_perms(parentname,
723 ZFS_DELEG_PERM_CREATE, cr)) != 0)
724 return (error);
725
726 if ((error = zfs_secpolicy_write_perms(parentname,
727 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
728 return (error);
729
730 return (error);
731 }
732
733 static int
734 zfs_secpolicy_rename(zfs_cmd_t *zc, cred_t *cr)
735 {
736 return (zfs_secpolicy_rename_perms(zc->zc_name, zc->zc_value, cr));
737 }
738
739 static int
740 zfs_secpolicy_promote(zfs_cmd_t *zc, cred_t *cr)
741 {
742 char parentname[MAXNAMELEN];
743 objset_t *clone;
744 int error;
745
746 error = zfs_secpolicy_write_perms(zc->zc_name,
747 ZFS_DELEG_PERM_PROMOTE, cr);
748 if (error)
749 return (error);
750
751 error = dmu_objset_hold(zc->zc_name, FTAG, &clone);
752
753 if (error == 0) {
754 dsl_dataset_t *pclone = NULL;
755 dsl_dir_t *dd;
756 dd = clone->os_dsl_dataset->ds_dir;
757
758 rw_enter(&dd->dd_pool->dp_config_rwlock, RW_READER);
759 error = dsl_dataset_hold_obj(dd->dd_pool,
760 dd->dd_phys->dd_origin_obj, FTAG, &pclone);
761 rw_exit(&dd->dd_pool->dp_config_rwlock);
762 if (error) {
763 dmu_objset_rele(clone, FTAG);
764 return (error);
765 }
766
767 error = zfs_secpolicy_write_perms(zc->zc_name,
768 ZFS_DELEG_PERM_MOUNT, cr);
769
770 dsl_dataset_name(pclone, parentname);
771 dmu_objset_rele(clone, FTAG);
772 dsl_dataset_rele(pclone, FTAG);
773 if (error == 0)
774 error = zfs_secpolicy_write_perms(parentname,
775 ZFS_DELEG_PERM_PROMOTE, cr);
776 }
777 return (error);
778 }
779
780 static int
781 zfs_secpolicy_receive(zfs_cmd_t *zc, cred_t *cr)
782 {
783 int error;
784
785 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
786 ZFS_DELEG_PERM_RECEIVE, cr)) != 0)
787 return (error);
788
789 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
790 ZFS_DELEG_PERM_MOUNT, cr)) != 0)
791 return (error);
792
793 return (zfs_secpolicy_write_perms(zc->zc_name,
794 ZFS_DELEG_PERM_CREATE, cr));
795 }
796
797 int
798 zfs_secpolicy_snapshot_perms(const char *name, cred_t *cr)
799 {
800 return (zfs_secpolicy_write_perms(name,
801 ZFS_DELEG_PERM_SNAPSHOT, cr));
802 }
803
804 static int
805 zfs_secpolicy_snapshot(zfs_cmd_t *zc, cred_t *cr)
806 {
807
808 return (zfs_secpolicy_snapshot_perms(zc->zc_name, cr));
809 }
810
811 static int
812 zfs_secpolicy_create(zfs_cmd_t *zc, cred_t *cr)
813 {
814 char parentname[MAXNAMELEN];
815 int error;
816
817 if ((error = zfs_get_parent(zc->zc_name, parentname,
818 sizeof (parentname))) != 0)
819 return (error);
820
821 if (zc->zc_value[0] != '\0') {
822 if ((error = zfs_secpolicy_write_perms(zc->zc_value,
823 ZFS_DELEG_PERM_CLONE, cr)) != 0)
824 return (error);
825 }
826
827 if ((error = zfs_secpolicy_write_perms(parentname,
828 ZFS_DELEG_PERM_CREATE, cr)) != 0)
829 return (error);
830
831 error = zfs_secpolicy_write_perms(parentname,
832 ZFS_DELEG_PERM_MOUNT, cr);
833
834 return (error);
835 }
836
837 /*
838 * Policy for pool operations - create/destroy pools, add vdevs, etc. Requires
839 * SYS_CONFIG privilege, which is not available in a local zone.
840 */
841 /* ARGSUSED */
842 static int
843 zfs_secpolicy_config(zfs_cmd_t *zc, cred_t *cr)
844 {
845 if (secpolicy_sys_config(cr, B_FALSE) != 0)
846 return (EPERM);
847
848 return (0);
849 }
850
851 /*
852 * Policy for object to name lookups.
853 */
854 /* ARGSUSED */
855 static int
856 zfs_secpolicy_diff(zfs_cmd_t *zc, cred_t *cr)
857 {
858 int error;
859
860 if ((error = secpolicy_sys_config(cr, B_FALSE)) == 0)
861 return (0);
862
863 error = zfs_secpolicy_write_perms(zc->zc_name, ZFS_DELEG_PERM_DIFF, cr);
864 return (error);
865 }
866
867 /*
868 * Policy for fault injection. Requires all privileges.
869 */
870 /* ARGSUSED */
871 static int
872 zfs_secpolicy_inject(zfs_cmd_t *zc, cred_t *cr)
873 {
874 return (secpolicy_zinject(cr));
875 }
876
877 static int
878 zfs_secpolicy_inherit(zfs_cmd_t *zc, cred_t *cr)
879 {
880 zfs_prop_t prop = zfs_name_to_prop(zc->zc_value);
881
882 if (prop == ZPROP_INVAL) {
883 if (!zfs_prop_user(zc->zc_value))
884 return (EINVAL);
885 return (zfs_secpolicy_write_perms(zc->zc_name,
886 ZFS_DELEG_PERM_USERPROP, cr));
887 } else {
888 return (zfs_secpolicy_setprop(zc->zc_name, prop,
889 NULL, cr));
890 }
891 }
892
893 static int
894 zfs_secpolicy_userspace_one(zfs_cmd_t *zc, cred_t *cr)
895 {
896 int err = zfs_secpolicy_read(zc, cr);
897 if (err)
898 return (err);
899
900 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
901 return (EINVAL);
902
903 if (zc->zc_value[0] == 0) {
904 /*
905 * They are asking about a posix uid/gid. If it's
906 * themself, allow it.
907 */
908 if (zc->zc_objset_type == ZFS_PROP_USERUSED ||
909 zc->zc_objset_type == ZFS_PROP_USERQUOTA) {
910 if (zc->zc_guid == crgetuid(cr))
911 return (0);
912 } else {
913 if (groupmember(zc->zc_guid, cr))
914 return (0);
915 }
916 }
917
918 return (zfs_secpolicy_write_perms(zc->zc_name,
919 userquota_perms[zc->zc_objset_type], cr));
920 }
921
922 static int
923 zfs_secpolicy_userspace_many(zfs_cmd_t *zc, cred_t *cr)
924 {
925 int err = zfs_secpolicy_read(zc, cr);
926 if (err)
927 return (err);
928
929 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
930 return (EINVAL);
931
932 return (zfs_secpolicy_write_perms(zc->zc_name,
933 userquota_perms[zc->zc_objset_type], cr));
934 }
935
936 static int
937 zfs_secpolicy_userspace_upgrade(zfs_cmd_t *zc, cred_t *cr)
938 {
939 return (zfs_secpolicy_setprop(zc->zc_name, ZFS_PROP_VERSION,
940 NULL, cr));
941 }
942
943 static int
944 zfs_secpolicy_hold(zfs_cmd_t *zc, cred_t *cr)
945 {
946 return (zfs_secpolicy_write_perms(zc->zc_name,
947 ZFS_DELEG_PERM_HOLD, cr));
948 }
949
950 static int
951 zfs_secpolicy_release(zfs_cmd_t *zc, cred_t *cr)
952 {
953 return (zfs_secpolicy_write_perms(zc->zc_name,
954 ZFS_DELEG_PERM_RELEASE, cr));
955 }
956
957 /*
958 * Policy for allowing temporary snapshots to be taken or released
959 */
960 static int
961 zfs_secpolicy_tmp_snapshot(zfs_cmd_t *zc, cred_t *cr)
962 {
963 /*
964 * A temporary snapshot is the same as a snapshot,
965 * hold, destroy and release all rolled into one.
966 * Delegated diff alone is sufficient that we allow this.
967 */
968 int error;
969
970 if ((error = zfs_secpolicy_write_perms(zc->zc_name,
971 ZFS_DELEG_PERM_DIFF, cr)) == 0)
972 return (0);
973
974 error = zfs_secpolicy_snapshot(zc, cr);
975 if (!error)
976 error = zfs_secpolicy_hold(zc, cr);
977 if (!error)
978 error = zfs_secpolicy_release(zc, cr);
979 if (!error)
980 error = zfs_secpolicy_destroy(zc, cr);
981 return (error);
982 }
983
984 /*
985 * Returns the nvlist as specified by the user in the zfs_cmd_t.
986 */
987 static int
988 get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp)
989 {
990 char *packed;
991 int error;
992 nvlist_t *list = NULL;
993
994 /*
995 * Read in and unpack the user-supplied nvlist.
996 */
997 if (size == 0)
998 return (EINVAL);
999
1000 packed = kmem_alloc(size, KM_SLEEP | KM_NODEBUG);
1001
1002 if ((error = ddi_copyin((void *)(uintptr_t)nvl, packed, size,
1003 iflag)) != 0) {
1004 kmem_free(packed, size);
1005 return (error);
1006 }
1007
1008 if ((error = nvlist_unpack(packed, size, &list, 0)) != 0) {
1009 kmem_free(packed, size);
1010 return (error);
1011 }
1012
1013 kmem_free(packed, size);
1014
1015 *nvp = list;
1016 return (0);
1017 }
1018
1019 static int
1020 fit_error_list(zfs_cmd_t *zc, nvlist_t **errors)
1021 {
1022 size_t size;
1023
1024 VERIFY(nvlist_size(*errors, &size, NV_ENCODE_NATIVE) == 0);
1025
1026 if (size > zc->zc_nvlist_dst_size) {
1027 nvpair_t *more_errors;
1028 int n = 0;
1029
1030 if (zc->zc_nvlist_dst_size < 1024)
1031 return (ENOMEM);
1032
1033 VERIFY(nvlist_add_int32(*errors, ZPROP_N_MORE_ERRORS, 0) == 0);
1034 more_errors = nvlist_prev_nvpair(*errors, NULL);
1035
1036 do {
1037 nvpair_t *pair = nvlist_prev_nvpair(*errors,
1038 more_errors);
1039 VERIFY(nvlist_remove_nvpair(*errors, pair) == 0);
1040 n++;
1041 VERIFY(nvlist_size(*errors, &size,
1042 NV_ENCODE_NATIVE) == 0);
1043 } while (size > zc->zc_nvlist_dst_size);
1044
1045 VERIFY(nvlist_remove_nvpair(*errors, more_errors) == 0);
1046 VERIFY(nvlist_add_int32(*errors, ZPROP_N_MORE_ERRORS, n) == 0);
1047 ASSERT(nvlist_size(*errors, &size, NV_ENCODE_NATIVE) == 0);
1048 ASSERT(size <= zc->zc_nvlist_dst_size);
1049 }
1050
1051 return (0);
1052 }
1053
1054 static int
1055 put_nvlist(zfs_cmd_t *zc, nvlist_t *nvl)
1056 {
1057 char *packed = NULL;
1058 int error = 0;
1059 size_t size;
1060
1061 VERIFY(nvlist_size(nvl, &size, NV_ENCODE_NATIVE) == 0);
1062
1063 if (size > zc->zc_nvlist_dst_size) {
1064 error = ENOMEM;
1065 } else {
1066 packed = kmem_alloc(size, KM_SLEEP | KM_NODEBUG);
1067 VERIFY(nvlist_pack(nvl, &packed, &size, NV_ENCODE_NATIVE,
1068 KM_SLEEP) == 0);
1069 if (ddi_copyout(packed, (void *)(uintptr_t)zc->zc_nvlist_dst,
1070 size, zc->zc_iflags) != 0)
1071 error = EFAULT;
1072 kmem_free(packed, size);
1073 }
1074
1075 zc->zc_nvlist_dst_size = size;
1076 return (error);
1077 }
1078
1079 static int
1080 get_zfs_sb(const char *dsname, zfs_sb_t **zsbp)
1081 {
1082 objset_t *os;
1083 int error;
1084
1085 error = dmu_objset_hold(dsname, FTAG, &os);
1086 if (error)
1087 return (error);
1088 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1089 dmu_objset_rele(os, FTAG);
1090 return (EINVAL);
1091 }
1092
1093 mutex_enter(&os->os_user_ptr_lock);
1094 *zsbp = dmu_objset_get_user(os);
1095 if (*zsbp && (*zsbp)->z_sb) {
1096 atomic_inc(&((*zsbp)->z_sb->s_active));
1097 } else {
1098 error = ESRCH;
1099 }
1100 mutex_exit(&os->os_user_ptr_lock);
1101 dmu_objset_rele(os, FTAG);
1102 return (error);
1103 }
1104
1105 /*
1106 * Find a zfs_sb_t for a mounted filesystem, or create our own, in which
1107 * case its z_sb will be NULL, and it will be opened as the owner.
1108 */
1109 static int
1110 zfs_sb_hold(const char *name, void *tag, zfs_sb_t **zsbp, boolean_t writer)
1111 {
1112 int error = 0;
1113
1114 if (get_zfs_sb(name, zsbp) != 0)
1115 error = zfs_sb_create(name, zsbp);
1116 if (error == 0) {
1117 rrw_enter(&(*zsbp)->z_teardown_lock, (writer) ? RW_WRITER :
1118 RW_READER, tag);
1119 if ((*zsbp)->z_unmounted) {
1120 /*
1121 * XXX we could probably try again, since the unmounting
1122 * thread should be just about to disassociate the
1123 * objset from the zfsvfs.
1124 */
1125 rrw_exit(&(*zsbp)->z_teardown_lock, tag);
1126 return (EBUSY);
1127 }
1128 }
1129 return (error);
1130 }
1131
1132 static void
1133 zfs_sb_rele(zfs_sb_t *zsb, void *tag)
1134 {
1135 rrw_exit(&zsb->z_teardown_lock, tag);
1136
1137 if (zsb->z_sb) {
1138 deactivate_super(zsb->z_sb);
1139 } else {
1140 dmu_objset_disown(zsb->z_os, zsb);
1141 zfs_sb_free(zsb);
1142 }
1143 }
1144
1145 static int
1146 zfs_ioc_pool_create(zfs_cmd_t *zc)
1147 {
1148 int error;
1149 nvlist_t *config, *props = NULL;
1150 nvlist_t *rootprops = NULL;
1151 nvlist_t *zplprops = NULL;
1152 char *buf;
1153
1154 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1155 zc->zc_iflags, &config)))
1156 return (error);
1157
1158 if (zc->zc_nvlist_src_size != 0 && (error =
1159 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1160 zc->zc_iflags, &props))) {
1161 nvlist_free(config);
1162 return (error);
1163 }
1164
1165 if (props) {
1166 nvlist_t *nvl = NULL;
1167 uint64_t version = SPA_VERSION;
1168
1169 (void) nvlist_lookup_uint64(props,
1170 zpool_prop_to_name(ZPOOL_PROP_VERSION), &version);
1171 if (version < SPA_VERSION_INITIAL || version > SPA_VERSION) {
1172 error = EINVAL;
1173 goto pool_props_bad;
1174 }
1175 (void) nvlist_lookup_nvlist(props, ZPOOL_ROOTFS_PROPS, &nvl);
1176 if (nvl) {
1177 error = nvlist_dup(nvl, &rootprops, KM_SLEEP);
1178 if (error != 0) {
1179 nvlist_free(config);
1180 nvlist_free(props);
1181 return (error);
1182 }
1183 (void) nvlist_remove_all(props, ZPOOL_ROOTFS_PROPS);
1184 }
1185 VERIFY(nvlist_alloc(&zplprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
1186 error = zfs_fill_zplprops_root(version, rootprops,
1187 zplprops, NULL);
1188 if (error)
1189 goto pool_props_bad;
1190 }
1191
1192 buf = history_str_get(zc);
1193
1194 error = spa_create(zc->zc_name, config, props, buf, zplprops);
1195
1196 /*
1197 * Set the remaining root properties
1198 */
1199 if (!error && (error = zfs_set_prop_nvlist(zc->zc_name,
1200 ZPROP_SRC_LOCAL, rootprops, NULL)) != 0)
1201 (void) spa_destroy(zc->zc_name);
1202
1203 if (buf != NULL)
1204 history_str_free(buf);
1205
1206 pool_props_bad:
1207 nvlist_free(rootprops);
1208 nvlist_free(zplprops);
1209 nvlist_free(config);
1210 nvlist_free(props);
1211
1212 return (error);
1213 }
1214
1215 static int
1216 zfs_ioc_pool_destroy(zfs_cmd_t *zc)
1217 {
1218 int error;
1219 zfs_log_history(zc);
1220 error = spa_destroy(zc->zc_name);
1221 if (error == 0)
1222 zvol_remove_minors(zc->zc_name);
1223 return (error);
1224 }
1225
1226 static int
1227 zfs_ioc_pool_import(zfs_cmd_t *zc)
1228 {
1229 nvlist_t *config, *props = NULL;
1230 uint64_t guid;
1231 int error;
1232
1233 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1234 zc->zc_iflags, &config)) != 0)
1235 return (error);
1236
1237 if (zc->zc_nvlist_src_size != 0 && (error =
1238 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1239 zc->zc_iflags, &props))) {
1240 nvlist_free(config);
1241 return (error);
1242 }
1243
1244 if (nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID, &guid) != 0 ||
1245 guid != zc->zc_guid)
1246 error = EINVAL;
1247 else
1248 error = spa_import(zc->zc_name, config, props, zc->zc_cookie);
1249
1250 if (zc->zc_nvlist_dst != 0) {
1251 int err;
1252
1253 if ((err = put_nvlist(zc, config)) != 0)
1254 error = err;
1255 }
1256
1257 if (error == 0)
1258 zvol_create_minors(zc->zc_name);
1259
1260 nvlist_free(config);
1261
1262 if (props)
1263 nvlist_free(props);
1264
1265 return (error);
1266 }
1267
1268 static int
1269 zfs_ioc_pool_export(zfs_cmd_t *zc)
1270 {
1271 int error;
1272 boolean_t force = (boolean_t)zc->zc_cookie;
1273 boolean_t hardforce = (boolean_t)zc->zc_guid;
1274
1275 zfs_log_history(zc);
1276 error = spa_export(zc->zc_name, NULL, force, hardforce);
1277 if (error == 0)
1278 zvol_remove_minors(zc->zc_name);
1279 return (error);
1280 }
1281
1282 static int
1283 zfs_ioc_pool_configs(zfs_cmd_t *zc)
1284 {
1285 nvlist_t *configs;
1286 int error;
1287
1288 if ((configs = spa_all_configs(&zc->zc_cookie)) == NULL)
1289 return (EEXIST);
1290
1291 error = put_nvlist(zc, configs);
1292
1293 nvlist_free(configs);
1294
1295 return (error);
1296 }
1297
1298 static int
1299 zfs_ioc_pool_stats(zfs_cmd_t *zc)
1300 {
1301 nvlist_t *config;
1302 int error;
1303 int ret = 0;
1304
1305 error = spa_get_stats(zc->zc_name, &config, zc->zc_value,
1306 sizeof (zc->zc_value));
1307
1308 if (config != NULL) {
1309 ret = put_nvlist(zc, config);
1310 nvlist_free(config);
1311
1312 /*
1313 * The config may be present even if 'error' is non-zero.
1314 * In this case we return success, and preserve the real errno
1315 * in 'zc_cookie'.
1316 */
1317 zc->zc_cookie = error;
1318 } else {
1319 ret = error;
1320 }
1321
1322 return (ret);
1323 }
1324
1325 /*
1326 * Try to import the given pool, returning pool stats as appropriate so that
1327 * user land knows which devices are available and overall pool health.
1328 */
1329 static int
1330 zfs_ioc_pool_tryimport(zfs_cmd_t *zc)
1331 {
1332 nvlist_t *tryconfig, *config;
1333 int error;
1334
1335 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1336 zc->zc_iflags, &tryconfig)) != 0)
1337 return (error);
1338
1339 config = spa_tryimport(tryconfig);
1340
1341 nvlist_free(tryconfig);
1342
1343 if (config == NULL)
1344 return (EINVAL);
1345
1346 error = put_nvlist(zc, config);
1347 nvlist_free(config);
1348
1349 return (error);
1350 }
1351
1352 /*
1353 * inputs:
1354 * zc_name name of the pool
1355 * zc_cookie scan func (pool_scan_func_t)
1356 */
1357 static int
1358 zfs_ioc_pool_scan(zfs_cmd_t *zc)
1359 {
1360 spa_t *spa;
1361 int error;
1362
1363 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1364 return (error);
1365
1366 if (zc->zc_cookie == POOL_SCAN_NONE)
1367 error = spa_scan_stop(spa);
1368 else
1369 error = spa_scan(spa, zc->zc_cookie);
1370
1371 spa_close(spa, FTAG);
1372
1373 return (error);
1374 }
1375
1376 static int
1377 zfs_ioc_pool_freeze(zfs_cmd_t *zc)
1378 {
1379 spa_t *spa;
1380 int error;
1381
1382 error = spa_open(zc->zc_name, &spa, FTAG);
1383 if (error == 0) {
1384 spa_freeze(spa);
1385 spa_close(spa, FTAG);
1386 }
1387 return (error);
1388 }
1389
1390 static int
1391 zfs_ioc_pool_upgrade(zfs_cmd_t *zc)
1392 {
1393 spa_t *spa;
1394 int error;
1395
1396 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1397 return (error);
1398
1399 if (zc->zc_cookie < spa_version(spa) || zc->zc_cookie > SPA_VERSION) {
1400 spa_close(spa, FTAG);
1401 return (EINVAL);
1402 }
1403
1404 spa_upgrade(spa, zc->zc_cookie);
1405 spa_close(spa, FTAG);
1406
1407 return (error);
1408 }
1409
1410 static int
1411 zfs_ioc_pool_get_history(zfs_cmd_t *zc)
1412 {
1413 spa_t *spa;
1414 char *hist_buf;
1415 uint64_t size;
1416 int error;
1417
1418 if ((size = zc->zc_history_len) == 0)
1419 return (EINVAL);
1420
1421 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1422 return (error);
1423
1424 if (spa_version(spa) < SPA_VERSION_ZPOOL_HISTORY) {
1425 spa_close(spa, FTAG);
1426 return (ENOTSUP);
1427 }
1428
1429 hist_buf = vmem_alloc(size, KM_SLEEP);
1430 if ((error = spa_history_get(spa, &zc->zc_history_offset,
1431 &zc->zc_history_len, hist_buf)) == 0) {
1432 error = ddi_copyout(hist_buf,
1433 (void *)(uintptr_t)zc->zc_history,
1434 zc->zc_history_len, zc->zc_iflags);
1435 }
1436
1437 spa_close(spa, FTAG);
1438 vmem_free(hist_buf, size);
1439 return (error);
1440 }
1441
1442 static int
1443 zfs_ioc_pool_reguid(zfs_cmd_t *zc)
1444 {
1445 spa_t *spa;
1446 int error;
1447
1448 error = spa_open(zc->zc_name, &spa, FTAG);
1449 if (error == 0) {
1450 error = spa_change_guid(spa);
1451 spa_close(spa, FTAG);
1452 }
1453 return (error);
1454 }
1455
1456 static int
1457 zfs_ioc_dsobj_to_dsname(zfs_cmd_t *zc)
1458 {
1459 int error;
1460
1461 if ((error = dsl_dsobj_to_dsname(zc->zc_name,zc->zc_obj,zc->zc_value)))
1462 return (error);
1463
1464 return (0);
1465 }
1466
1467 /*
1468 * inputs:
1469 * zc_name name of filesystem
1470 * zc_obj object to find
1471 *
1472 * outputs:
1473 * zc_value name of object
1474 */
1475 static int
1476 zfs_ioc_obj_to_path(zfs_cmd_t *zc)
1477 {
1478 objset_t *os;
1479 int error;
1480
1481 /* XXX reading from objset not owned */
1482 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1483 return (error);
1484 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1485 dmu_objset_rele(os, FTAG);
1486 return (EINVAL);
1487 }
1488 error = zfs_obj_to_path(os, zc->zc_obj, zc->zc_value,
1489 sizeof (zc->zc_value));
1490 dmu_objset_rele(os, FTAG);
1491
1492 return (error);
1493 }
1494
1495 /*
1496 * inputs:
1497 * zc_name name of filesystem
1498 * zc_obj object to find
1499 *
1500 * outputs:
1501 * zc_stat stats on object
1502 * zc_value path to object
1503 */
1504 static int
1505 zfs_ioc_obj_to_stats(zfs_cmd_t *zc)
1506 {
1507 objset_t *os;
1508 int error;
1509
1510 /* XXX reading from objset not owned */
1511 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)) != 0)
1512 return (error);
1513 if (dmu_objset_type(os) != DMU_OST_ZFS) {
1514 dmu_objset_rele(os, FTAG);
1515 return (EINVAL);
1516 }
1517 error = zfs_obj_to_stats(os, zc->zc_obj, &zc->zc_stat, zc->zc_value,
1518 sizeof (zc->zc_value));
1519 dmu_objset_rele(os, FTAG);
1520
1521 return (error);
1522 }
1523
1524 static int
1525 zfs_ioc_vdev_add(zfs_cmd_t *zc)
1526 {
1527 spa_t *spa;
1528 int error;
1529 nvlist_t *config, **l2cache, **spares;
1530 uint_t nl2cache = 0, nspares = 0;
1531
1532 error = spa_open(zc->zc_name, &spa, FTAG);
1533 if (error != 0)
1534 return (error);
1535
1536 error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1537 zc->zc_iflags, &config);
1538 (void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_L2CACHE,
1539 &l2cache, &nl2cache);
1540
1541 (void) nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_SPARES,
1542 &spares, &nspares);
1543
1544 /*
1545 * A root pool with concatenated devices is not supported.
1546 * Thus, can not add a device to a root pool.
1547 *
1548 * Intent log device can not be added to a rootpool because
1549 * during mountroot, zil is replayed, a seperated log device
1550 * can not be accessed during the mountroot time.
1551 *
1552 * l2cache and spare devices are ok to be added to a rootpool.
1553 */
1554 if (spa_bootfs(spa) != 0 && nl2cache == 0 && nspares == 0) {
1555 nvlist_free(config);
1556 spa_close(spa, FTAG);
1557 return (EDOM);
1558 }
1559
1560 if (error == 0) {
1561 error = spa_vdev_add(spa, config);
1562 nvlist_free(config);
1563 }
1564 spa_close(spa, FTAG);
1565 return (error);
1566 }
1567
1568 /*
1569 * inputs:
1570 * zc_name name of the pool
1571 * zc_nvlist_conf nvlist of devices to remove
1572 * zc_cookie to stop the remove?
1573 */
1574 static int
1575 zfs_ioc_vdev_remove(zfs_cmd_t *zc)
1576 {
1577 spa_t *spa;
1578 int error;
1579
1580 error = spa_open(zc->zc_name, &spa, FTAG);
1581 if (error != 0)
1582 return (error);
1583 error = spa_vdev_remove(spa, zc->zc_guid, B_FALSE);
1584 spa_close(spa, FTAG);
1585 return (error);
1586 }
1587
1588 static int
1589 zfs_ioc_vdev_set_state(zfs_cmd_t *zc)
1590 {
1591 spa_t *spa;
1592 int error;
1593 vdev_state_t newstate = VDEV_STATE_UNKNOWN;
1594
1595 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1596 return (error);
1597 switch (zc->zc_cookie) {
1598 case VDEV_STATE_ONLINE:
1599 error = vdev_online(spa, zc->zc_guid, zc->zc_obj, &newstate);
1600 break;
1601
1602 case VDEV_STATE_OFFLINE:
1603 error = vdev_offline(spa, zc->zc_guid, zc->zc_obj);
1604 break;
1605
1606 case VDEV_STATE_FAULTED:
1607 if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1608 zc->zc_obj != VDEV_AUX_EXTERNAL)
1609 zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1610
1611 error = vdev_fault(spa, zc->zc_guid, zc->zc_obj);
1612 break;
1613
1614 case VDEV_STATE_DEGRADED:
1615 if (zc->zc_obj != VDEV_AUX_ERR_EXCEEDED &&
1616 zc->zc_obj != VDEV_AUX_EXTERNAL)
1617 zc->zc_obj = VDEV_AUX_ERR_EXCEEDED;
1618
1619 error = vdev_degrade(spa, zc->zc_guid, zc->zc_obj);
1620 break;
1621
1622 default:
1623 error = EINVAL;
1624 }
1625 zc->zc_cookie = newstate;
1626 spa_close(spa, FTAG);
1627 return (error);
1628 }
1629
1630 static int
1631 zfs_ioc_vdev_attach(zfs_cmd_t *zc)
1632 {
1633 spa_t *spa;
1634 int replacing = zc->zc_cookie;
1635 nvlist_t *config;
1636 int error;
1637
1638 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1639 return (error);
1640
1641 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1642 zc->zc_iflags, &config)) == 0) {
1643 error = spa_vdev_attach(spa, zc->zc_guid, config, replacing);
1644 nvlist_free(config);
1645 }
1646
1647 spa_close(spa, FTAG);
1648 return (error);
1649 }
1650
1651 static int
1652 zfs_ioc_vdev_detach(zfs_cmd_t *zc)
1653 {
1654 spa_t *spa;
1655 int error;
1656
1657 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1658 return (error);
1659
1660 error = spa_vdev_detach(spa, zc->zc_guid, 0, B_FALSE);
1661
1662 spa_close(spa, FTAG);
1663 return (error);
1664 }
1665
1666 static int
1667 zfs_ioc_vdev_split(zfs_cmd_t *zc)
1668 {
1669 spa_t *spa;
1670 nvlist_t *config, *props = NULL;
1671 int error;
1672 boolean_t exp = !!(zc->zc_cookie & ZPOOL_EXPORT_AFTER_SPLIT);
1673
1674 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
1675 return (error);
1676
1677 if ((error = get_nvlist(zc->zc_nvlist_conf, zc->zc_nvlist_conf_size,
1678 zc->zc_iflags, &config))) {
1679 spa_close(spa, FTAG);
1680 return (error);
1681 }
1682
1683 if (zc->zc_nvlist_src_size != 0 && (error =
1684 get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
1685 zc->zc_iflags, &props))) {
1686 spa_close(spa, FTAG);
1687 nvlist_free(config);
1688 return (error);
1689 }
1690
1691 error = spa_vdev_split_mirror(spa, zc->zc_string, config, props, exp);
1692
1693 spa_close(spa, FTAG);
1694
1695 nvlist_free(config);
1696 nvlist_free(props);
1697
1698 return (error);
1699 }
1700
1701 static int
1702 zfs_ioc_vdev_setpath(zfs_cmd_t *zc)
1703 {
1704 spa_t *spa;
1705 char *path = zc->zc_value;
1706 uint64_t guid = zc->zc_guid;
1707 int error;
1708
1709 error = spa_open(zc->zc_name, &spa, FTAG);
1710 if (error != 0)
1711 return (error);
1712
1713 error = spa_vdev_setpath(spa, guid, path);
1714 spa_close(spa, FTAG);
1715 return (error);
1716 }
1717
1718 static int
1719 zfs_ioc_vdev_setfru(zfs_cmd_t *zc)
1720 {
1721 spa_t *spa;
1722 char *fru = zc->zc_value;
1723 uint64_t guid = zc->zc_guid;
1724 int error;
1725
1726 error = spa_open(zc->zc_name, &spa, FTAG);
1727 if (error != 0)
1728 return (error);
1729
1730 error = spa_vdev_setfru(spa, guid, fru);
1731 spa_close(spa, FTAG);
1732 return (error);
1733 }
1734
1735 static int
1736 zfs_ioc_objset_stats_impl(zfs_cmd_t *zc, objset_t *os)
1737 {
1738 int error = 0;
1739 nvlist_t *nv;
1740
1741 dmu_objset_fast_stat(os, &zc->zc_objset_stats);
1742
1743 if (zc->zc_nvlist_dst != 0 &&
1744 (error = dsl_prop_get_all(os, &nv)) == 0) {
1745 dmu_objset_stats(os, nv);
1746 /*
1747 * NB: zvol_get_stats() will read the objset contents,
1748 * which we aren't supposed to do with a
1749 * DS_MODE_USER hold, because it could be
1750 * inconsistent. So this is a bit of a workaround...
1751 * XXX reading with out owning
1752 */
1753 if (!zc->zc_objset_stats.dds_inconsistent &&
1754 dmu_objset_type(os) == DMU_OST_ZVOL) {
1755 error = zvol_get_stats(os, nv);
1756 if (error == EIO)
1757 return (error);
1758 VERIFY3S(error, ==, 0);
1759 }
1760 if (error == 0)
1761 error = put_nvlist(zc, nv);
1762 nvlist_free(nv);
1763 }
1764
1765 return (error);
1766 }
1767
1768 /*
1769 * inputs:
1770 * zc_name name of filesystem
1771 * zc_nvlist_dst_size size of buffer for property nvlist
1772 *
1773 * outputs:
1774 * zc_objset_stats stats
1775 * zc_nvlist_dst property nvlist
1776 * zc_nvlist_dst_size size of property nvlist
1777 */
1778 static int
1779 zfs_ioc_objset_stats(zfs_cmd_t *zc)
1780 {
1781 objset_t *os = NULL;
1782 int error;
1783
1784 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)))
1785 return (error);
1786
1787 error = zfs_ioc_objset_stats_impl(zc, os);
1788
1789 dmu_objset_rele(os, FTAG);
1790
1791 return (error);
1792 }
1793
1794 /*
1795 * inputs:
1796 * zc_name name of filesystem
1797 * zc_nvlist_dst_size size of buffer for property nvlist
1798 *
1799 * outputs:
1800 * zc_nvlist_dst received property nvlist
1801 * zc_nvlist_dst_size size of received property nvlist
1802 *
1803 * Gets received properties (distinct from local properties on or after
1804 * SPA_VERSION_RECVD_PROPS) for callers who want to differentiate received from
1805 * local property values.
1806 */
1807 static int
1808 zfs_ioc_objset_recvd_props(zfs_cmd_t *zc)
1809 {
1810 objset_t *os = NULL;
1811 int error;
1812 nvlist_t *nv;
1813
1814 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os)))
1815 return (error);
1816
1817 /*
1818 * Without this check, we would return local property values if the
1819 * caller has not already received properties on or after
1820 * SPA_VERSION_RECVD_PROPS.
1821 */
1822 if (!dsl_prop_get_hasrecvd(os)) {
1823 dmu_objset_rele(os, FTAG);
1824 return (ENOTSUP);
1825 }
1826
1827 if (zc->zc_nvlist_dst != 0 &&
1828 (error = dsl_prop_get_received(os, &nv)) == 0) {
1829 error = put_nvlist(zc, nv);
1830 nvlist_free(nv);
1831 }
1832
1833 dmu_objset_rele(os, FTAG);
1834 return (error);
1835 }
1836
1837 static int
1838 nvl_add_zplprop(objset_t *os, nvlist_t *props, zfs_prop_t prop)
1839 {
1840 uint64_t value;
1841 int error;
1842
1843 /*
1844 * zfs_get_zplprop() will either find a value or give us
1845 * the default value (if there is one).
1846 */
1847 if ((error = zfs_get_zplprop(os, prop, &value)) != 0)
1848 return (error);
1849 VERIFY(nvlist_add_uint64(props, zfs_prop_to_name(prop), value) == 0);
1850 return (0);
1851 }
1852
1853 /*
1854 * inputs:
1855 * zc_name name of filesystem
1856 * zc_nvlist_dst_size size of buffer for zpl property nvlist
1857 *
1858 * outputs:
1859 * zc_nvlist_dst zpl property nvlist
1860 * zc_nvlist_dst_size size of zpl property nvlist
1861 */
1862 static int
1863 zfs_ioc_objset_zplprops(zfs_cmd_t *zc)
1864 {
1865 objset_t *os;
1866 int err;
1867
1868 /* XXX reading without owning */
1869 if ((err = dmu_objset_hold(zc->zc_name, FTAG, &os)))
1870 return (err);
1871
1872 dmu_objset_fast_stat(os, &zc->zc_objset_stats);
1873
1874 /*
1875 * NB: nvl_add_zplprop() will read the objset contents,
1876 * which we aren't supposed to do with a DS_MODE_USER
1877 * hold, because it could be inconsistent.
1878 */
1879 if (zc->zc_nvlist_dst != 0 &&
1880 !zc->zc_objset_stats.dds_inconsistent &&
1881 dmu_objset_type(os) == DMU_OST_ZFS) {
1882 nvlist_t *nv;
1883
1884 VERIFY(nvlist_alloc(&nv, NV_UNIQUE_NAME, KM_SLEEP) == 0);
1885 if ((err = nvl_add_zplprop(os, nv, ZFS_PROP_VERSION)) == 0 &&
1886 (err = nvl_add_zplprop(os, nv, ZFS_PROP_NORMALIZE)) == 0 &&
1887 (err = nvl_add_zplprop(os, nv, ZFS_PROP_UTF8ONLY)) == 0 &&
1888 (err = nvl_add_zplprop(os, nv, ZFS_PROP_CASE)) == 0)
1889 err = put_nvlist(zc, nv);
1890 nvlist_free(nv);
1891 } else {
1892 err = ENOENT;
1893 }
1894 dmu_objset_rele(os, FTAG);
1895 return (err);
1896 }
1897
1898 static boolean_t
1899 dataset_name_hidden(const char *name)
1900 {
1901 /*
1902 * Skip over datasets that are not visible in this zone,
1903 * internal datasets (which have a $ in their name), and
1904 * temporary datasets (which have a % in their name).
1905 */
1906 if (strchr(name, '$') != NULL)
1907 return (B_TRUE);
1908 if (strchr(name, '%') != NULL)
1909 return (B_TRUE);
1910 if (!INGLOBALZONE(curproc) && !zone_dataset_visible(name, NULL))
1911 return (B_TRUE);
1912 return (B_FALSE);
1913 }
1914
1915 /*
1916 * inputs:
1917 * zc_name name of filesystem
1918 * zc_cookie zap cursor
1919 * zc_nvlist_dst_size size of buffer for property nvlist
1920 *
1921 * outputs:
1922 * zc_name name of next filesystem
1923 * zc_cookie zap cursor
1924 * zc_objset_stats stats
1925 * zc_nvlist_dst property nvlist
1926 * zc_nvlist_dst_size size of property nvlist
1927 */
1928 static int
1929 zfs_ioc_dataset_list_next(zfs_cmd_t *zc)
1930 {
1931 objset_t *os;
1932 int error;
1933 char *p;
1934 size_t orig_len = strlen(zc->zc_name);
1935
1936 top:
1937 if ((error = dmu_objset_hold(zc->zc_name, FTAG, &os))) {
1938 if (error == ENOENT)
1939 error = ESRCH;
1940 return (error);
1941 }
1942
1943 p = strrchr(zc->zc_name, '/');
1944 if (p == NULL || p[1] != '\0')
1945 (void) strlcat(zc->zc_name, "/", sizeof (zc->zc_name));
1946 p = zc->zc_name + strlen(zc->zc_name);
1947
1948 /*
1949 * Pre-fetch the datasets. dmu_objset_prefetch() always returns 0
1950 * but is not declared void because its called by dmu_objset_find().
1951 */
1952 if (zc->zc_cookie == 0) {
1953 uint64_t cookie = 0;
1954 int len = sizeof (zc->zc_name) - (p - zc->zc_name);
1955
1956 while (dmu_dir_list_next(os, len, p, NULL, &cookie) == 0) {
1957 if (!dataset_name_hidden(zc->zc_name))
1958 (void) dmu_objset_prefetch(zc->zc_name, NULL);
1959 }
1960 }
1961
1962 do {
1963 error = dmu_dir_list_next(os,
1964 sizeof (zc->zc_name) - (p - zc->zc_name), p,
1965 NULL, &zc->zc_cookie);
1966 if (error == ENOENT)
1967 error = ESRCH;
1968 } while (error == 0 && dataset_name_hidden(zc->zc_name));
1969 dmu_objset_rele(os, FTAG);
1970
1971 /*
1972 * If it's an internal dataset (ie. with a '$' in its name),
1973 * don't try to get stats for it, otherwise we'll return ENOENT.
1974 */
1975 if (error == 0 && strchr(zc->zc_name, '$') == NULL) {
1976 error = zfs_ioc_objset_stats(zc); /* fill in the stats */
1977 if (error == ENOENT) {
1978 /* We lost a race with destroy, get the next one. */
1979 zc->zc_name[orig_len] = '\0';
1980 goto top;
1981 }
1982 }
1983 return (error);
1984 }
1985
1986 /*
1987 * inputs:
1988 * zc_name name of filesystem
1989 * zc_cookie zap cursor
1990 * zc_nvlist_dst_size size of buffer for property nvlist
1991 *
1992 * outputs:
1993 * zc_name name of next snapshot
1994 * zc_objset_stats stats
1995 * zc_nvlist_dst property nvlist
1996 * zc_nvlist_dst_size size of property nvlist
1997 */
1998 static int
1999 zfs_ioc_snapshot_list_next(zfs_cmd_t *zc)
2000 {
2001 objset_t *os;
2002 int error;
2003
2004 top:
2005 if (zc->zc_cookie == 0 && !zc->zc_simple)
2006 (void) dmu_objset_find(zc->zc_name, dmu_objset_prefetch,
2007 NULL, DS_FIND_SNAPSHOTS);
2008
2009 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
2010 if (error)
2011 return (error == ENOENT ? ESRCH : error);
2012
2013 /*
2014 * A dataset name of maximum length cannot have any snapshots,
2015 * so exit immediately.
2016 */
2017 if (strlcat(zc->zc_name, "@", sizeof (zc->zc_name)) >= MAXNAMELEN) {
2018 dmu_objset_rele(os, FTAG);
2019 return (ESRCH);
2020 }
2021
2022 error = dmu_snapshot_list_next(os,
2023 sizeof (zc->zc_name) - strlen(zc->zc_name),
2024 zc->zc_name + strlen(zc->zc_name), &zc->zc_obj, &zc->zc_cookie,
2025 NULL);
2026
2027 if (error == 0 && !zc->zc_simple) {
2028 dsl_dataset_t *ds;
2029 dsl_pool_t *dp = os->os_dsl_dataset->ds_dir->dd_pool;
2030
2031 /*
2032 * Since we probably don't have a hold on this snapshot,
2033 * it's possible that the objsetid could have been destroyed
2034 * and reused for a new objset. It's OK if this happens during
2035 * a zfs send operation, since the new createtxg will be
2036 * beyond the range we're interested in.
2037 */
2038 rw_enter(&dp->dp_config_rwlock, RW_READER);
2039 error = dsl_dataset_hold_obj(dp, zc->zc_obj, FTAG, &ds);
2040 rw_exit(&dp->dp_config_rwlock);
2041 if (error) {
2042 if (error == ENOENT) {
2043 /* Racing with destroy, get the next one. */
2044 *strchr(zc->zc_name, '@') = '\0';
2045 dmu_objset_rele(os, FTAG);
2046 goto top;
2047 }
2048 } else {
2049 objset_t *ossnap;
2050
2051 error = dmu_objset_from_ds(ds, &ossnap);
2052 if (error == 0)
2053 error = zfs_ioc_objset_stats_impl(zc, ossnap);
2054 dsl_dataset_rele(ds, FTAG);
2055 }
2056 } else if (error == ENOENT) {
2057 error = ESRCH;
2058 }
2059
2060 dmu_objset_rele(os, FTAG);
2061 /* if we failed, undo the @ that we tacked on to zc_name */
2062 if (error)
2063 *strchr(zc->zc_name, '@') = '\0';
2064 return (error);
2065 }
2066
2067 static int
2068 zfs_prop_set_userquota(const char *dsname, nvpair_t *pair)
2069 {
2070 const char *propname = nvpair_name(pair);
2071 uint64_t *valary;
2072 unsigned int vallen;
2073 const char *domain;
2074 char *dash;
2075 zfs_userquota_prop_t type;
2076 uint64_t rid;
2077 uint64_t quota;
2078 zfs_sb_t *zsb;
2079 int err;
2080
2081 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2082 nvlist_t *attrs;
2083 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2084 if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2085 &pair) != 0)
2086 return (EINVAL);
2087 }
2088
2089 /*
2090 * A correctly constructed propname is encoded as
2091 * userquota@<rid>-<domain>.
2092 */
2093 if ((dash = strchr(propname, '-')) == NULL ||
2094 nvpair_value_uint64_array(pair, &valary, &vallen) != 0 ||
2095 vallen != 3)
2096 return (EINVAL);
2097
2098 domain = dash + 1;
2099 type = valary[0];
2100 rid = valary[1];
2101 quota = valary[2];
2102
2103 err = zfs_sb_hold(dsname, FTAG, &zsb, B_FALSE);
2104 if (err == 0) {
2105 err = zfs_set_userquota(zsb, type, domain, rid, quota);
2106 zfs_sb_rele(zsb, FTAG);
2107 }
2108
2109 return (err);
2110 }
2111
2112 /*
2113 * If the named property is one that has a special function to set its value,
2114 * return 0 on success and a positive error code on failure; otherwise if it is
2115 * not one of the special properties handled by this function, return -1.
2116 *
2117 * XXX: It would be better for callers of the property interface if we handled
2118 * these special cases in dsl_prop.c (in the dsl layer).
2119 */
2120 static int
2121 zfs_prop_set_special(const char *dsname, zprop_source_t source,
2122 nvpair_t *pair)
2123 {
2124 const char *propname = nvpair_name(pair);
2125 zfs_prop_t prop = zfs_name_to_prop(propname);
2126 uint64_t intval;
2127 int err;
2128
2129 if (prop == ZPROP_INVAL) {
2130 if (zfs_prop_userquota(propname))
2131 return (zfs_prop_set_userquota(dsname, pair));
2132 return (-1);
2133 }
2134
2135 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2136 nvlist_t *attrs;
2137 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2138 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2139 &pair) == 0);
2140 }
2141
2142 if (zfs_prop_get_type(prop) == PROP_TYPE_STRING)
2143 return (-1);
2144
2145 VERIFY(0 == nvpair_value_uint64(pair, &intval));
2146
2147 switch (prop) {
2148 case ZFS_PROP_QUOTA:
2149 err = dsl_dir_set_quota(dsname, source, intval);
2150 break;
2151 case ZFS_PROP_REFQUOTA:
2152 err = dsl_dataset_set_quota(dsname, source, intval);
2153 break;
2154 case ZFS_PROP_RESERVATION:
2155 err = dsl_dir_set_reservation(dsname, source, intval);
2156 break;
2157 case ZFS_PROP_REFRESERVATION:
2158 err = dsl_dataset_set_reservation(dsname, source, intval);
2159 break;
2160 case ZFS_PROP_VOLSIZE:
2161 err = zvol_set_volsize(dsname, intval);
2162 break;
2163 case ZFS_PROP_VERSION:
2164 {
2165 zfs_sb_t *zsb;
2166
2167 if ((err = zfs_sb_hold(dsname, FTAG, &zsb, B_TRUE)) != 0)
2168 break;
2169
2170 err = zfs_set_version(zsb, intval);
2171 zfs_sb_rele(zsb, FTAG);
2172
2173 if (err == 0 && intval >= ZPL_VERSION_USERSPACE) {
2174 zfs_cmd_t *zc;
2175
2176 zc = kmem_zalloc(sizeof (zfs_cmd_t),
2177 KM_SLEEP | KM_NODEBUG);
2178 (void) strcpy(zc->zc_name, dsname);
2179 (void) zfs_ioc_userspace_upgrade(zc);
2180 kmem_free(zc, sizeof (zfs_cmd_t));
2181 }
2182 break;
2183 }
2184
2185 default:
2186 err = -1;
2187 }
2188
2189 return (err);
2190 }
2191
2192 /*
2193 * This function is best effort. If it fails to set any of the given properties,
2194 * it continues to set as many as it can and returns the first error
2195 * encountered. If the caller provides a non-NULL errlist, it also gives the
2196 * complete list of names of all the properties it failed to set along with the
2197 * corresponding error numbers. The caller is responsible for freeing the
2198 * returned errlist.
2199 *
2200 * If every property is set successfully, zero is returned and the list pointed
2201 * at by errlist is NULL.
2202 */
2203 int
2204 zfs_set_prop_nvlist(const char *dsname, zprop_source_t source, nvlist_t *nvl,
2205 nvlist_t **errlist)
2206 {
2207 nvpair_t *pair;
2208 nvpair_t *propval;
2209 int rv = 0;
2210 uint64_t intval;
2211 char *strval;
2212 nvlist_t *genericnvl;
2213 nvlist_t *errors;
2214 nvlist_t *retrynvl;
2215
2216 VERIFY(nvlist_alloc(&genericnvl, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2217 VERIFY(nvlist_alloc(&errors, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2218 VERIFY(nvlist_alloc(&retrynvl, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2219
2220 retry:
2221 pair = NULL;
2222 while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2223 const char *propname = nvpair_name(pair);
2224 zfs_prop_t prop = zfs_name_to_prop(propname);
2225 int err = 0;
2226
2227 /* decode the property value */
2228 propval = pair;
2229 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2230 nvlist_t *attrs;
2231 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2232 if (nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2233 &propval) != 0)
2234 err = EINVAL;
2235 }
2236
2237 /* Validate value type */
2238 if (err == 0 && prop == ZPROP_INVAL) {
2239 if (zfs_prop_user(propname)) {
2240 if (nvpair_type(propval) != DATA_TYPE_STRING)
2241 err = EINVAL;
2242 } else if (zfs_prop_userquota(propname)) {
2243 if (nvpair_type(propval) !=
2244 DATA_TYPE_UINT64_ARRAY)
2245 err = EINVAL;
2246 } else {
2247 err = EINVAL;
2248 }
2249 } else if (err == 0) {
2250 if (nvpair_type(propval) == DATA_TYPE_STRING) {
2251 if (zfs_prop_get_type(prop) != PROP_TYPE_STRING)
2252 err = EINVAL;
2253 } else if (nvpair_type(propval) == DATA_TYPE_UINT64) {
2254 const char *unused;
2255
2256 VERIFY(nvpair_value_uint64(propval,
2257 &intval) == 0);
2258
2259 switch (zfs_prop_get_type(prop)) {
2260 case PROP_TYPE_NUMBER:
2261 break;
2262 case PROP_TYPE_STRING:
2263 err = EINVAL;
2264 break;
2265 case PROP_TYPE_INDEX:
2266 if (zfs_prop_index_to_string(prop,
2267 intval, &unused) != 0)
2268 err = EINVAL;
2269 break;
2270 default:
2271 cmn_err(CE_PANIC,
2272 "unknown property type");
2273 }
2274 } else {
2275 err = EINVAL;
2276 }
2277 }
2278
2279 /* Validate permissions */
2280 if (err == 0)
2281 err = zfs_check_settable(dsname, pair, CRED());
2282
2283 if (err == 0) {
2284 err = zfs_prop_set_special(dsname, source, pair);
2285 if (err == -1) {
2286 /*
2287 * For better performance we build up a list of
2288 * properties to set in a single transaction.
2289 */
2290 err = nvlist_add_nvpair(genericnvl, pair);
2291 } else if (err != 0 && nvl != retrynvl) {
2292 /*
2293 * This may be a spurious error caused by
2294 * receiving quota and reservation out of order.
2295 * Try again in a second pass.
2296 */
2297 err = nvlist_add_nvpair(retrynvl, pair);
2298 }
2299 }
2300
2301 if (err != 0)
2302 VERIFY(nvlist_add_int32(errors, propname, err) == 0);
2303 }
2304
2305 if (nvl != retrynvl && !nvlist_empty(retrynvl)) {
2306 nvl = retrynvl;
2307 goto retry;
2308 }
2309
2310 if (!nvlist_empty(genericnvl) &&
2311 dsl_props_set(dsname, source, genericnvl) != 0) {
2312 /*
2313 * If this fails, we still want to set as many properties as we
2314 * can, so try setting them individually.
2315 */
2316 pair = NULL;
2317 while ((pair = nvlist_next_nvpair(genericnvl, pair)) != NULL) {
2318 const char *propname = nvpair_name(pair);
2319 int err = 0;
2320
2321 propval = pair;
2322 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
2323 nvlist_t *attrs;
2324 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
2325 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
2326 &propval) == 0);
2327 }
2328
2329 if (nvpair_type(propval) == DATA_TYPE_STRING) {
2330 VERIFY(nvpair_value_string(propval,
2331 &strval) == 0);
2332 err = dsl_prop_set(dsname, propname, source, 1,
2333 strlen(strval) + 1, strval);
2334 } else {
2335 VERIFY(nvpair_value_uint64(propval,
2336 &intval) == 0);
2337 err = dsl_prop_set(dsname, propname, source, 8,
2338 1, &intval);
2339 }
2340
2341 if (err != 0) {
2342 VERIFY(nvlist_add_int32(errors, propname,
2343 err) == 0);
2344 }
2345 }
2346 }
2347 nvlist_free(genericnvl);
2348 nvlist_free(retrynvl);
2349
2350 if ((pair = nvlist_next_nvpair(errors, NULL)) == NULL) {
2351 nvlist_free(errors);
2352 errors = NULL;
2353 } else {
2354 VERIFY(nvpair_value_int32(pair, &rv) == 0);
2355 }
2356
2357 if (errlist == NULL)
2358 nvlist_free(errors);
2359 else
2360 *errlist = errors;
2361
2362 return (rv);
2363 }
2364
2365 /*
2366 * Check that all the properties are valid user properties.
2367 */
2368 static int
2369 zfs_check_userprops(char *fsname, nvlist_t *nvl)
2370 {
2371 nvpair_t *pair = NULL;
2372 int error = 0;
2373
2374 while ((pair = nvlist_next_nvpair(nvl, pair)) != NULL) {
2375 const char *propname = nvpair_name(pair);
2376 char *valstr;
2377
2378 if (!zfs_prop_user(propname) ||
2379 nvpair_type(pair) != DATA_TYPE_STRING)
2380 return (EINVAL);
2381
2382 if ((error = zfs_secpolicy_write_perms(fsname,
2383 ZFS_DELEG_PERM_USERPROP, CRED())))
2384 return (error);
2385
2386 if (strlen(propname) >= ZAP_MAXNAMELEN)
2387 return (ENAMETOOLONG);
2388
2389 VERIFY(nvpair_value_string(pair, &valstr) == 0);
2390 if (strlen(valstr) >= ZAP_MAXVALUELEN)
2391 return (E2BIG);
2392 }
2393 return (0);
2394 }
2395
2396 static void
2397 props_skip(nvlist_t *props, nvlist_t *skipped, nvlist_t **newprops)
2398 {
2399 nvpair_t *pair;
2400
2401 VERIFY(nvlist_alloc(newprops, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2402
2403 pair = NULL;
2404 while ((pair = nvlist_next_nvpair(props, pair)) != NULL) {
2405 if (nvlist_exists(skipped, nvpair_name(pair)))
2406 continue;
2407
2408 VERIFY(nvlist_add_nvpair(*newprops, pair) == 0);
2409 }
2410 }
2411
2412 static int
2413 clear_received_props(objset_t *os, const char *fs, nvlist_t *props,
2414 nvlist_t *skipped)
2415 {
2416 int err = 0;
2417 nvlist_t *cleared_props = NULL;
2418 props_skip(props, skipped, &cleared_props);
2419 if (!nvlist_empty(cleared_props)) {
2420 /*
2421 * Acts on local properties until the dataset has received
2422 * properties at least once on or after SPA_VERSION_RECVD_PROPS.
2423 */
2424 zprop_source_t flags = (ZPROP_SRC_NONE |
2425 (dsl_prop_get_hasrecvd(os) ? ZPROP_SRC_RECEIVED : 0));
2426 err = zfs_set_prop_nvlist(fs, flags, cleared_props, NULL);
2427 }
2428 nvlist_free(cleared_props);
2429 return (err);
2430 }
2431
2432 /*
2433 * inputs:
2434 * zc_name name of filesystem
2435 * zc_value name of property to set
2436 * zc_nvlist_src{_size} nvlist of properties to apply
2437 * zc_cookie received properties flag
2438 *
2439 * outputs:
2440 * zc_nvlist_dst{_size} error for each unapplied received property
2441 */
2442 static int
2443 zfs_ioc_set_prop(zfs_cmd_t *zc)
2444 {
2445 nvlist_t *nvl;
2446 boolean_t received = zc->zc_cookie;
2447 zprop_source_t source = (received ? ZPROP_SRC_RECEIVED :
2448 ZPROP_SRC_LOCAL);
2449 nvlist_t *errors = NULL;
2450 int error;
2451
2452 if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2453 zc->zc_iflags, &nvl)) != 0)
2454 return (error);
2455
2456 if (received) {
2457 nvlist_t *origprops;
2458 objset_t *os;
2459
2460 if (dmu_objset_hold(zc->zc_name, FTAG, &os) == 0) {
2461 if (dsl_prop_get_received(os, &origprops) == 0) {
2462 (void) clear_received_props(os,
2463 zc->zc_name, origprops, nvl);
2464 nvlist_free(origprops);
2465 }
2466
2467 dsl_prop_set_hasrecvd(os);
2468 dmu_objset_rele(os, FTAG);
2469 }
2470 }
2471
2472 error = zfs_set_prop_nvlist(zc->zc_name, source, nvl, &errors);
2473
2474 if (zc->zc_nvlist_dst != 0 && errors != NULL) {
2475 (void) put_nvlist(zc, errors);
2476 }
2477
2478 nvlist_free(errors);
2479 nvlist_free(nvl);
2480 return (error);
2481 }
2482
2483 /*
2484 * inputs:
2485 * zc_name name of filesystem
2486 * zc_value name of property to inherit
2487 * zc_cookie revert to received value if TRUE
2488 *
2489 * outputs: none
2490 */
2491 static int
2492 zfs_ioc_inherit_prop(zfs_cmd_t *zc)
2493 {
2494 const char *propname = zc->zc_value;
2495 zfs_prop_t prop = zfs_name_to_prop(propname);
2496 boolean_t received = zc->zc_cookie;
2497 zprop_source_t source = (received
2498 ? ZPROP_SRC_NONE /* revert to received value, if any */
2499 : ZPROP_SRC_INHERITED); /* explicitly inherit */
2500
2501 if (received) {
2502 nvlist_t *dummy;
2503 nvpair_t *pair;
2504 zprop_type_t type;
2505 int err;
2506
2507 /*
2508 * zfs_prop_set_special() expects properties in the form of an
2509 * nvpair with type info.
2510 */
2511 if (prop == ZPROP_INVAL) {
2512 if (!zfs_prop_user(propname))
2513 return (EINVAL);
2514
2515 type = PROP_TYPE_STRING;
2516 } else if (prop == ZFS_PROP_VOLSIZE ||
2517 prop == ZFS_PROP_VERSION) {
2518 return (EINVAL);
2519 } else {
2520 type = zfs_prop_get_type(prop);
2521 }
2522
2523 VERIFY(nvlist_alloc(&dummy, NV_UNIQUE_NAME, KM_SLEEP) == 0);
2524
2525 switch (type) {
2526 case PROP_TYPE_STRING:
2527 VERIFY(0 == nvlist_add_string(dummy, propname, ""));
2528 break;
2529 case PROP_TYPE_NUMBER:
2530 case PROP_TYPE_INDEX:
2531 VERIFY(0 == nvlist_add_uint64(dummy, propname, 0));
2532 break;
2533 default:
2534 nvlist_free(dummy);
2535 return (EINVAL);
2536 }
2537
2538 pair = nvlist_next_nvpair(dummy, NULL);
2539 err = zfs_prop_set_special(zc->zc_name, source, pair);
2540 nvlist_free(dummy);
2541 if (err != -1)
2542 return (err); /* special property already handled */
2543 } else {
2544 /*
2545 * Only check this in the non-received case. We want to allow
2546 * 'inherit -S' to revert non-inheritable properties like quota
2547 * and reservation to the received or default values even though
2548 * they are not considered inheritable.
2549 */
2550 if (prop != ZPROP_INVAL && !zfs_prop_inheritable(prop))
2551 return (EINVAL);
2552 }
2553
2554 /* the property name has been validated by zfs_secpolicy_inherit() */
2555 return (dsl_prop_set(zc->zc_name, zc->zc_value, source, 0, 0, NULL));
2556 }
2557
2558 static int
2559 zfs_ioc_pool_set_props(zfs_cmd_t *zc)
2560 {
2561 nvlist_t *props;
2562 spa_t *spa;
2563 int error;
2564 nvpair_t *pair;
2565
2566 if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2567 zc->zc_iflags, &props)))
2568 return (error);
2569
2570 /*
2571 * If the only property is the configfile, then just do a spa_lookup()
2572 * to handle the faulted case.
2573 */
2574 pair = nvlist_next_nvpair(props, NULL);
2575 if (pair != NULL && strcmp(nvpair_name(pair),
2576 zpool_prop_to_name(ZPOOL_PROP_CACHEFILE)) == 0 &&
2577 nvlist_next_nvpair(props, pair) == NULL) {
2578 mutex_enter(&spa_namespace_lock);
2579 if ((spa = spa_lookup(zc->zc_name)) != NULL) {
2580 spa_configfile_set(spa, props, B_FALSE);
2581 spa_config_sync(spa, B_FALSE, B_TRUE);
2582 }
2583 mutex_exit(&spa_namespace_lock);
2584 if (spa != NULL) {
2585 nvlist_free(props);
2586 return (0);
2587 }
2588 }
2589
2590 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2591 nvlist_free(props);
2592 return (error);
2593 }
2594
2595 error = spa_prop_set(spa, props);
2596
2597 nvlist_free(props);
2598 spa_close(spa, FTAG);
2599
2600 return (error);
2601 }
2602
2603 static int
2604 zfs_ioc_pool_get_props(zfs_cmd_t *zc)
2605 {
2606 spa_t *spa;
2607 int error;
2608 nvlist_t *nvp = NULL;
2609
2610 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0) {
2611 /*
2612 * If the pool is faulted, there may be properties we can still
2613 * get (such as altroot and cachefile), so attempt to get them
2614 * anyway.
2615 */
2616 mutex_enter(&spa_namespace_lock);
2617 if ((spa = spa_lookup(zc->zc_name)) != NULL)
2618 error = spa_prop_get(spa, &nvp);
2619 mutex_exit(&spa_namespace_lock);
2620 } else {
2621 error = spa_prop_get(spa, &nvp);
2622 spa_close(spa, FTAG);
2623 }
2624
2625 if (error == 0 && zc->zc_nvlist_dst != 0)
2626 error = put_nvlist(zc, nvp);
2627 else
2628 error = EFAULT;
2629
2630 nvlist_free(nvp);
2631 return (error);
2632 }
2633
2634 /*
2635 * inputs:
2636 * zc_name name of volume
2637 *
2638 * outputs: none
2639 */
2640 static int
2641 zfs_ioc_create_minor(zfs_cmd_t *zc)
2642 {
2643 return (zvol_create_minor(zc->zc_name));
2644 }
2645
2646 /*
2647 * inputs:
2648 * zc_name name of volume
2649 *
2650 * outputs: none
2651 */
2652 static int
2653 zfs_ioc_remove_minor(zfs_cmd_t *zc)
2654 {
2655 return (zvol_remove_minor(zc->zc_name));
2656 }
2657
2658 /*
2659 * inputs:
2660 * zc_name name of filesystem
2661 * zc_nvlist_src{_size} nvlist of delegated permissions
2662 * zc_perm_action allow/unallow flag
2663 *
2664 * outputs: none
2665 */
2666 static int
2667 zfs_ioc_set_fsacl(zfs_cmd_t *zc)
2668 {
2669 int error;
2670 nvlist_t *fsaclnv = NULL;
2671
2672 if ((error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2673 zc->zc_iflags, &fsaclnv)) != 0)
2674 return (error);
2675
2676 /*
2677 * Verify nvlist is constructed correctly
2678 */
2679 if ((error = zfs_deleg_verify_nvlist(fsaclnv)) != 0) {
2680 nvlist_free(fsaclnv);
2681 return (EINVAL);
2682 }
2683
2684 /*
2685 * If we don't have PRIV_SYS_MOUNT, then validate
2686 * that user is allowed to hand out each permission in
2687 * the nvlist(s)
2688 */
2689
2690 error = secpolicy_zfs(CRED());
2691 if (error) {
2692 if (zc->zc_perm_action == B_FALSE) {
2693 error = dsl_deleg_can_allow(zc->zc_name,
2694 fsaclnv, CRED());
2695 } else {
2696 error = dsl_deleg_can_unallow(zc->zc_name,
2697 fsaclnv, CRED());
2698 }
2699 }
2700
2701 if (error == 0)
2702 error = dsl_deleg_set(zc->zc_name, fsaclnv, zc->zc_perm_action);
2703
2704 nvlist_free(fsaclnv);
2705 return (error);
2706 }
2707
2708 /*
2709 * inputs:
2710 * zc_name name of filesystem
2711 *
2712 * outputs:
2713 * zc_nvlist_src{_size} nvlist of delegated permissions
2714 */
2715 static int
2716 zfs_ioc_get_fsacl(zfs_cmd_t *zc)
2717 {
2718 nvlist_t *nvp;
2719 int error;
2720
2721 if ((error = dsl_deleg_get(zc->zc_name, &nvp)) == 0) {
2722 error = put_nvlist(zc, nvp);
2723 nvlist_free(nvp);
2724 }
2725
2726 return (error);
2727 }
2728
2729 /* ARGSUSED */
2730 static void
2731 zfs_create_cb(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx)
2732 {
2733 zfs_creat_t *zct = arg;
2734
2735 zfs_create_fs(os, cr, zct->zct_zplprops, tx);
2736 }
2737
2738 #define ZFS_PROP_UNDEFINED ((uint64_t)-1)
2739
2740 /*
2741 * inputs:
2742 * createprops list of properties requested by creator
2743 * default_zplver zpl version to use if unspecified in createprops
2744 * fuids_ok fuids allowed in this version of the spa?
2745 * os parent objset pointer (NULL if root fs)
2746 *
2747 * outputs:
2748 * zplprops values for the zplprops we attach to the master node object
2749 * is_ci true if requested file system will be purely case-insensitive
2750 *
2751 * Determine the settings for utf8only, normalization and
2752 * casesensitivity. Specific values may have been requested by the
2753 * creator and/or we can inherit values from the parent dataset. If
2754 * the file system is of too early a vintage, a creator can not
2755 * request settings for these properties, even if the requested
2756 * setting is the default value. We don't actually want to create dsl
2757 * properties for these, so remove them from the source nvlist after
2758 * processing.
2759 */
2760 static int
2761 zfs_fill_zplprops_impl(objset_t *os, uint64_t zplver,
2762 boolean_t fuids_ok, boolean_t sa_ok, nvlist_t *createprops,
2763 nvlist_t *zplprops, boolean_t *is_ci)
2764 {
2765 uint64_t sense = ZFS_PROP_UNDEFINED;
2766 uint64_t norm = ZFS_PROP_UNDEFINED;
2767 uint64_t u8 = ZFS_PROP_UNDEFINED;
2768 int error;
2769
2770 ASSERT(zplprops != NULL);
2771
2772 /*
2773 * Pull out creator prop choices, if any.
2774 */
2775 if (createprops) {
2776 (void) nvlist_lookup_uint64(createprops,
2777 zfs_prop_to_name(ZFS_PROP_VERSION), &zplver);
2778 (void) nvlist_lookup_uint64(createprops,
2779 zfs_prop_to_name(ZFS_PROP_NORMALIZE), &norm);
2780 (void) nvlist_remove_all(createprops,
2781 zfs_prop_to_name(ZFS_PROP_NORMALIZE));
2782 (void) nvlist_lookup_uint64(createprops,
2783 zfs_prop_to_name(ZFS_PROP_UTF8ONLY), &u8);
2784 (void) nvlist_remove_all(createprops,
2785 zfs_prop_to_name(ZFS_PROP_UTF8ONLY));
2786 (void) nvlist_lookup_uint64(createprops,
2787 zfs_prop_to_name(ZFS_PROP_CASE), &sense);
2788 (void) nvlist_remove_all(createprops,
2789 zfs_prop_to_name(ZFS_PROP_CASE));
2790 }
2791
2792 /*
2793 * If the zpl version requested is whacky or the file system
2794 * or pool is version is too "young" to support normalization
2795 * and the creator tried to set a value for one of the props,
2796 * error out.
2797 */
2798 if ((zplver < ZPL_VERSION_INITIAL || zplver > ZPL_VERSION) ||
2799 (zplver >= ZPL_VERSION_FUID && !fuids_ok) ||
2800 (zplver >= ZPL_VERSION_SA && !sa_ok) ||
2801 (zplver < ZPL_VERSION_NORMALIZATION &&
2802 (norm != ZFS_PROP_UNDEFINED || u8 != ZFS_PROP_UNDEFINED ||
2803 sense != ZFS_PROP_UNDEFINED)))
2804 return (ENOTSUP);
2805
2806 /*
2807 * Put the version in the zplprops
2808 */
2809 VERIFY(nvlist_add_uint64(zplprops,
2810 zfs_prop_to_name(ZFS_PROP_VERSION), zplver) == 0);
2811
2812 if (norm == ZFS_PROP_UNDEFINED &&
2813 (error = zfs_get_zplprop(os, ZFS_PROP_NORMALIZE, &norm)) != 0)
2814 return (error);
2815 VERIFY(nvlist_add_uint64(zplprops,
2816 zfs_prop_to_name(ZFS_PROP_NORMALIZE), norm) == 0);
2817
2818 /*
2819 * If we're normalizing, names must always be valid UTF-8 strings.
2820 */
2821 if (norm)
2822 u8 = 1;
2823 if (u8 == ZFS_PROP_UNDEFINED &&
2824 (error = zfs_get_zplprop(os, ZFS_PROP_UTF8ONLY, &u8)) != 0)
2825 return (error);
2826 VERIFY(nvlist_add_uint64(zplprops,
2827 zfs_prop_to_name(ZFS_PROP_UTF8ONLY), u8) == 0);
2828
2829 if (sense == ZFS_PROP_UNDEFINED &&
2830 (error = zfs_get_zplprop(os, ZFS_PROP_CASE, &sense)) != 0)
2831 return (error);
2832 VERIFY(nvlist_add_uint64(zplprops,
2833 zfs_prop_to_name(ZFS_PROP_CASE), sense) == 0);
2834
2835 if (is_ci)
2836 *is_ci = (sense == ZFS_CASE_INSENSITIVE);
2837
2838 return (0);
2839 }
2840
2841 static int
2842 zfs_fill_zplprops(const char *dataset, nvlist_t *createprops,
2843 nvlist_t *zplprops, boolean_t *is_ci)
2844 {
2845 boolean_t fuids_ok, sa_ok;
2846 uint64_t zplver = ZPL_VERSION;
2847 objset_t *os = NULL;
2848 char parentname[MAXNAMELEN];
2849 char *cp;
2850 spa_t *spa;
2851 uint64_t spa_vers;
2852 int error;
2853
2854 (void) strlcpy(parentname, dataset, sizeof (parentname));
2855 cp = strrchr(parentname, '/');
2856 ASSERT(cp != NULL);
2857 cp[0] = '\0';
2858
2859 if ((error = spa_open(dataset, &spa, FTAG)) != 0)
2860 return (error);
2861
2862 spa_vers = spa_version(spa);
2863 spa_close(spa, FTAG);
2864
2865 zplver = zfs_zpl_version_map(spa_vers);
2866 fuids_ok = (zplver >= ZPL_VERSION_FUID);
2867 sa_ok = (zplver >= ZPL_VERSION_SA);
2868
2869 /*
2870 * Open parent object set so we can inherit zplprop values.
2871 */
2872 if ((error = dmu_objset_hold(parentname, FTAG, &os)) != 0)
2873 return (error);
2874
2875 error = zfs_fill_zplprops_impl(os, zplver, fuids_ok, sa_ok, createprops,
2876 zplprops, is_ci);
2877 dmu_objset_rele(os, FTAG);
2878 return (error);
2879 }
2880
2881 static int
2882 zfs_fill_zplprops_root(uint64_t spa_vers, nvlist_t *createprops,
2883 nvlist_t *zplprops, boolean_t *is_ci)
2884 {
2885 boolean_t fuids_ok;
2886 boolean_t sa_ok;
2887 uint64_t zplver = ZPL_VERSION;
2888 int error;
2889
2890 zplver = zfs_zpl_version_map(spa_vers);
2891 fuids_ok = (zplver >= ZPL_VERSION_FUID);
2892 sa_ok = (zplver >= ZPL_VERSION_SA);
2893
2894 error = zfs_fill_zplprops_impl(NULL, zplver, fuids_ok, sa_ok,
2895 createprops, zplprops, is_ci);
2896 return (error);
2897 }
2898
2899 /*
2900 * inputs:
2901 * zc_objset_type type of objset to create (fs vs zvol)
2902 * zc_name name of new objset
2903 * zc_value name of snapshot to clone from (may be empty)
2904 * zc_nvlist_src{_size} nvlist of properties to apply
2905 *
2906 * outputs: none
2907 */
2908 static int
2909 zfs_ioc_create(zfs_cmd_t *zc)
2910 {
2911 objset_t *clone;
2912 int error = 0;
2913 zfs_creat_t zct;
2914 nvlist_t *nvprops = NULL;
2915 void (*cbfunc)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx);
2916 dmu_objset_type_t type = zc->zc_objset_type;
2917
2918 switch (type) {
2919
2920 case DMU_OST_ZFS:
2921 cbfunc = zfs_create_cb;
2922 break;
2923
2924 case DMU_OST_ZVOL:
2925 cbfunc = zvol_create_cb;
2926 break;
2927
2928 default:
2929 cbfunc = NULL;
2930 break;
2931 }
2932 if (strchr(zc->zc_name, '@') ||
2933 strchr(zc->zc_name, '%'))
2934 return (EINVAL);
2935
2936 if (zc->zc_nvlist_src != 0 &&
2937 (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
2938 zc->zc_iflags, &nvprops)) != 0)
2939 return (error);
2940
2941 zct.zct_zplprops = NULL;
2942 zct.zct_props = nvprops;
2943
2944 if (zc->zc_value[0] != '\0') {
2945 /*
2946 * We're creating a clone of an existing snapshot.
2947 */
2948 zc->zc_value[sizeof (zc->zc_value) - 1] = '\0';
2949 if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0) {
2950 nvlist_free(nvprops);
2951 return (EINVAL);
2952 }
2953
2954 error = dmu_objset_hold(zc->zc_value, FTAG, &clone);
2955 if (error) {
2956 nvlist_free(nvprops);
2957 return (error);
2958 }
2959
2960 error = dmu_objset_clone(zc->zc_name, dmu_objset_ds(clone), 0);
2961 dmu_objset_rele(clone, FTAG);
2962 if (error) {
2963 nvlist_free(nvprops);
2964 return (error);
2965 }
2966 } else {
2967 boolean_t is_insensitive = B_FALSE;
2968
2969 if (cbfunc == NULL) {
2970 nvlist_free(nvprops);
2971 return (EINVAL);
2972 }
2973
2974 if (type == DMU_OST_ZVOL) {
2975 uint64_t volsize, volblocksize;
2976
2977 if (nvprops == NULL ||
2978 nvlist_lookup_uint64(nvprops,
2979 zfs_prop_to_name(ZFS_PROP_VOLSIZE),
2980 &volsize) != 0) {
2981 nvlist_free(nvprops);
2982 return (EINVAL);
2983 }
2984
2985 if ((error = nvlist_lookup_uint64(nvprops,
2986 zfs_prop_to_name(ZFS_PROP_VOLBLOCKSIZE),
2987 &volblocksize)) != 0 && error != ENOENT) {
2988 nvlist_free(nvprops);
2989 return (EINVAL);
2990 }
2991
2992 if (error != 0)
2993 volblocksize = zfs_prop_default_numeric(
2994 ZFS_PROP_VOLBLOCKSIZE);
2995
2996 if ((error = zvol_check_volblocksize(
2997 volblocksize)) != 0 ||
2998 (error = zvol_check_volsize(volsize,
2999 volblocksize)) != 0) {
3000 nvlist_free(nvprops);
3001 return (error);
3002 }
3003 } else if (type == DMU_OST_ZFS) {
3004 int error;
3005
3006 /*
3007 * We have to have normalization and
3008 * case-folding flags correct when we do the
3009 * file system creation, so go figure them out
3010 * now.
3011 */
3012 VERIFY(nvlist_alloc(&zct.zct_zplprops,
3013 NV_UNIQUE_NAME, KM_SLEEP) == 0);
3014 error = zfs_fill_zplprops(zc->zc_name, nvprops,
3015 zct.zct_zplprops, &is_insensitive);
3016 if (error != 0) {
3017 nvlist_free(nvprops);
3018 nvlist_free(zct.zct_zplprops);
3019 return (error);
3020 }
3021 }
3022 error = dmu_objset_create(zc->zc_name, type,
3023 is_insensitive ? DS_FLAG_CI_DATASET : 0, cbfunc, &zct);
3024 nvlist_free(zct.zct_zplprops);
3025 }
3026
3027 /*
3028 * It would be nice to do this atomically.
3029 */
3030 if (error == 0) {
3031 error = zfs_set_prop_nvlist(zc->zc_name, ZPROP_SRC_LOCAL,
3032 nvprops, NULL);
3033 if (error != 0)
3034 (void) dmu_objset_destroy(zc->zc_name, B_FALSE);
3035 }
3036 nvlist_free(nvprops);
3037 return (error);
3038 }
3039
3040 /*
3041 * inputs:
3042 * zc_name name of filesystem
3043 * zc_value short name of snapshot
3044 * zc_cookie recursive flag
3045 * zc_nvlist_src[_size] property list
3046 *
3047 * outputs:
3048 * zc_value short snapname (i.e. part after the '@')
3049 */
3050 static int
3051 zfs_ioc_snapshot(zfs_cmd_t *zc)
3052 {
3053 nvlist_t *nvprops = NULL;
3054 int error;
3055 boolean_t recursive = zc->zc_cookie;
3056
3057 if (snapshot_namecheck(zc->zc_value, NULL, NULL) != 0)
3058 return (EINVAL);
3059
3060 if (zc->zc_nvlist_src != 0 &&
3061 (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
3062 zc->zc_iflags, &nvprops)) != 0)
3063 return (error);
3064
3065 error = zfs_check_userprops(zc->zc_name, nvprops);
3066 if (error)
3067 goto out;
3068
3069 if (!nvlist_empty(nvprops) &&
3070 zfs_earlier_version(zc->zc_name, SPA_VERSION_SNAP_PROPS)) {
3071 error = ENOTSUP;
3072 goto out;
3073 }
3074
3075 error = dmu_objset_snapshot(zc->zc_name, zc->zc_value, NULL,
3076 nvprops, recursive, B_FALSE, -1);
3077
3078 out:
3079 nvlist_free(nvprops);
3080 return (error);
3081 }
3082
3083 /*
3084 * inputs:
3085 * name dataset name, or when 'arg == NULL' the full snapshot name
3086 * arg short snapshot name (i.e. part after the '@')
3087 */
3088 int
3089 zfs_unmount_snap(const char *name, void *arg)
3090 {
3091 zfs_sb_t *zsb = NULL;
3092 char *dsname;
3093 char *snapname;
3094 char *fullname;
3095 char *ptr;
3096 int error;
3097
3098 if (arg) {
3099 dsname = strdup(name);
3100 snapname = strdup(arg);
3101 } else {
3102 ptr = strchr(name, '@');
3103 if (ptr) {
3104 dsname = strdup(name);
3105 dsname[ptr - name] = '\0';
3106 snapname = strdup(ptr + 1);
3107 } else {
3108 return (0);
3109 }
3110 }
3111
3112 fullname = kmem_asprintf("%s@%s", dsname, snapname);
3113
3114 error = zfs_sb_hold(dsname, FTAG, &zsb, B_FALSE);
3115 if (error == 0) {
3116 error = zfsctl_unmount_snapshot(zsb, fullname, MNT_FORCE);
3117 zfs_sb_rele(zsb, FTAG);
3118
3119 /* Allow ENOENT for consistency with upstream */
3120 if (error == ENOENT)
3121 error = 0;
3122 }
3123
3124 strfree(dsname);
3125 strfree(snapname);
3126 strfree(fullname);
3127
3128 return (error);
3129 }
3130
3131 /*
3132 * inputs:
3133 * zc_name name of filesystem, snaps must be under it
3134 * zc_nvlist_src[_size] full names of snapshots to destroy
3135 * zc_defer_destroy mark for deferred destroy
3136 *
3137 * outputs:
3138 * zc_name on failure, name of failed snapshot
3139 */
3140 static int
3141 zfs_ioc_destroy_snaps_nvl(zfs_cmd_t *zc)
3142 {
3143 int err, len;
3144 nvlist_t *nvl;
3145 nvpair_t *pair;
3146
3147 if ((err = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
3148 zc->zc_iflags, &nvl)) != 0)
3149 return (err);
3150
3151 len = strlen(zc->zc_name);
3152 for (pair = nvlist_next_nvpair(nvl, NULL); pair != NULL;
3153 pair = nvlist_next_nvpair(nvl, pair)) {
3154 const char *name = nvpair_name(pair);
3155 /*
3156 * The snap name must be underneath the zc_name. This ensures
3157 * that our permission checks were legitimate.
3158 */
3159 if (strncmp(zc->zc_name, name, len) != 0 ||
3160 (name[len] != '@' && name[len] != '/')) {
3161 nvlist_free(nvl);
3162 return (EINVAL);
3163 }
3164
3165 (void) zfs_unmount_snap(name, NULL);
3166 (void) zvol_remove_minor(name);
3167 }
3168
3169 err = dmu_snapshots_destroy_nvl(nvl, zc->zc_defer_destroy,
3170 zc->zc_name);
3171 nvlist_free(nvl);
3172 return (err);
3173 }
3174
3175 /*
3176 * inputs:
3177 * zc_name name of dataset to destroy
3178 * zc_objset_type type of objset
3179 * zc_defer_destroy mark for deferred destroy
3180 *
3181 * outputs: none
3182 */
3183 static int
3184 zfs_ioc_destroy(zfs_cmd_t *zc)
3185 {
3186 int err;
3187 if (strchr(zc->zc_name, '@') && zc->zc_objset_type == DMU_OST_ZFS) {
3188 err = zfs_unmount_snap(zc->zc_name, NULL);
3189 if (err)
3190 return (err);
3191 }
3192
3193 err = dmu_objset_destroy(zc->zc_name, zc->zc_defer_destroy);
3194 if (zc->zc_objset_type == DMU_OST_ZVOL && err == 0)
3195 (void) zvol_remove_minor(zc->zc_name);
3196 return (err);
3197 }
3198
3199 /*
3200 * inputs:
3201 * zc_name name of dataset to rollback (to most recent snapshot)
3202 *
3203 * outputs: none
3204 */
3205 static int
3206 zfs_ioc_rollback(zfs_cmd_t *zc)
3207 {
3208 dsl_dataset_t *ds, *clone;
3209 int error;
3210 zfs_sb_t *zsb;
3211 char *clone_name;
3212
3213 error = dsl_dataset_hold(zc->zc_name, FTAG, &ds);
3214 if (error)
3215 return (error);
3216
3217 /* must not be a snapshot */
3218 if (dsl_dataset_is_snapshot(ds)) {
3219 dsl_dataset_rele(ds, FTAG);
3220 return (EINVAL);
3221 }
3222
3223 /* must have a most recent snapshot */
3224 if (ds->ds_phys->ds_prev_snap_txg < TXG_INITIAL) {
3225 dsl_dataset_rele(ds, FTAG);
3226 return (EINVAL);
3227 }
3228
3229 /*
3230 * Create clone of most recent snapshot.
3231 */
3232 clone_name = kmem_asprintf("%s/%%rollback", zc->zc_name);
3233 error = dmu_objset_clone(clone_name, ds->ds_prev, DS_FLAG_INCONSISTENT);
3234 if (error)
3235 goto out;
3236
3237 error = dsl_dataset_own(clone_name, B_TRUE, FTAG, &clone);
3238 if (error)
3239 goto out;
3240
3241 /*
3242 * Do clone swap.
3243 */
3244 if (get_zfs_sb(zc->zc_name, &zsb) == 0) {
3245 error = zfs_suspend_fs(zsb);
3246 if (error == 0) {
3247 int resume_err;
3248
3249 if (dsl_dataset_tryown(ds, B_FALSE, FTAG)) {
3250 error = dsl_dataset_clone_swap(clone, ds,
3251 B_TRUE);
3252 dsl_dataset_disown(ds, FTAG);
3253 ds = NULL;
3254 } else {
3255 error = EBUSY;
3256 }
3257 resume_err = zfs_resume_fs(zsb, zc->zc_name);
3258 error = error ? error : resume_err;
3259 }
3260 deactivate_super(zsb->z_sb);
3261 } else {
3262 if (dsl_dataset_tryown(ds, B_FALSE, FTAG)) {
3263 error = dsl_dataset_clone_swap(clone, ds, B_TRUE);
3264 dsl_dataset_disown(ds, FTAG);
3265 ds = NULL;
3266 } else {
3267 error = EBUSY;
3268 }
3269 }
3270
3271 /*
3272 * Destroy clone (which also closes it).
3273 */
3274 (void) dsl_dataset_destroy(clone, FTAG, B_FALSE);
3275
3276 out:
3277 strfree(clone_name);
3278 if (ds)
3279 dsl_dataset_rele(ds, FTAG);
3280 return (error);
3281 }
3282
3283 /*
3284 * inputs:
3285 * zc_name old name of dataset
3286 * zc_value new name of dataset
3287 * zc_cookie recursive flag (only valid for snapshots)
3288 *
3289 * outputs: none
3290 */
3291 static int
3292 zfs_ioc_rename(zfs_cmd_t *zc)
3293 {
3294 boolean_t recursive = zc->zc_cookie & 1;
3295 int err;
3296
3297 zc->zc_value[sizeof (zc->zc_value) - 1] = '\0';
3298 if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
3299 strchr(zc->zc_value, '%'))
3300 return (EINVAL);
3301
3302 /*
3303 * Unmount snapshot unless we're doing a recursive rename,
3304 * in which case the dataset code figures out which snapshots
3305 * to unmount.
3306 */
3307 if (!recursive && strchr(zc->zc_name, '@') != NULL &&
3308 zc->zc_objset_type == DMU_OST_ZFS) {
3309 err = zfs_unmount_snap(zc->zc_name, NULL);
3310 if (err)
3311 return (err);
3312 }
3313
3314 err = dmu_objset_rename(zc->zc_name, zc->zc_value, recursive);
3315 if ((err == 0) && (zc->zc_objset_type == DMU_OST_ZVOL)) {
3316 (void) zvol_remove_minor(zc->zc_name);
3317 (void) zvol_create_minor(zc->zc_value);
3318 }
3319
3320 return (err);
3321 }
3322
3323 static int
3324 zfs_check_settable(const char *dsname, nvpair_t *pair, cred_t *cr)
3325 {
3326 const char *propname = nvpair_name(pair);
3327 boolean_t issnap = (strchr(dsname, '@') != NULL);
3328 zfs_prop_t prop = zfs_name_to_prop(propname);
3329 uint64_t intval;
3330 int err;
3331
3332 if (prop == ZPROP_INVAL) {
3333 if (zfs_prop_user(propname)) {
3334 if ((err = zfs_secpolicy_write_perms(dsname,
3335 ZFS_DELEG_PERM_USERPROP, cr)))
3336 return (err);
3337 return (0);
3338 }
3339
3340 if (!issnap && zfs_prop_userquota(propname)) {
3341 const char *perm = NULL;
3342 const char *uq_prefix =
3343 zfs_userquota_prop_prefixes[ZFS_PROP_USERQUOTA];
3344 const char *gq_prefix =
3345 zfs_userquota_prop_prefixes[ZFS_PROP_GROUPQUOTA];
3346
3347 if (strncmp(propname, uq_prefix,
3348 strlen(uq_prefix)) == 0) {
3349 perm = ZFS_DELEG_PERM_USERQUOTA;
3350 } else if (strncmp(propname, gq_prefix,
3351 strlen(gq_prefix)) == 0) {
3352 perm = ZFS_DELEG_PERM_GROUPQUOTA;
3353 } else {
3354 /* USERUSED and GROUPUSED are read-only */
3355 return (EINVAL);
3356 }
3357
3358 if ((err = zfs_secpolicy_write_perms(dsname, perm, cr)))
3359 return (err);
3360 return (0);
3361 }
3362
3363 return (EINVAL);
3364 }
3365
3366 if (issnap)
3367 return (EINVAL);
3368
3369 if (nvpair_type(pair) == DATA_TYPE_NVLIST) {
3370 /*
3371 * dsl_prop_get_all_impl() returns properties in this
3372 * format.
3373 */
3374 nvlist_t *attrs;
3375 VERIFY(nvpair_value_nvlist(pair, &attrs) == 0);
3376 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3377 &pair) == 0);
3378 }
3379
3380 /*
3381 * Check that this value is valid for this pool version
3382 */
3383 switch (prop) {
3384 case ZFS_PROP_COMPRESSION:
3385 /*
3386 * If the user specified gzip compression, make sure
3387 * the SPA supports it. We ignore any errors here since
3388 * we'll catch them later.
3389 */
3390 if (nvpair_type(pair) == DATA_TYPE_UINT64 &&
3391 nvpair_value_uint64(pair, &intval) == 0) {
3392 if (intval >= ZIO_COMPRESS_GZIP_1 &&
3393 intval <= ZIO_COMPRESS_GZIP_9 &&
3394 zfs_earlier_version(dsname,
3395 SPA_VERSION_GZIP_COMPRESSION)) {
3396 return (ENOTSUP);
3397 }
3398
3399 if (intval == ZIO_COMPRESS_ZLE &&
3400 zfs_earlier_version(dsname,
3401 SPA_VERSION_ZLE_COMPRESSION))
3402 return (ENOTSUP);
3403
3404 /*
3405 * If this is a bootable dataset then
3406 * verify that the compression algorithm
3407 * is supported for booting. We must return
3408 * something other than ENOTSUP since it
3409 * implies a downrev pool version.
3410 */
3411 if (zfs_is_bootfs(dsname) &&
3412 !BOOTFS_COMPRESS_VALID(intval)) {
3413 return (ERANGE);
3414 }
3415 }
3416 break;
3417
3418 case ZFS_PROP_COPIES:
3419 if (zfs_earlier_version(dsname, SPA_VERSION_DITTO_BLOCKS))
3420 return (ENOTSUP);
3421 break;
3422
3423 case ZFS_PROP_DEDUP:
3424 if (zfs_earlier_version(dsname, SPA_VERSION_DEDUP))
3425 return (ENOTSUP);
3426 break;
3427
3428 case ZFS_PROP_SHARESMB:
3429 if (zpl_earlier_version(dsname, ZPL_VERSION_FUID))
3430 return (ENOTSUP);
3431 break;
3432
3433 case ZFS_PROP_ACLINHERIT:
3434 if (nvpair_type(pair) == DATA_TYPE_UINT64 &&
3435 nvpair_value_uint64(pair, &intval) == 0) {
3436 if (intval == ZFS_ACL_PASSTHROUGH_X &&
3437 zfs_earlier_version(dsname,
3438 SPA_VERSION_PASSTHROUGH_X))
3439 return (ENOTSUP);
3440 }
3441 break;
3442 default:
3443 break;
3444 }
3445
3446 return (zfs_secpolicy_setprop(dsname, prop, pair, CRED()));
3447 }
3448
3449 /*
3450 * Removes properties from the given props list that fail permission checks
3451 * needed to clear them and to restore them in case of a receive error. For each
3452 * property, make sure we have both set and inherit permissions.
3453 *
3454 * Returns the first error encountered if any permission checks fail. If the
3455 * caller provides a non-NULL errlist, it also gives the complete list of names
3456 * of all the properties that failed a permission check along with the
3457 * corresponding error numbers. The caller is responsible for freeing the
3458 * returned errlist.
3459 *
3460 * If every property checks out successfully, zero is returned and the list
3461 * pointed at by errlist is NULL.
3462 */
3463 static int
3464 zfs_check_clearable(char *dataset, nvlist_t *props, nvlist_t **errlist)
3465 {
3466 zfs_cmd_t *zc;
3467 nvpair_t *pair, *next_pair;
3468 nvlist_t *errors;
3469 int err, rv = 0;
3470
3471 if (props == NULL)
3472 return (0);
3473
3474 VERIFY(nvlist_alloc(&errors, NV_UNIQUE_NAME, KM_SLEEP) == 0);
3475
3476 zc = kmem_alloc(sizeof (zfs_cmd_t), KM_SLEEP | KM_NODEBUG);
3477 (void) strcpy(zc->zc_name, dataset);
3478 pair = nvlist_next_nvpair(props, NULL);
3479 while (pair != NULL) {
3480 next_pair = nvlist_next_nvpair(props, pair);
3481
3482 (void) strcpy(zc->zc_value, nvpair_name(pair));
3483 if ((err = zfs_check_settable(dataset, pair, CRED())) != 0 ||
3484 (err = zfs_secpolicy_inherit(zc, CRED())) != 0) {
3485 VERIFY(nvlist_remove_nvpair(props, pair) == 0);
3486 VERIFY(nvlist_add_int32(errors,
3487 zc->zc_value, err) == 0);
3488 }
3489 pair = next_pair;
3490 }
3491 kmem_free(zc, sizeof (zfs_cmd_t));
3492
3493 if ((pair = nvlist_next_nvpair(errors, NULL)) == NULL) {
3494 nvlist_free(errors);
3495 errors = NULL;
3496 } else {
3497 VERIFY(nvpair_value_int32(pair, &rv) == 0);
3498 }
3499
3500 if (errlist == NULL)
3501 nvlist_free(errors);
3502 else
3503 *errlist = errors;
3504
3505 return (rv);
3506 }
3507
3508 static boolean_t
3509 propval_equals(nvpair_t *p1, nvpair_t *p2)
3510 {
3511 if (nvpair_type(p1) == DATA_TYPE_NVLIST) {
3512 /* dsl_prop_get_all_impl() format */
3513 nvlist_t *attrs;
3514 VERIFY(nvpair_value_nvlist(p1, &attrs) == 0);
3515 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3516 &p1) == 0);
3517 }
3518
3519 if (nvpair_type(p2) == DATA_TYPE_NVLIST) {
3520 nvlist_t *attrs;
3521 VERIFY(nvpair_value_nvlist(p2, &attrs) == 0);
3522 VERIFY(nvlist_lookup_nvpair(attrs, ZPROP_VALUE,
3523 &p2) == 0);
3524 }
3525
3526 if (nvpair_type(p1) != nvpair_type(p2))
3527 return (B_FALSE);
3528
3529 if (nvpair_type(p1) == DATA_TYPE_STRING) {
3530 char *valstr1, *valstr2;
3531
3532 VERIFY(nvpair_value_string(p1, (char **)&valstr1) == 0);
3533 VERIFY(nvpair_value_string(p2, (char **)&valstr2) == 0);
3534 return (strcmp(valstr1, valstr2) == 0);
3535 } else {
3536 uint64_t intval1, intval2;
3537
3538 VERIFY(nvpair_value_uint64(p1, &intval1) == 0);
3539 VERIFY(nvpair_value_uint64(p2, &intval2) == 0);
3540 return (intval1 == intval2);
3541 }
3542 }
3543
3544 /*
3545 * Remove properties from props if they are not going to change (as determined
3546 * by comparison with origprops). Remove them from origprops as well, since we
3547 * do not need to clear or restore properties that won't change.
3548 */
3549 static void
3550 props_reduce(nvlist_t *props, nvlist_t *origprops)
3551 {
3552 nvpair_t *pair, *next_pair;
3553
3554 if (origprops == NULL)
3555 return; /* all props need to be received */
3556
3557 pair = nvlist_next_nvpair(props, NULL);
3558 while (pair != NULL) {
3559 const char *propname = nvpair_name(pair);
3560 nvpair_t *match;
3561
3562 next_pair = nvlist_next_nvpair(props, pair);
3563
3564 if ((nvlist_lookup_nvpair(origprops, propname,
3565 &match) != 0) || !propval_equals(pair, match))
3566 goto next; /* need to set received value */
3567
3568 /* don't clear the existing received value */
3569 (void) nvlist_remove_nvpair(origprops, match);
3570 /* don't bother receiving the property */
3571 (void) nvlist_remove_nvpair(props, pair);
3572 next:
3573 pair = next_pair;
3574 }
3575 }
3576
3577 #ifdef DEBUG
3578 static boolean_t zfs_ioc_recv_inject_err;
3579 #endif
3580
3581 /*
3582 * inputs:
3583 * zc_name name of containing filesystem
3584 * zc_nvlist_src{_size} nvlist of properties to apply
3585 * zc_value name of snapshot to create
3586 * zc_string name of clone origin (if DRR_FLAG_CLONE)
3587 * zc_cookie file descriptor to recv from
3588 * zc_begin_record the BEGIN record of the stream (not byteswapped)
3589 * zc_guid force flag
3590 * zc_cleanup_fd cleanup-on-exit file descriptor
3591 * zc_action_handle handle for this guid/ds mapping (or zero on first call)
3592 *
3593 * outputs:
3594 * zc_cookie number of bytes read
3595 * zc_nvlist_dst{_size} error for each unapplied received property
3596 * zc_obj zprop_errflags_t
3597 * zc_action_handle handle for this guid/ds mapping
3598 */
3599 static int
3600 zfs_ioc_recv(zfs_cmd_t *zc)
3601 {
3602 file_t *fp;
3603 objset_t *os;
3604 dmu_recv_cookie_t drc;
3605 boolean_t force = (boolean_t)zc->zc_guid;
3606 int fd;
3607 int error = 0;
3608 int props_error = 0;
3609 nvlist_t *errors;
3610 offset_t off;
3611 nvlist_t *props = NULL; /* sent properties */
3612 nvlist_t *origprops = NULL; /* existing properties */
3613 objset_t *origin = NULL;
3614 char *tosnap;
3615 char tofs[ZFS_MAXNAMELEN];
3616 boolean_t first_recvd_props = B_FALSE;
3617
3618 if (dataset_namecheck(zc->zc_value, NULL, NULL) != 0 ||
3619 strchr(zc->zc_value, '@') == NULL ||
3620 strchr(zc->zc_value, '%'))
3621 return (EINVAL);
3622
3623 (void) strcpy(tofs, zc->zc_value);
3624 tosnap = strchr(tofs, '@');
3625 *tosnap++ = '\0';
3626
3627 if (zc->zc_nvlist_src != 0 &&
3628 (error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
3629 zc->zc_iflags, &props)) != 0)
3630 return (error);
3631
3632 fd = zc->zc_cookie;
3633 fp = getf(fd);
3634 if (fp == NULL) {
3635 nvlist_free(props);
3636 return (EBADF);
3637 }
3638
3639 VERIFY(nvlist_alloc(&errors, NV_UNIQUE_NAME, KM_SLEEP) == 0);
3640
3641 if (props && dmu_objset_hold(tofs, FTAG, &os) == 0) {
3642 if ((spa_version(os->os_spa) >= SPA_VERSION_RECVD_PROPS) &&
3643 !dsl_prop_get_hasrecvd(os)) {
3644 first_recvd_props = B_TRUE;
3645 }
3646
3647 /*
3648 * If new received properties are supplied, they are to
3649 * completely replace the existing received properties, so stash
3650 * away the existing ones.
3651 */
3652 if (dsl_prop_get_received(os, &origprops) == 0) {
3653 nvlist_t *errlist = NULL;
3654 /*
3655 * Don't bother writing a property if its value won't
3656 * change (and avoid the unnecessary security checks).
3657 *
3658 * The first receive after SPA_VERSION_RECVD_PROPS is a
3659 * special case where we blow away all local properties
3660 * regardless.
3661 */
3662 if (!first_recvd_props)
3663 props_reduce(props, origprops);
3664 if (zfs_check_clearable(tofs, origprops,
3665 &errlist) != 0)
3666 (void) nvlist_merge(errors, errlist, 0);
3667 nvlist_free(errlist);
3668 }
3669
3670 dmu_objset_rele(os, FTAG);
3671 }
3672
3673 if (zc->zc_string[0]) {
3674 error = dmu_objset_hold(zc->zc_string, FTAG, &origin);
3675 if (error)
3676 goto out;
3677 }
3678
3679 error = dmu_recv_begin(tofs, tosnap, zc->zc_top_ds,
3680 &zc->zc_begin_record, force, origin, &drc);
3681 if (origin)
3682 dmu_objset_rele(origin, FTAG);
3683 if (error)
3684 goto out;
3685
3686 /*
3687 * Set properties before we receive the stream so that they are applied
3688 * to the new data. Note that we must call dmu_recv_stream() if
3689 * dmu_recv_begin() succeeds.
3690 */
3691 if (props) {
3692 nvlist_t *errlist;
3693
3694 if (dmu_objset_from_ds(drc.drc_logical_ds, &os) == 0) {
3695 if (drc.drc_newfs) {
3696 if (spa_version(os->os_spa) >=
3697 SPA_VERSION_RECVD_PROPS)
3698 first_recvd_props = B_TRUE;
3699 } else if (origprops != NULL) {
3700 if (clear_received_props(os, tofs, origprops,
3701 first_recvd_props ? NULL : props) != 0)
3702 zc->zc_obj |= ZPROP_ERR_NOCLEAR;
3703 } else {
3704 zc->zc_obj |= ZPROP_ERR_NOCLEAR;
3705 }
3706 dsl_prop_set_hasrecvd(os);
3707 } else if (!drc.drc_newfs) {
3708 zc->zc_obj |= ZPROP_ERR_NOCLEAR;
3709 }
3710
3711 (void) zfs_set_prop_nvlist(tofs, ZPROP_SRC_RECEIVED,
3712 props, &errlist);
3713 (void) nvlist_merge(errors, errlist, 0);
3714 nvlist_free(errlist);
3715 }
3716
3717 if (fit_error_list(zc, &errors) != 0 || put_nvlist(zc, errors) != 0) {
3718 /*
3719 * Caller made zc->zc_nvlist_dst less than the minimum expected
3720 * size or supplied an invalid address.
3721 */
3722 props_error = EINVAL;
3723 }
3724
3725 off = fp->f_offset;
3726 error = dmu_recv_stream(&drc, fp->f_vnode, &off, zc->zc_cleanup_fd,
3727 &zc->zc_action_handle);
3728
3729 if (error == 0) {
3730 zfs_sb_t *zsb = NULL;
3731
3732 if (get_zfs_sb(tofs, &zsb) == 0) {
3733 /* online recv */
3734 int end_err;
3735
3736 error = zfs_suspend_fs(zsb);
3737 /*
3738 * If the suspend fails, then the recv_end will
3739 * likely also fail, and clean up after itself.
3740 */
3741 end_err = dmu_recv_end(&drc);
3742 if (error == 0)
3743 error = zfs_resume_fs(zsb, tofs);
3744 error = error ? error : end_err;
3745 deactivate_super(zsb->z_sb);
3746 } else {
3747 error = dmu_recv_end(&drc);
3748 }
3749 }
3750
3751 zc->zc_cookie = off - fp->f_offset;
3752 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
3753 fp->f_offset = off;
3754
3755 #ifdef DEBUG
3756 if (zfs_ioc_recv_inject_err) {
3757 zfs_ioc_recv_inject_err = B_FALSE;
3758 error = 1;
3759 }
3760 #endif
3761 /*
3762 * On error, restore the original props.
3763 */
3764 if (error && props) {
3765 if (dmu_objset_hold(tofs, FTAG, &os) == 0) {
3766 if (clear_received_props(os, tofs, props, NULL) != 0) {
3767 /*
3768 * We failed to clear the received properties.
3769 * Since we may have left a $recvd value on the
3770 * system, we can't clear the $hasrecvd flag.
3771 */
3772 zc->zc_obj |= ZPROP_ERR_NORESTORE;
3773 } else if (first_recvd_props) {
3774 dsl_prop_unset_hasrecvd(os);
3775 }
3776 dmu_objset_rele(os, FTAG);
3777 } else if (!drc.drc_newfs) {
3778 /* We failed to clear the received properties. */
3779 zc->zc_obj |= ZPROP_ERR_NORESTORE;
3780 }
3781
3782 if (origprops == NULL && !drc.drc_newfs) {
3783 /* We failed to stash the original properties. */
3784 zc->zc_obj |= ZPROP_ERR_NORESTORE;
3785 }
3786
3787 /*
3788 * dsl_props_set() will not convert RECEIVED to LOCAL on or
3789 * after SPA_VERSION_RECVD_PROPS, so we need to specify LOCAL
3790 * explictly if we're restoring local properties cleared in the
3791 * first new-style receive.
3792 */
3793 if (origprops != NULL &&
3794 zfs_set_prop_nvlist(tofs, (first_recvd_props ?
3795 ZPROP_SRC_LOCAL : ZPROP_SRC_RECEIVED),
3796 origprops, NULL) != 0) {
3797 /*
3798 * We stashed the original properties but failed to
3799 * restore them.
3800 */
3801 zc->zc_obj |= ZPROP_ERR_NORESTORE;
3802 }
3803 }
3804 out:
3805 nvlist_free(props);
3806 nvlist_free(origprops);
3807 nvlist_free(errors);
3808 releasef(fd);
3809
3810 if (error == 0)
3811 error = props_error;
3812
3813 return (error);
3814 }
3815
3816 /*
3817 * inputs:
3818 * zc_name name of snapshot to send
3819 * zc_cookie file descriptor to send stream to
3820 * zc_obj fromorigin flag (mutually exclusive with zc_fromobj)
3821 * zc_sendobj objsetid of snapshot to send
3822 * zc_fromobj objsetid of incremental fromsnap (may be zero)
3823 * zc_guid if set, estimate size of stream only. zc_cookie is ignored.
3824 * output size in zc_objset_type.
3825 *
3826 * outputs: none
3827 */
3828 static int
3829 zfs_ioc_send(zfs_cmd_t *zc)
3830 {
3831 objset_t *fromsnap = NULL;
3832 objset_t *tosnap;
3833 int error;
3834 offset_t off;
3835 dsl_dataset_t *ds;
3836 dsl_dataset_t *dsfrom = NULL;
3837 spa_t *spa;
3838 dsl_pool_t *dp;
3839 boolean_t estimate = (zc->zc_guid != 0);
3840
3841 error = spa_open(zc->zc_name, &spa, FTAG);
3842 if (error)
3843 return (error);
3844
3845 dp = spa_get_dsl(spa);
3846 rw_enter(&dp->dp_config_rwlock, RW_READER);
3847 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &ds);
3848 rw_exit(&dp->dp_config_rwlock);
3849 if (error) {
3850 spa_close(spa, FTAG);
3851 return (error);
3852 }
3853
3854 error = dmu_objset_from_ds(ds, &tosnap);
3855 if (error) {
3856 dsl_dataset_rele(ds, FTAG);
3857 spa_close(spa, FTAG);
3858 return (error);
3859 }
3860
3861 if (zc->zc_fromobj != 0) {
3862 rw_enter(&dp->dp_config_rwlock, RW_READER);
3863 error = dsl_dataset_hold_obj(dp, zc->zc_fromobj, FTAG, &dsfrom);
3864 rw_exit(&dp->dp_config_rwlock);
3865 spa_close(spa, FTAG);
3866 if (error) {
3867 dsl_dataset_rele(ds, FTAG);
3868 return (error);
3869 }
3870 error = dmu_objset_from_ds(dsfrom, &fromsnap);
3871 if (error) {
3872 dsl_dataset_rele(dsfrom, FTAG);
3873 dsl_dataset_rele(ds, FTAG);
3874 return (error);
3875 }
3876 } else {
3877 spa_close(spa, FTAG);
3878 }
3879
3880 if (estimate) {
3881 error = dmu_send_estimate(tosnap, fromsnap, zc->zc_obj,
3882 &zc->zc_objset_type);
3883 } else {
3884 file_t *fp = getf(zc->zc_cookie);
3885 if (fp == NULL) {
3886 dsl_dataset_rele(ds, FTAG);
3887 if (dsfrom)
3888 dsl_dataset_rele(dsfrom, FTAG);
3889 return (EBADF);
3890 }
3891
3892 off = fp->f_offset;
3893 error = dmu_sendbackup(tosnap, fromsnap, zc->zc_obj,
3894 fp->f_vnode, &off);
3895
3896 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
3897 fp->f_offset = off;
3898 releasef(zc->zc_cookie);
3899 }
3900 if (dsfrom)
3901 dsl_dataset_rele(dsfrom, FTAG);
3902 dsl_dataset_rele(ds, FTAG);
3903 return (error);
3904 }
3905
3906 static int
3907 zfs_ioc_inject_fault(zfs_cmd_t *zc)
3908 {
3909 int id, error;
3910
3911 error = zio_inject_fault(zc->zc_name, (int)zc->zc_guid, &id,
3912 &zc->zc_inject_record);
3913
3914 if (error == 0)
3915 zc->zc_guid = (uint64_t)id;
3916
3917 return (error);
3918 }
3919
3920 static int
3921 zfs_ioc_clear_fault(zfs_cmd_t *zc)
3922 {
3923 return (zio_clear_fault((int)zc->zc_guid));
3924 }
3925
3926 static int
3927 zfs_ioc_inject_list_next(zfs_cmd_t *zc)
3928 {
3929 int id = (int)zc->zc_guid;
3930 int error;
3931
3932 error = zio_inject_list_next(&id, zc->zc_name, sizeof (zc->zc_name),
3933 &zc->zc_inject_record);
3934
3935 zc->zc_guid = id;
3936
3937 return (error);
3938 }
3939
3940 static int
3941 zfs_ioc_error_log(zfs_cmd_t *zc)
3942 {
3943 spa_t *spa;
3944 int error;
3945 size_t count = (size_t)zc->zc_nvlist_dst_size;
3946
3947 if ((error = spa_open(zc->zc_name, &spa, FTAG)) != 0)
3948 return (error);
3949
3950 error = spa_get_errlog(spa, (void *)(uintptr_t)zc->zc_nvlist_dst,
3951 &count);
3952 if (error == 0)
3953 zc->zc_nvlist_dst_size = count;
3954 else
3955 zc->zc_nvlist_dst_size = spa_get_errlog_size(spa);
3956
3957 spa_close(spa, FTAG);
3958
3959 return (error);
3960 }
3961
3962 static int
3963 zfs_ioc_clear(zfs_cmd_t *zc)
3964 {
3965 spa_t *spa;
3966 vdev_t *vd;
3967 int error;
3968
3969 /*
3970 * On zpool clear we also fix up missing slogs
3971 */
3972 mutex_enter(&spa_namespace_lock);
3973 spa = spa_lookup(zc->zc_name);
3974 if (spa == NULL) {
3975 mutex_exit(&spa_namespace_lock);
3976 return (EIO);
3977 }
3978 if (spa_get_log_state(spa) == SPA_LOG_MISSING) {
3979 /* we need to let spa_open/spa_load clear the chains */
3980 spa_set_log_state(spa, SPA_LOG_CLEAR);
3981 }
3982 spa->spa_last_open_failed = 0;
3983 mutex_exit(&spa_namespace_lock);
3984
3985 if (zc->zc_cookie & ZPOOL_NO_REWIND) {
3986 error = spa_open(zc->zc_name, &spa, FTAG);
3987 } else {
3988 nvlist_t *policy;
3989 nvlist_t *config = NULL;
3990
3991 if (zc->zc_nvlist_src == 0)
3992 return (EINVAL);
3993
3994 if ((error = get_nvlist(zc->zc_nvlist_src,
3995 zc->zc_nvlist_src_size, zc->zc_iflags, &policy)) == 0) {
3996 error = spa_open_rewind(zc->zc_name, &spa, FTAG,
3997 policy, &config);
3998 if (config != NULL) {
3999 int err;
4000
4001 if ((err = put_nvlist(zc, config)) != 0)
4002 error = err;
4003 nvlist_free(config);
4004 }
4005 nvlist_free(policy);
4006 }
4007 }
4008
4009 if (error)
4010 return (error);
4011
4012 spa_vdev_state_enter(spa, SCL_NONE);
4013
4014 if (zc->zc_guid == 0) {
4015 vd = NULL;
4016 } else {
4017 vd = spa_lookup_by_guid(spa, zc->zc_guid, B_TRUE);
4018 if (vd == NULL) {
4019 (void) spa_vdev_state_exit(spa, NULL, ENODEV);
4020 spa_close(spa, FTAG);
4021 return (ENODEV);
4022 }
4023 }
4024
4025 vdev_clear(spa, vd);
4026
4027 (void) spa_vdev_state_exit(spa, NULL, 0);
4028
4029 /*
4030 * Resume any suspended I/Os.
4031 */
4032 if (zio_resume(spa) != 0)
4033 error = EIO;
4034
4035 spa_close(spa, FTAG);
4036
4037 return (error);
4038 }
4039
4040 static int
4041 zfs_ioc_pool_reopen(zfs_cmd_t *zc)
4042 {
4043 spa_t *spa;
4044 int error;
4045
4046 error = spa_open(zc->zc_name, &spa, FTAG);
4047 if (error)
4048 return (error);
4049
4050 spa_vdev_state_enter(spa, SCL_NONE);
4051 vdev_reopen(spa->spa_root_vdev);
4052 (void) spa_vdev_state_exit(spa, NULL, 0);
4053 spa_close(spa, FTAG);
4054 return (0);
4055 }
4056 /*
4057 * inputs:
4058 * zc_name name of filesystem
4059 * zc_value name of origin snapshot
4060 *
4061 * outputs:
4062 * zc_string name of conflicting snapshot, if there is one
4063 */
4064 static int
4065 zfs_ioc_promote(zfs_cmd_t *zc)
4066 {
4067 char *cp;
4068
4069 /*
4070 * We don't need to unmount *all* the origin fs's snapshots, but
4071 * it's easier.
4072 */
4073 cp = strchr(zc->zc_value, '@');
4074 if (cp)
4075 *cp = '\0';
4076 (void) dmu_objset_find(zc->zc_value,
4077 zfs_unmount_snap, NULL, DS_FIND_SNAPSHOTS);
4078 return (dsl_dataset_promote(zc->zc_name, zc->zc_string));
4079 }
4080
4081 /*
4082 * Retrieve a single {user|group}{used|quota}@... property.
4083 *
4084 * inputs:
4085 * zc_name name of filesystem
4086 * zc_objset_type zfs_userquota_prop_t
4087 * zc_value domain name (eg. "S-1-234-567-89")
4088 * zc_guid RID/UID/GID
4089 *
4090 * outputs:
4091 * zc_cookie property value
4092 */
4093 static int
4094 zfs_ioc_userspace_one(zfs_cmd_t *zc)
4095 {
4096 zfs_sb_t *zsb;
4097 int error;
4098
4099 if (zc->zc_objset_type >= ZFS_NUM_USERQUOTA_PROPS)
4100 return (EINVAL);
4101
4102 error = zfs_sb_hold(zc->zc_name, FTAG, &zsb, B_FALSE);
4103 if (error)
4104 return (error);
4105
4106 error = zfs_userspace_one(zsb,
4107 zc->zc_objset_type, zc->zc_value, zc->zc_guid, &zc->zc_cookie);
4108 zfs_sb_rele(zsb, FTAG);
4109
4110 return (error);
4111 }
4112
4113 /*
4114 * inputs:
4115 * zc_name name of filesystem
4116 * zc_cookie zap cursor
4117 * zc_objset_type zfs_userquota_prop_t
4118 * zc_nvlist_dst[_size] buffer to fill (not really an nvlist)
4119 *
4120 * outputs:
4121 * zc_nvlist_dst[_size] data buffer (array of zfs_useracct_t)
4122 * zc_cookie zap cursor
4123 */
4124 static int
4125 zfs_ioc_userspace_many(zfs_cmd_t *zc)
4126 {
4127 zfs_sb_t *zsb;
4128 int bufsize = zc->zc_nvlist_dst_size;
4129 int error;
4130 void *buf;
4131
4132 if (bufsize <= 0)
4133 return (ENOMEM);
4134
4135 error = zfs_sb_hold(zc->zc_name, FTAG, &zsb, B_FALSE);
4136 if (error)
4137 return (error);
4138
4139 buf = vmem_alloc(bufsize, KM_SLEEP);
4140
4141 error = zfs_userspace_many(zsb, zc->zc_objset_type, &zc->zc_cookie,
4142 buf, &zc->zc_nvlist_dst_size);
4143
4144 if (error == 0) {
4145 error = xcopyout(buf,
4146 (void *)(uintptr_t)zc->zc_nvlist_dst,
4147 zc->zc_nvlist_dst_size);
4148 }
4149 vmem_free(buf, bufsize);
4150 zfs_sb_rele(zsb, FTAG);
4151
4152 return (error);
4153 }
4154
4155 /*
4156 * inputs:
4157 * zc_name name of filesystem
4158 *
4159 * outputs:
4160 * none
4161 */
4162 static int
4163 zfs_ioc_userspace_upgrade(zfs_cmd_t *zc)
4164 {
4165 objset_t *os;
4166 int error = 0;
4167 zfs_sb_t *zsb;
4168
4169 if (get_zfs_sb(zc->zc_name, &zsb) == 0) {
4170 if (!dmu_objset_userused_enabled(zsb->z_os)) {
4171 /*
4172 * If userused is not enabled, it may be because the
4173 * objset needs to be closed & reopened (to grow the
4174 * objset_phys_t). Suspend/resume the fs will do that.
4175 */
4176 error = zfs_suspend_fs(zsb);
4177 if (error == 0)
4178 error = zfs_resume_fs(zsb, zc->zc_name);
4179 }
4180 if (error == 0)
4181 error = dmu_objset_userspace_upgrade(zsb->z_os);
4182 deactivate_super(zsb->z_sb);
4183 } else {
4184 /* XXX kind of reading contents without owning */
4185 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4186 if (error)
4187 return (error);
4188
4189 error = dmu_objset_userspace_upgrade(os);
4190 dmu_objset_rele(os, FTAG);
4191 }
4192
4193 return (error);
4194 }
4195
4196 static int
4197 zfs_ioc_share(zfs_cmd_t *zc)
4198 {
4199 return (ENOSYS);
4200 }
4201
4202 ace_t full_access[] = {
4203 {(uid_t)-1, ACE_ALL_PERMS, ACE_EVERYONE, 0}
4204 };
4205
4206 /*
4207 * inputs:
4208 * zc_name name of containing filesystem
4209 * zc_obj object # beyond which we want next in-use object #
4210 *
4211 * outputs:
4212 * zc_obj next in-use object #
4213 */
4214 static int
4215 zfs_ioc_next_obj(zfs_cmd_t *zc)
4216 {
4217 objset_t *os = NULL;
4218 int error;
4219
4220 error = dmu_objset_hold(zc->zc_name, FTAG, &os);
4221 if (error)
4222 return (error);
4223
4224 error = dmu_object_next(os, &zc->zc_obj, B_FALSE,
4225 os->os_dsl_dataset->ds_phys->ds_prev_snap_txg);
4226
4227 dmu_objset_rele(os, FTAG);
4228 return (error);
4229 }
4230
4231 /*
4232 * inputs:
4233 * zc_name name of filesystem
4234 * zc_value prefix name for snapshot
4235 * zc_cleanup_fd cleanup-on-exit file descriptor for calling process
4236 *
4237 * outputs:
4238 */
4239 static int
4240 zfs_ioc_tmp_snapshot(zfs_cmd_t *zc)
4241 {
4242 char *snap_name;
4243 int error;
4244
4245 snap_name = kmem_asprintf("%s-%016llx", zc->zc_value,
4246 (u_longlong_t)ddi_get_lbolt64());
4247
4248 if (strlen(snap_name) >= MAXNAMELEN) {
4249 strfree(snap_name);
4250 return (E2BIG);
4251 }
4252
4253 error = dmu_objset_snapshot(zc->zc_name, snap_name, snap_name,
4254 NULL, B_FALSE, B_TRUE, zc->zc_cleanup_fd);
4255 if (error != 0) {
4256 strfree(snap_name);
4257 return (error);
4258 }
4259
4260 (void) strcpy(zc->zc_value, snap_name);
4261 strfree(snap_name);
4262 return (0);
4263 }
4264
4265 /*
4266 * inputs:
4267 * zc_name name of "to" snapshot
4268 * zc_value name of "from" snapshot
4269 * zc_cookie file descriptor to write diff data on
4270 *
4271 * outputs:
4272 * dmu_diff_record_t's to the file descriptor
4273 */
4274 static int
4275 zfs_ioc_diff(zfs_cmd_t *zc)
4276 {
4277 objset_t *fromsnap;
4278 objset_t *tosnap;
4279 file_t *fp;
4280 offset_t off;
4281 int error;
4282
4283 error = dmu_objset_hold(zc->zc_name, FTAG, &tosnap);
4284 if (error)
4285 return (error);
4286
4287 error = dmu_objset_hold(zc->zc_value, FTAG, &fromsnap);
4288 if (error) {
4289 dmu_objset_rele(tosnap, FTAG);
4290 return (error);
4291 }
4292
4293 fp = getf(zc->zc_cookie);
4294 if (fp == NULL) {
4295 dmu_objset_rele(fromsnap, FTAG);
4296 dmu_objset_rele(tosnap, FTAG);
4297 return (EBADF);
4298 }
4299
4300 off = fp->f_offset;
4301
4302 error = dmu_diff(tosnap, fromsnap, fp->f_vnode, &off);
4303
4304 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
4305 fp->f_offset = off;
4306 releasef(zc->zc_cookie);
4307
4308 dmu_objset_rele(fromsnap, FTAG);
4309 dmu_objset_rele(tosnap, FTAG);
4310 return (error);
4311 }
4312
4313 /*
4314 * Remove all ACL files in shares dir
4315 */
4316 #ifdef HAVE_SMB_SHARE
4317 static int
4318 zfs_smb_acl_purge(znode_t *dzp)
4319 {
4320 zap_cursor_t zc;
4321 zap_attribute_t zap;
4322 zfs_sb_t *zsb = ZTOZSB(dzp);
4323 int error;
4324
4325 for (zap_cursor_init(&zc, zsb->z_os, dzp->z_id);
4326 (error = zap_cursor_retrieve(&zc, &zap)) == 0;
4327 zap_cursor_advance(&zc)) {
4328 if ((error = VOP_REMOVE(ZTOV(dzp), zap.za_name, kcred,
4329 NULL, 0)) != 0)
4330 break;
4331 }
4332 zap_cursor_fini(&zc);
4333 return (error);
4334 }
4335 #endif /* HAVE_SMB_SHARE */
4336
4337 static int
4338 zfs_ioc_smb_acl(zfs_cmd_t *zc)
4339 {
4340 #ifdef HAVE_SMB_SHARE
4341 vnode_t *vp;
4342 znode_t *dzp;
4343 vnode_t *resourcevp = NULL;
4344 znode_t *sharedir;
4345 zfs_sb_t *zsb;
4346 nvlist_t *nvlist;
4347 char *src, *target;
4348 vattr_t vattr;
4349 vsecattr_t vsec;
4350 int error = 0;
4351
4352 if ((error = lookupname(zc->zc_value, UIO_SYSSPACE,
4353 NO_FOLLOW, NULL, &vp)) != 0)
4354 return (error);
4355
4356 /* Now make sure mntpnt and dataset are ZFS */
4357
4358 if (vp->v_vfsp->vfs_fstype != zfsfstype ||
4359 (strcmp((char *)refstr_value(vp->v_vfsp->vfs_resource),
4360 zc->zc_name) != 0)) {
4361 VN_RELE(vp);
4362 return (EINVAL);
4363 }
4364
4365 dzp = VTOZ(vp);
4366 zsb = ZTOZSB(dzp);
4367 ZFS_ENTER(zsb);
4368
4369 /*
4370 * Create share dir if its missing.
4371 */
4372 mutex_enter(&zsb->z_lock);
4373 if (zsb->z_shares_dir == 0) {
4374 dmu_tx_t *tx;
4375
4376 tx = dmu_tx_create(zsb->z_os);
4377 dmu_tx_hold_zap(tx, MASTER_NODE_OBJ, TRUE,
4378 ZFS_SHARES_DIR);
4379 dmu_tx_hold_zap(tx, DMU_NEW_OBJECT, FALSE, NULL);
4380 error = dmu_tx_assign(tx, TXG_WAIT);
4381 if (error) {
4382 dmu_tx_abort(tx);
4383 } else {
4384 error = zfs_create_share_dir(zsb, tx);
4385 dmu_tx_commit(tx);
4386 }
4387 if (error) {
4388 mutex_exit(&zsb->z_lock);
4389 VN_RELE(vp);
4390 ZFS_EXIT(zsb);
4391 return (error);
4392 }
4393 }
4394 mutex_exit(&zsb->z_lock);
4395
4396 ASSERT(zsb->z_shares_dir);
4397 if ((error = zfs_zget(zsb, zsb->z_shares_dir, &sharedir)) != 0) {
4398 VN_RELE(vp);
4399 ZFS_EXIT(zsb);
4400 return (error);
4401 }
4402
4403 switch (zc->zc_cookie) {
4404 case ZFS_SMB_ACL_ADD:
4405 vattr.va_mask = AT_MODE|AT_UID|AT_GID|AT_TYPE;
4406 vattr.va_mode = S_IFREG|0777;
4407 vattr.va_uid = 0;
4408 vattr.va_gid = 0;
4409
4410 vsec.vsa_mask = VSA_ACE;
4411 vsec.vsa_aclentp = &full_access;
4412 vsec.vsa_aclentsz = sizeof (full_access);
4413 vsec.vsa_aclcnt = 1;
4414
4415 error = VOP_CREATE(ZTOV(sharedir), zc->zc_string,
4416 &vattr, EXCL, 0, &resourcevp, kcred, 0, NULL, &vsec);
4417 if (resourcevp)
4418 VN_RELE(resourcevp);
4419 break;
4420
4421 case ZFS_SMB_ACL_REMOVE:
4422 error = VOP_REMOVE(ZTOV(sharedir), zc->zc_string, kcred,
4423 NULL, 0);
4424 break;
4425
4426 case ZFS_SMB_ACL_RENAME:
4427 if ((error = get_nvlist(zc->zc_nvlist_src,
4428 zc->zc_nvlist_src_size, zc->zc_iflags, &nvlist)) != 0) {
4429 VN_RELE(vp);
4430 ZFS_EXIT(zsb);
4431 return (error);
4432 }
4433 if (nvlist_lookup_string(nvlist, ZFS_SMB_ACL_SRC, &src) ||
4434 nvlist_lookup_string(nvlist, ZFS_SMB_ACL_TARGET,
4435 &target)) {
4436 VN_RELE(vp);
4437 VN_RELE(ZTOV(sharedir));
4438 ZFS_EXIT(zsb);
4439 nvlist_free(nvlist);
4440 return (error);
4441 }
4442 error = VOP_RENAME(ZTOV(sharedir), src, ZTOV(sharedir), target,
4443 kcred, NULL, 0);
4444 nvlist_free(nvlist);
4445 break;
4446
4447 case ZFS_SMB_ACL_PURGE:
4448 error = zfs_smb_acl_purge(sharedir);
4449 break;
4450
4451 default:
4452 error = EINVAL;
4453 break;
4454 }
4455
4456 VN_RELE(vp);
4457 VN_RELE(ZTOV(sharedir));
4458
4459 ZFS_EXIT(zsb);
4460
4461 return (error);
4462 #else
4463 return (ENOTSUP);
4464 #endif /* HAVE_SMB_SHARE */
4465 }
4466
4467 /*
4468 * inputs:
4469 * zc_name name of filesystem
4470 * zc_value short name of snap
4471 * zc_string user-supplied tag for this hold
4472 * zc_cookie recursive flag
4473 * zc_temphold set if hold is temporary
4474 * zc_cleanup_fd cleanup-on-exit file descriptor for calling process
4475 * zc_sendobj if non-zero, the objid for zc_name@zc_value
4476 * zc_createtxg if zc_sendobj is non-zero, snap must have zc_createtxg
4477 *
4478 * outputs: none
4479 */
4480 static int
4481 zfs_ioc_hold(zfs_cmd_t *zc)
4482 {
4483 boolean_t recursive = zc->zc_cookie;
4484 spa_t *spa;
4485 dsl_pool_t *dp;
4486 dsl_dataset_t *ds;
4487 int error;
4488 minor_t minor = 0;
4489
4490 if (snapshot_namecheck(zc->zc_value, NULL, NULL) != 0)
4491 return (EINVAL);
4492
4493 if (zc->zc_sendobj == 0) {
4494 return (dsl_dataset_user_hold(zc->zc_name, zc->zc_value,
4495 zc->zc_string, recursive, zc->zc_temphold,
4496 zc->zc_cleanup_fd));
4497 }
4498
4499 if (recursive)
4500 return (EINVAL);
4501
4502 error = spa_open(zc->zc_name, &spa, FTAG);
4503 if (error)
4504 return (error);
4505
4506 dp = spa_get_dsl(spa);
4507 rw_enter(&dp->dp_config_rwlock, RW_READER);
4508 error = dsl_dataset_hold_obj(dp, zc->zc_sendobj, FTAG, &ds);
4509 rw_exit(&dp->dp_config_rwlock);
4510 spa_close(spa, FTAG);
4511 if (error)
4512 return (error);
4513
4514 /*
4515 * Until we have a hold on this snapshot, it's possible that
4516 * zc_sendobj could've been destroyed and reused as part
4517 * of a later txg. Make sure we're looking at the right object.
4518 */
4519 if (zc->zc_createtxg != ds->ds_phys->ds_creation_txg) {
4520 dsl_dataset_rele(ds, FTAG);
4521 return (ENOENT);
4522 }
4523
4524 if (zc->zc_cleanup_fd != -1 && zc->zc_temphold) {
4525 error = zfs_onexit_fd_hold(zc->zc_cleanup_fd, &minor);
4526 if (error) {
4527 dsl_dataset_rele(ds, FTAG);
4528 return (error);
4529 }
4530 }
4531
4532 error = dsl_dataset_user_hold_for_send(ds, zc->zc_string,
4533 zc->zc_temphold);
4534 if (minor != 0) {
4535 if (error == 0) {
4536 dsl_register_onexit_hold_cleanup(ds, zc->zc_string,
4537 minor);
4538 }
4539 zfs_onexit_fd_rele(zc->zc_cleanup_fd);
4540 }
4541 dsl_dataset_rele(ds, FTAG);
4542
4543 return (error);
4544 }
4545
4546 /*
4547 * inputs:
4548 * zc_name name of dataset from which we're releasing a user hold
4549 * zc_value short name of snap
4550 * zc_string user-supplied tag for this hold
4551 * zc_cookie recursive flag
4552 *
4553 * outputs: none
4554 */
4555 static int
4556 zfs_ioc_release(zfs_cmd_t *zc)
4557 {
4558 boolean_t recursive = zc->zc_cookie;
4559
4560 if (snapshot_namecheck(zc->zc_value, NULL, NULL) != 0)
4561 return (EINVAL);
4562
4563 return (dsl_dataset_user_release(zc->zc_name, zc->zc_value,
4564 zc->zc_string, recursive));
4565 }
4566
4567 /*
4568 * inputs:
4569 * zc_name name of filesystem
4570 *
4571 * outputs:
4572 * zc_nvlist_src{_size} nvlist of snapshot holds
4573 */
4574 static int
4575 zfs_ioc_get_holds(zfs_cmd_t *zc)
4576 {
4577 nvlist_t *nvp;
4578 int error;
4579
4580 if ((error = dsl_dataset_get_holds(zc->zc_name, &nvp)) == 0) {
4581 error = put_nvlist(zc, nvp);
4582 nvlist_free(nvp);
4583 }
4584
4585 return (error);
4586 }
4587
4588 /*
4589 * inputs:
4590 * zc_guid flags (ZEVENT_NONBLOCK)
4591 *
4592 * outputs:
4593 * zc_nvlist_dst next nvlist event
4594 * zc_cookie dropped events since last get
4595 * zc_cleanup_fd cleanup-on-exit file descriptor
4596 */
4597 static int
4598 zfs_ioc_events_next(zfs_cmd_t *zc)
4599 {
4600 zfs_zevent_t *ze;
4601 nvlist_t *event = NULL;
4602 minor_t minor;
4603 uint64_t dropped = 0;
4604 int error;
4605
4606 error = zfs_zevent_fd_hold(zc->zc_cleanup_fd, &minor, &ze);
4607 if (error != 0)
4608 return (error);
4609
4610 do {
4611 error = zfs_zevent_next(ze, &event,
4612 &zc->zc_nvlist_dst_size, &dropped);
4613 if (event != NULL) {
4614 zc->zc_cookie = dropped;
4615 error = put_nvlist(zc, event);
4616 nvlist_free(event);
4617 }
4618
4619 if (zc->zc_guid & ZEVENT_NONBLOCK)
4620 break;
4621
4622 if ((error == 0) || (error != ENOENT))
4623 break;
4624
4625 error = zfs_zevent_wait(ze);
4626 if (error)
4627 break;
4628 } while (1);
4629
4630 zfs_zevent_fd_rele(zc->zc_cleanup_fd);
4631
4632 return (error);
4633 }
4634
4635 /*
4636 * outputs:
4637 * zc_cookie cleared events count
4638 */
4639 static int
4640 zfs_ioc_events_clear(zfs_cmd_t *zc)
4641 {
4642 int count;
4643
4644 zfs_zevent_drain_all(&count);
4645 zc->zc_cookie = count;
4646
4647 return 0;
4648 }
4649
4650 /*
4651 * inputs:
4652 * zc_name name of new filesystem or snapshot
4653 * zc_value full name of old snapshot
4654 *
4655 * outputs:
4656 * zc_cookie space in bytes
4657 * zc_objset_type compressed space in bytes
4658 * zc_perm_action uncompressed space in bytes
4659 */
4660 static int
4661 zfs_ioc_space_written(zfs_cmd_t *zc)
4662 {
4663 int error;
4664 dsl_dataset_t *new, *old;
4665
4666 error = dsl_dataset_hold(zc->zc_name, FTAG, &new);
4667 if (error != 0)
4668 return (error);
4669 error = dsl_dataset_hold(zc->zc_value, FTAG, &old);
4670 if (error != 0) {
4671 dsl_dataset_rele(new, FTAG);
4672 return (error);
4673 }
4674
4675 error = dsl_dataset_space_written(old, new, &zc->zc_cookie,
4676 &zc->zc_objset_type, &zc->zc_perm_action);
4677 dsl_dataset_rele(old, FTAG);
4678 dsl_dataset_rele(new, FTAG);
4679 return (error);
4680 }
4681
4682 /*
4683 * inputs:
4684 * zc_name full name of last snapshot
4685 * zc_value full name of first snapshot
4686 *
4687 * outputs:
4688 * zc_cookie space in bytes
4689 * zc_objset_type compressed space in bytes
4690 * zc_perm_action uncompressed space in bytes
4691 */
4692 static int
4693 zfs_ioc_space_snaps(zfs_cmd_t *zc)
4694 {
4695 int error;
4696 dsl_dataset_t *new, *old;
4697
4698 error = dsl_dataset_hold(zc->zc_name, FTAG, &new);
4699 if (error != 0)
4700 return (error);
4701 error = dsl_dataset_hold(zc->zc_value, FTAG, &old);
4702 if (error != 0) {
4703 dsl_dataset_rele(new, FTAG);
4704 return (error);
4705 }
4706
4707 error = dsl_dataset_space_wouldfree(old, new, &zc->zc_cookie,
4708 &zc->zc_objset_type, &zc->zc_perm_action);
4709 dsl_dataset_rele(old, FTAG);
4710 dsl_dataset_rele(new, FTAG);
4711 return (error);
4712 }
4713
4714 /*
4715 * pool create, destroy, and export don't log the history as part of
4716 * zfsdev_ioctl, but rather zfs_ioc_pool_create, and zfs_ioc_pool_export
4717 * do the logging of those commands.
4718 */
4719 static zfs_ioc_vec_t zfs_ioc_vec[] = {
4720 { zfs_ioc_pool_create, zfs_secpolicy_config, POOL_NAME, B_FALSE,
4721 POOL_CHECK_NONE },
4722 { zfs_ioc_pool_destroy, zfs_secpolicy_config, POOL_NAME, B_FALSE,
4723 POOL_CHECK_NONE },
4724 { zfs_ioc_pool_import, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4725 POOL_CHECK_NONE },
4726 { zfs_ioc_pool_export, zfs_secpolicy_config, POOL_NAME, B_FALSE,
4727 POOL_CHECK_NONE },
4728 { zfs_ioc_pool_configs, zfs_secpolicy_none, NO_NAME, B_FALSE,
4729 POOL_CHECK_NONE },
4730 { zfs_ioc_pool_stats, zfs_secpolicy_read, POOL_NAME, B_FALSE,
4731 POOL_CHECK_NONE },
4732 { zfs_ioc_pool_tryimport, zfs_secpolicy_config, NO_NAME, B_FALSE,
4733 POOL_CHECK_NONE },
4734 { zfs_ioc_pool_scan, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4735 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4736 { zfs_ioc_pool_freeze, zfs_secpolicy_config, NO_NAME, B_FALSE,
4737 POOL_CHECK_READONLY },
4738 { zfs_ioc_pool_upgrade, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4739 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4740 { zfs_ioc_pool_get_history, zfs_secpolicy_config, POOL_NAME, B_FALSE,
4741 POOL_CHECK_NONE },
4742 { zfs_ioc_vdev_add, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4743 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4744 { zfs_ioc_vdev_remove, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4745 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4746 { zfs_ioc_vdev_set_state, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4747 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4748 { zfs_ioc_vdev_attach, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4749 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4750 { zfs_ioc_vdev_detach, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4751 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4752 { zfs_ioc_vdev_setpath, zfs_secpolicy_config, POOL_NAME, B_FALSE,
4753 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4754 { zfs_ioc_vdev_setfru, zfs_secpolicy_config, POOL_NAME, B_FALSE,
4755 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4756 { zfs_ioc_objset_stats, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4757 POOL_CHECK_SUSPENDED },
4758 { zfs_ioc_objset_zplprops, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4759 POOL_CHECK_NONE },
4760 { zfs_ioc_dataset_list_next, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4761 POOL_CHECK_SUSPENDED },
4762 { zfs_ioc_snapshot_list_next, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4763 POOL_CHECK_SUSPENDED },
4764 { zfs_ioc_set_prop, zfs_secpolicy_none, DATASET_NAME, B_TRUE,
4765 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4766 { zfs_ioc_create_minor, zfs_secpolicy_config, DATASET_NAME, B_FALSE,
4767 POOL_CHECK_NONE },
4768 { zfs_ioc_remove_minor, zfs_secpolicy_config, DATASET_NAME, B_FALSE,
4769 POOL_CHECK_NONE },
4770 { zfs_ioc_create, zfs_secpolicy_create, DATASET_NAME, B_TRUE,
4771 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4772 { zfs_ioc_destroy, zfs_secpolicy_destroy, DATASET_NAME, B_TRUE,
4773 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4774 { zfs_ioc_rollback, zfs_secpolicy_rollback, DATASET_NAME, B_TRUE,
4775 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4776 { zfs_ioc_rename, zfs_secpolicy_rename, DATASET_NAME, B_TRUE,
4777 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4778 { zfs_ioc_recv, zfs_secpolicy_receive, DATASET_NAME, B_TRUE,
4779 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4780 { zfs_ioc_send, zfs_secpolicy_send, DATASET_NAME, B_FALSE,
4781 POOL_CHECK_NONE },
4782 { zfs_ioc_inject_fault, zfs_secpolicy_inject, NO_NAME, B_FALSE,
4783 POOL_CHECK_NONE },
4784 { zfs_ioc_clear_fault, zfs_secpolicy_inject, NO_NAME, B_FALSE,
4785 POOL_CHECK_NONE },
4786 { zfs_ioc_inject_list_next, zfs_secpolicy_inject, NO_NAME, B_FALSE,
4787 POOL_CHECK_NONE },
4788 { zfs_ioc_error_log, zfs_secpolicy_inject, POOL_NAME, B_FALSE,
4789 POOL_CHECK_NONE },
4790 { zfs_ioc_clear, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4791 POOL_CHECK_NONE },
4792 { zfs_ioc_promote, zfs_secpolicy_promote, DATASET_NAME, B_TRUE,
4793 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4794 { zfs_ioc_destroy_snaps_nvl, zfs_secpolicy_destroy_recursive,
4795 DATASET_NAME, B_TRUE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4796 { zfs_ioc_snapshot, zfs_secpolicy_snapshot, DATASET_NAME, B_TRUE,
4797 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4798 { zfs_ioc_dsobj_to_dsname, zfs_secpolicy_diff, POOL_NAME, B_FALSE,
4799 POOL_CHECK_NONE },
4800 { zfs_ioc_obj_to_path, zfs_secpolicy_diff, DATASET_NAME, B_FALSE,
4801 POOL_CHECK_SUSPENDED },
4802 { zfs_ioc_pool_set_props, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4803 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4804 { zfs_ioc_pool_get_props, zfs_secpolicy_read, POOL_NAME, B_FALSE,
4805 POOL_CHECK_NONE },
4806 { zfs_ioc_set_fsacl, zfs_secpolicy_fsacl, DATASET_NAME, B_TRUE,
4807 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4808 { zfs_ioc_get_fsacl, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4809 POOL_CHECK_NONE },
4810 { zfs_ioc_share, zfs_secpolicy_share, DATASET_NAME, B_FALSE,
4811 POOL_CHECK_NONE },
4812 { zfs_ioc_inherit_prop, zfs_secpolicy_inherit, DATASET_NAME, B_TRUE,
4813 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4814 { zfs_ioc_smb_acl, zfs_secpolicy_smb_acl, DATASET_NAME, B_FALSE,
4815 POOL_CHECK_NONE },
4816 { zfs_ioc_userspace_one, zfs_secpolicy_userspace_one, DATASET_NAME,
4817 B_FALSE, POOL_CHECK_NONE },
4818 { zfs_ioc_userspace_many, zfs_secpolicy_userspace_many, DATASET_NAME,
4819 B_FALSE, POOL_CHECK_NONE },
4820 { zfs_ioc_userspace_upgrade, zfs_secpolicy_userspace_upgrade,
4821 DATASET_NAME, B_FALSE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4822 { zfs_ioc_hold, zfs_secpolicy_hold, DATASET_NAME, B_TRUE,
4823 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4824 { zfs_ioc_release, zfs_secpolicy_release, DATASET_NAME, B_TRUE,
4825 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4826 { zfs_ioc_get_holds, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4827 POOL_CHECK_SUSPENDED },
4828 { zfs_ioc_objset_recvd_props, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4829 POOL_CHECK_NONE },
4830 { zfs_ioc_vdev_split, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4831 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4832 { zfs_ioc_next_obj, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4833 POOL_CHECK_NONE },
4834 { zfs_ioc_diff, zfs_secpolicy_diff, DATASET_NAME, B_FALSE,
4835 POOL_CHECK_NONE },
4836 { zfs_ioc_tmp_snapshot, zfs_secpolicy_tmp_snapshot, DATASET_NAME,
4837 B_FALSE, POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4838 { zfs_ioc_obj_to_stats, zfs_secpolicy_diff, DATASET_NAME, B_FALSE,
4839 POOL_CHECK_SUSPENDED },
4840 { zfs_ioc_events_next, zfs_secpolicy_config, NO_NAME, B_FALSE,
4841 POOL_CHECK_NONE },
4842 { zfs_ioc_events_clear, zfs_secpolicy_config, NO_NAME, B_FALSE,
4843 POOL_CHECK_NONE },
4844 { zfs_ioc_pool_reguid, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4845 POOL_CHECK_SUSPENDED | POOL_CHECK_READONLY },
4846 { zfs_ioc_space_written, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4847 POOL_CHECK_SUSPENDED },
4848 { zfs_ioc_space_snaps, zfs_secpolicy_read, DATASET_NAME, B_FALSE,
4849 POOL_CHECK_SUSPENDED },
4850 { zfs_ioc_pool_reopen, zfs_secpolicy_config, POOL_NAME, B_TRUE,
4851 POOL_CHECK_SUSPENDED },
4852 };
4853
4854 int
4855 pool_status_check(const char *name, zfs_ioc_namecheck_t type,
4856 zfs_ioc_poolcheck_t check)
4857 {
4858 spa_t *spa;
4859 int error;
4860
4861 ASSERT(type == POOL_NAME || type == DATASET_NAME);
4862
4863 if (check & POOL_CHECK_NONE)
4864 return (0);
4865
4866 error = spa_open(name, &spa, FTAG);
4867 if (error == 0) {
4868 if ((check & POOL_CHECK_SUSPENDED) && spa_suspended(spa))
4869 error = EAGAIN;
4870 else if ((check & POOL_CHECK_READONLY) && !spa_writeable(spa))
4871 error = EROFS;
4872 spa_close(spa, FTAG);
4873 }
4874 return (error);
4875 }
4876
4877 static void *
4878 zfsdev_get_state_impl(minor_t minor, enum zfsdev_state_type which)
4879 {
4880 zfsdev_state_t *zs;
4881
4882 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
4883
4884 for (zs = list_head(&zfsdev_state_list); zs != NULL;
4885 zs = list_next(&zfsdev_state_list, zs)) {
4886 if (zs->zs_minor == minor) {
4887 switch (which) {
4888 case ZST_ONEXIT: return (zs->zs_onexit);
4889 case ZST_ZEVENT: return (zs->zs_zevent);
4890 case ZST_ALL: return (zs);
4891 }
4892 }
4893 }
4894
4895 return NULL;
4896 }
4897
4898 void *
4899 zfsdev_get_state(minor_t minor, enum zfsdev_state_type which)
4900 {
4901 void *ptr;
4902
4903 mutex_enter(&zfsdev_state_lock);
4904 ptr = zfsdev_get_state_impl(minor, which);
4905 mutex_exit(&zfsdev_state_lock);
4906
4907 return ptr;
4908 }
4909
4910 minor_t
4911 zfsdev_getminor(struct file *filp)
4912 {
4913 ASSERT(filp != NULL);
4914 ASSERT(filp->private_data != NULL);
4915
4916 return (((zfsdev_state_t *)filp->private_data)->zs_minor);
4917 }
4918
4919 /*
4920 * Find a free minor number. The zfsdev_state_list is expected to
4921 * be short since it is only a list of currently open file handles.
4922 */
4923 minor_t
4924 zfsdev_minor_alloc(void)
4925 {
4926 static minor_t last_minor = 0;
4927 minor_t m;
4928
4929 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
4930
4931 for (m = last_minor + 1; m != last_minor; m++) {
4932 if (m > ZFSDEV_MAX_MINOR)
4933 m = 1;
4934 if (zfsdev_get_state_impl(m, ZST_ALL) == NULL) {
4935 last_minor = m;
4936 return (m);
4937 }
4938 }
4939
4940 return (0);
4941 }
4942
4943 static int
4944 zfsdev_state_init(struct file *filp)
4945 {
4946 zfsdev_state_t *zs;
4947 minor_t minor;
4948
4949 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
4950
4951 minor = zfsdev_minor_alloc();
4952 if (minor == 0)
4953 return (ENXIO);
4954
4955 zs = kmem_zalloc( sizeof(zfsdev_state_t), KM_SLEEP);
4956 if (zs == NULL)
4957 return (ENOMEM);
4958
4959 zs->zs_file = filp;
4960 zs->zs_minor = minor;
4961 filp->private_data = zs;
4962
4963 zfs_onexit_init((zfs_onexit_t **)&zs->zs_onexit);
4964 zfs_zevent_init((zfs_zevent_t **)&zs->zs_zevent);
4965
4966 list_insert_tail(&zfsdev_state_list, zs);
4967
4968 return (0);
4969 }
4970
4971 static int
4972 zfsdev_state_destroy(struct file *filp)
4973 {
4974 zfsdev_state_t *zs;
4975
4976 ASSERT(MUTEX_HELD(&zfsdev_state_lock));
4977 ASSERT(filp->private_data != NULL);
4978
4979 zs = filp->private_data;
4980 zfs_onexit_destroy(zs->zs_onexit);
4981 zfs_zevent_destroy(zs->zs_zevent);
4982
4983 list_remove(&zfsdev_state_list, zs);
4984 kmem_free(zs, sizeof(zfsdev_state_t));
4985
4986 return 0;
4987 }
4988
4989 static int
4990 zfsdev_open(struct inode *ino, struct file *filp)
4991 {
4992 int error;
4993
4994 mutex_enter(&zfsdev_state_lock);
4995 error = zfsdev_state_init(filp);
4996 mutex_exit(&zfsdev_state_lock);
4997
4998 return (-error);
4999 }
5000
5001 static int
5002 zfsdev_release(struct inode *ino, struct file *filp)
5003 {
5004 int error;
5005
5006 mutex_enter(&zfsdev_state_lock);
5007 error = zfsdev_state_destroy(filp);
5008 mutex_exit(&zfsdev_state_lock);
5009
5010 return (-error);
5011 }
5012
5013 static long
5014 zfsdev_ioctl(struct file *filp, unsigned cmd, unsigned long arg)
5015 {
5016 zfs_cmd_t *zc;
5017 uint_t vec;
5018 int error, rc, flag = 0;
5019
5020 vec = cmd - ZFS_IOC;
5021 if (vec >= sizeof (zfs_ioc_vec) / sizeof (zfs_ioc_vec[0]))
5022 return (-EINVAL);
5023
5024 zc = kmem_zalloc(sizeof (zfs_cmd_t), KM_SLEEP | KM_NODEBUG);
5025
5026 error = ddi_copyin((void *)arg, zc, sizeof (zfs_cmd_t), flag);
5027 if (error != 0)
5028 error = EFAULT;
5029
5030 if ((error == 0) && !(flag & FKIOCTL))
5031 error = zfs_ioc_vec[vec].zvec_secpolicy(zc, CRED());
5032
5033 /*
5034 * Ensure that all pool/dataset names are valid before we pass down to
5035 * the lower layers.
5036 */
5037 if (error == 0) {
5038 zc->zc_name[sizeof (zc->zc_name) - 1] = '\0';
5039 zc->zc_iflags = flag & FKIOCTL;
5040 switch (zfs_ioc_vec[vec].zvec_namecheck) {
5041 case POOL_NAME:
5042 if (pool_namecheck(zc->zc_name, NULL, NULL) != 0)
5043 error = EINVAL;
5044 error = pool_status_check(zc->zc_name,
5045 zfs_ioc_vec[vec].zvec_namecheck,
5046 zfs_ioc_vec[vec].zvec_pool_check);
5047 break;
5048
5049 case DATASET_NAME:
5050 if (dataset_namecheck(zc->zc_name, NULL, NULL) != 0)
5051 error = EINVAL;
5052 error = pool_status_check(zc->zc_name,
5053 zfs_ioc_vec[vec].zvec_namecheck,
5054 zfs_ioc_vec[vec].zvec_pool_check);
5055 break;
5056
5057 case NO_NAME:
5058 break;
5059 }
5060 }
5061
5062 if (error == 0)
5063 error = zfs_ioc_vec[vec].zvec_func(zc);
5064
5065 rc = ddi_copyout(zc, (void *)arg, sizeof (zfs_cmd_t), flag);
5066 if (error == 0) {
5067 if (rc != 0)
5068 error = EFAULT;
5069 if (zfs_ioc_vec[vec].zvec_his_log)
5070 zfs_log_history(zc);
5071 }
5072
5073 kmem_free(zc, sizeof (zfs_cmd_t));
5074 return (-error);
5075 }
5076
5077 #ifdef CONFIG_COMPAT
5078 static long
5079 zfsdev_compat_ioctl(struct file *filp, unsigned cmd, unsigned long arg)
5080 {
5081 return zfsdev_ioctl(filp, cmd, arg);
5082 }
5083 #else
5084 #define zfsdev_compat_ioctl NULL
5085 #endif
5086
5087 static const struct file_operations zfsdev_fops = {
5088 .open = zfsdev_open,
5089 .release = zfsdev_release,
5090 .unlocked_ioctl = zfsdev_ioctl,
5091 .compat_ioctl = zfsdev_compat_ioctl,
5092 .owner = THIS_MODULE,
5093 };
5094
5095 static struct miscdevice zfs_misc = {
5096 .minor = MISC_DYNAMIC_MINOR,
5097 .name = ZFS_DRIVER,
5098 .fops = &zfsdev_fops,
5099 };
5100
5101 static int
5102 zfs_attach(void)
5103 {
5104 int error;
5105
5106 mutex_init(&zfsdev_state_lock, NULL, MUTEX_DEFAULT, NULL);
5107 list_create(&zfsdev_state_list, sizeof (zfsdev_state_t),
5108 offsetof(zfsdev_state_t, zs_next));
5109
5110 error = misc_register(&zfs_misc);
5111 if (error) {
5112 printk(KERN_INFO "ZFS: misc_register() failed %d\n", error);
5113 return (error);
5114 }
5115
5116 return (0);
5117 }
5118
5119 static void
5120 zfs_detach(void)
5121 {
5122 int error;
5123
5124 error = misc_deregister(&zfs_misc);
5125 if (error)
5126 printk(KERN_INFO "ZFS: misc_deregister() failed %d\n", error);
5127
5128 mutex_destroy(&zfsdev_state_lock);
5129 list_destroy(&zfsdev_state_list);
5130 }
5131
5132 uint_t zfs_fsyncer_key;
5133 extern uint_t rrw_tsd_key;
5134
5135 #ifdef DEBUG
5136 #define ZFS_DEBUG_STR " (DEBUG mode)"
5137 #else
5138 #define ZFS_DEBUG_STR ""
5139 #endif
5140
5141 int
5142 _init(void)
5143 {
5144 int error;
5145
5146 spa_init(FREAD | FWRITE);
5147 zfs_init();
5148
5149 if ((error = zvol_init()) != 0)
5150 goto out1;
5151
5152 if ((error = zfs_attach()) != 0)
5153 goto out2;
5154
5155 tsd_create(&zfs_fsyncer_key, NULL);
5156 tsd_create(&rrw_tsd_key, NULL);
5157
5158 printk(KERN_NOTICE "ZFS: Loaded module v%s-%s%s, "
5159 "ZFS pool version %s, ZFS filesystem version %s\n",
5160 ZFS_META_VERSION, ZFS_META_RELEASE, ZFS_DEBUG_STR,
5161 SPA_VERSION_STRING, ZPL_VERSION_STRING);
5162
5163 return (0);
5164
5165 out2:
5166 (void) zvol_fini();
5167 out1:
5168 zfs_fini();
5169 spa_fini();
5170 printk(KERN_NOTICE "ZFS: Failed to Load ZFS Filesystem v%s-%s%s"
5171 ", rc = %d\n", ZFS_META_VERSION, ZFS_META_RELEASE,
5172 ZFS_DEBUG_STR, error);
5173
5174 return (error);
5175 }
5176
5177 int
5178 _fini(void)
5179 {
5180 zfs_detach();
5181 zvol_fini();
5182 zfs_fini();
5183 spa_fini();
5184
5185 tsd_destroy(&zfs_fsyncer_key);
5186 tsd_destroy(&rrw_tsd_key);
5187
5188 printk(KERN_NOTICE "ZFS: Unloaded module v%s-%s%s\n",
5189 ZFS_META_VERSION, ZFS_META_RELEASE, ZFS_DEBUG_STR);
5190
5191 return (0);
5192 }
5193
5194 #ifdef HAVE_SPL
5195 spl_module_init(_init);
5196 spl_module_exit(_fini);
5197
5198 MODULE_DESCRIPTION("ZFS");
5199 MODULE_AUTHOR(ZFS_META_AUTHOR);
5200 MODULE_LICENSE(ZFS_META_LICENSE);
5201 #endif /* HAVE_SPL */