Add `zfs allow` and `zfs unallow` support

[mirror_zfs.git] / module / zfs / zfs_ioctl.c
diff --git a/module/zfs/zfs_ioctl.c b/module/zfs/zfs_ioctl.c

index 39783e1091a41995d0352600876c47e6a284752f..c63af167af644a0745d8cb0036cbf10c1003de8f 100644 (file)
--- a/module/zfs/zfs_ioctl.c
+++ b/module/zfs/zfs_ioctl.c
@@ -24,12 +24,12 @@
   * Portions Copyright 2011 Martin Matuska
   * Portions Copyright 2012 Pawel Jakub Dawidek <pawel@dawidek.net>
   * Copyright (c) 2012, Joyent, Inc. All rights reserved.
- * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
- * Copyright (c) 2012, Joyent, Inc. All rights reserved.
- * Copyright (c) 201i3 by Delphix. All rights reserved.
+ * Copyright 2015 Nexenta Systems, Inc.  All rights reserved.
+ * Copyright (c) 2014, Joyent, Inc. All rights reserved.
+ * Copyright (c) 2011, 2015 by Delphix. All rights reserved.
   * Copyright (c) 2013 by Saso Kiselkov. All rights reserved.
   * Copyright (c) 2013 Steven Hartland. All rights reserved.
- * Copyright (c) 2014, Nexenta Systems, Inc. All rights reserved.
+ * Copyright (c) 2016 Actifio, Inc. All rights reserved.
   */
  
  /*
@@ -186,12 +186,19 @@
  #include <sys/zfeature.h>
  
  #include <linux/miscdevice.h>
+#include <linux/slab.h>
  
  #include "zfs_namecheck.h"
  #include "zfs_prop.h"
  #include "zfs_deleg.h"
  #include "zfs_comutil.h"
  
+/*
+ * Limit maximum nvlist size.  We don't want users passing in insane values
+ * for zc->zc_nvlist_src_size, since we will need to allocate that much memory.
+ */
+#define        MAX_NVLIST_SRC_SIZE     KMALLOC_MAX_SIZE
+
  kmutex_t zfsdev_state_lock;
  zfsdev_state_t *zfsdev_state_list;
  
@@ -247,55 +254,6 @@ static int zfs_fill_zplprops_root(uint64_t, nvlist_t *, nvlist_t *,
  int zfs_set_prop_nvlist(const char *, zprop_source_t, nvlist_t *, nvlist_t *);
  static int get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp);
  
-#if defined(HAVE_DECLARE_EVENT_CLASS)
-void
-__dprintf(const char *file, const char *func, int line, const char *fmt, ...)
-{
-       const char *newfile;
-       size_t size = 4096;
-       char *buf = kmem_alloc(size, KM_SLEEP);
-       char *nl;
-       va_list adx;
-
-       /*
-        * Get rid of annoying prefix to filename.
-        */
-       newfile = strrchr(file, '/');
-       if (newfile != NULL) {
-               newfile = newfile + 1; /* Get rid of leading / */
-       } else {
-               newfile = file;
-       }
-
-       va_start(adx, fmt);
-       (void) vsnprintf(buf, size, fmt, adx);
-       va_end(adx);
-
-       /*
-        * Get rid of trailing newline.
-        */
-       nl = strrchr(buf, '\n');
-       if (nl != NULL)
-               *nl = '\0';
-
-       /*
-        * To get this data enable the zfs__dprintf trace point as shown:
-        *
-        * # Enable zfs__dprintf tracepoint, clear the tracepoint ring buffer
-        * $ echo 1 > /sys/module/zfs/parameters/zfs_flags
-        * $ echo 1 > /sys/kernel/debug/tracing/events/zfs/enable
-        * $ echo 0 > /sys/kernel/debug/tracing/trace
-        *
-        * # Dump the ring buffer.
-        * $ cat /sys/kernel/debug/tracing/trace
-        */
-       DTRACE_PROBE4(zfs__dprintf,
-           char *, newfile, char *, func, int, line, char *, buf);
-
-       kmem_free(buf, size);
-}
-#endif /* HAVE_DECLARE_EVENT_CLASS */
-
  static void
  history_str_free(char *buf)
  {
@@ -641,12 +599,14 @@ zfs_secpolicy_setprop(const char *dsname, zfs_prop_t prop, nvpair_t *propval,
                 break;
  
         case ZFS_PROP_QUOTA:
+       case ZFS_PROP_FILESYSTEM_LIMIT:
+       case ZFS_PROP_SNAPSHOT_LIMIT:
                 if (!INGLOBALZONE(curproc)) {
                         uint64_t zoned;
                         char setpoint[MAXNAMELEN];
                         /*
                          * Unprivileged users are allowed to modify the
-                        * quota on things *under* (ie. contained by)
+                        * limit on things *under* (ie. contained by)
                          * the thing they own.
                          */
                         if (dsl_prop_get_integer(dsname, "zoned", &zoned,
@@ -944,7 +904,7 @@ zfs_secpolicy_promote(zfs_cmd_t *zc, nvlist_t *innvl, cred_t *cr)
                 dd = clone->ds_dir;
  
                 error = dsl_dataset_hold_obj(dd->dd_pool,
-                   dd->dd_phys->dd_origin_obj, FTAG, &origin);
+                   dsl_dir_phys(dd)->dd_origin_obj, FTAG, &origin);
                 if (error != 0) {
                         dsl_dataset_rele(clone, FTAG);
                         dsl_pool_rele(dp, FTAG);
@@ -1332,7 +1292,7 @@ get_nvlist(uint64_t nvl, uint64_t size, int iflag, nvlist_t **nvp)
         if ((error = ddi_copyin((void *)(uintptr_t)nvl, packed, size,
             iflag)) != 0) {
                 vmem_free(packed, size);
-               return (error);
+               return (SET_ERROR(EFAULT));
         }
  
         if ((error = nvlist_unpack(packed, size, &list, 0)) != 0) {
@@ -1447,9 +1407,9 @@ zfs_sb_hold(const char *name, void *tag, zfs_sb_t **zsbp, boolean_t writer)
         int error = 0;
  
         if (get_zfs_sb(name, zsbp) != 0)
-               error = zfs_sb_create(name, zsbp);
+               error = zfs_sb_create(name, NULL, zsbp);
         if (error == 0) {
-               rrw_enter(&(*zsbp)->z_teardown_lock, (writer) ? RW_WRITER :
+               rrm_enter(&(*zsbp)->z_teardown_lock, (writer) ? RW_WRITER :
                     RW_READER, tag);
                 if ((*zsbp)->z_unmounted) {
                         /*
@@ -1457,7 +1417,7 @@ zfs_sb_hold(const char *name, void *tag, zfs_sb_t **zsbp, boolean_t writer)
                          * thread should be just about to disassociate the
                          * objset from the zsb.
                          */
-                       rrw_exit(&(*zsbp)->z_teardown_lock, tag);
+                       rrm_exit(&(*zsbp)->z_teardown_lock, tag);
                         return (SET_ERROR(EBUSY));
                 }
         }
@@ -1467,7 +1427,7 @@ zfs_sb_hold(const char *name, void *tag, zfs_sb_t **zsbp, boolean_t writer)
  static void
  zfs_sb_rele(zfs_sb_t *zsb, void *tag)
  {
-       rrw_exit(&zsb->z_teardown_lock, tag);
+       rrm_exit(&zsb->z_teardown_lock, tag);
  
         if (zsb->z_sb) {
                 deactivate_super(zsb->z_sb);
@@ -1547,8 +1507,7 @@ zfs_ioc_pool_destroy(zfs_cmd_t *zc)
         int error;
         zfs_log_history(zc);
         error = spa_destroy(zc->zc_name);
-       if (error == 0)
-               zvol_remove_minors(zc->zc_name);
+
         return (error);
  }
  
@@ -1584,9 +1543,7 @@ zfs_ioc_pool_import(zfs_cmd_t *zc)
         }
  
         nvlist_free(config);
-
-       if (props)
-               nvlist_free(props);
+       nvlist_free(props);
  
         return (error);
  }
@@ -1600,8 +1557,7 @@ zfs_ioc_pool_export(zfs_cmd_t *zc)
  
         zfs_log_history(zc);
         error = spa_export(zc->zc_name, NULL, force, hardforce);
-       if (error == 0)
-               zvol_remove_minors(zc->zc_name);
+
         return (error);
  }
  
@@ -2390,7 +2346,7 @@ zfs_prop_set_special(const char *dsname, zprop_source_t source,
         const char *propname = nvpair_name(pair);
         zfs_prop_t prop = zfs_name_to_prop(propname);
         uint64_t intval;
-       int err;
+       int err = -1;
  
         if (prop == ZPROP_INVAL) {
                 if (zfs_prop_userquota(propname))
@@ -2417,6 +2373,21 @@ zfs_prop_set_special(const char *dsname, zprop_source_t source,
         case ZFS_PROP_REFQUOTA:
                 err = dsl_dataset_set_refquota(dsname, source, intval);
                 break;
+       case ZFS_PROP_FILESYSTEM_LIMIT:
+       case ZFS_PROP_SNAPSHOT_LIMIT:
+               if (intval == UINT64_MAX) {
+                       /* clearing the limit, just do it */
+                       err = 0;
+               } else {
+                       err = dsl_dir_activate_fs_ss_limit(dsname);
+               }
+               /*
+                * Set err to -1 to force the zfs_set_prop_nvlist code down the
+                * default path to set the value in the nvlist.
+                */
+               if (err == 0)
+                       err = -1;
+               break;
         case ZFS_PROP_RESERVATION:
                 err = dsl_dir_set_reservation(dsname, source, intval);
                 break;
@@ -2427,7 +2398,7 @@ zfs_prop_set_special(const char *dsname, zprop_source_t source,
                 err = zvol_set_volsize(dsname, intval);
                 break;
         case ZFS_PROP_SNAPDEV:
-               err = zvol_set_snapdev(dsname, intval);
+               err = zvol_set_snapdev(dsname, source, intval);
                 break;
         case ZFS_PROP_VERSION:
         {
@@ -3184,7 +3155,7 @@ zfs_ioc_create(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
                         volblocksize = zfs_prop_default_numeric(
                             ZFS_PROP_VOLBLOCKSIZE);
  
-               if ((error = zvol_check_volblocksize(
+               if ((error = zvol_check_volblocksize(fsname,
                     volblocksize)) != 0 ||
                     (error = zvol_check_volsize(volsize,
                     volblocksize)) != 0)
@@ -3218,15 +3189,26 @@ zfs_ioc_create(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
         if (error == 0) {
                 error = zfs_set_prop_nvlist(fsname, ZPROP_SRC_LOCAL,
                     nvprops, outnvl);
-               if (error != 0)
-                       (void) dsl_destroy_head(fsname);
-       }
-
-#ifdef _KERNEL
-       if (error == 0 && type == DMU_OST_ZVOL)
-               zvol_create_minors(fsname);
-#endif
+               if (error != 0) {
+                       spa_t *spa;
+                       int error2;
  
+                       /*
+                        * Volumes will return EBUSY and cannot be destroyed
+                        * until all asynchronous minor handling has completed.
+                        * Wait for the spa_zvol_taskq to drain then retry.
+                        */
+                       error2 = dsl_destroy_head(fsname);
+                       while ((error2 == EBUSY) && (type == DMU_OST_ZVOL)) {
+                               error2 = spa_open(fsname, &spa, FTAG);
+                               if (error2 == 0) {
+                                       taskq_wait(spa->spa_zvol_taskq);
+                                       spa_close(spa, FTAG);
+                               }
+                               error2 = dsl_destroy_head(fsname);
+                       }
+               }
+       }
         return (error);
  }
  
@@ -3269,12 +3251,6 @@ zfs_ioc_clone(const char *fsname, nvlist_t *innvl, nvlist_t *outnvl)
                 if (error != 0)
                         (void) dsl_destroy_head(fsname);
         }
-
-#ifdef _KERNEL
-       if (error == 0)
-               zvol_create_minors(fsname);
-#endif
-
         return (error);
  }
  
@@ -3337,11 +3313,6 @@ zfs_ioc_snapshot(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
  
         error = dsl_dataset_snapshot(snaps, props, outnvl);
  
-#ifdef _KERNEL
-       if (error == 0)
-               zvol_create_minors(poolname);
-#endif
-
         return (error);
  }
  
@@ -3393,37 +3364,20 @@ zfs_ioc_log_history(const char *unused, nvlist_t *innvl, nvlist_t *outnvl)
   * This function is best-effort.  Callers must deal gracefully if it
   * remains mounted (or is remounted after this call).
   *
- * XXX: This function should detect a failure to unmount a snapdir of a dataset
- * and return the appropriate error code when it is mounted. Its Illumos and
- * FreeBSD counterparts do this. We do not do this on Linux because there is no
- * clear way to access the mount information that FreeBSD and Illumos use to
- * distinguish between things with mounted snapshot directories, and things
- * without mounted snapshot directories, which include zvols. Returning a
- * failure for the latter causes `zfs destroy` to fail on zvol snapshots.
+ * Returns 0 if the argument is not a snapshot, or it is not currently a
+ * filesystem, or we were able to unmount it.  Returns error code otherwise.
   */
  int
  zfs_unmount_snap(const char *snapname)
  {
-       zfs_sb_t *zsb = NULL;
-       char *dsname;
-       char *fullname;
-       char *ptr;
+       int err;
  
-       if ((ptr = strchr(snapname, '@')) == NULL)
+       if (strchr(snapname, '@') == NULL)
                 return (0);
  
-       dsname = kmem_alloc(ptr - snapname + 1, KM_SLEEP);
-       strlcpy(dsname, snapname, ptr - snapname + 1);
-       fullname = strdup(snapname);
-
-       if (zfs_sb_hold(dsname, FTAG, &zsb, B_FALSE) == 0) {
-               ASSERT(!dsl_pool_config_held(dmu_objset_pool(zsb->z_os)));
-               (void) zfsctl_unmount_snapshot(zsb, fullname, MNT_FORCE);
-               zfs_sb_rele(zsb, FTAG);
-       }
-
-       kmem_free(dsname, ptr - snapname + 1);
-       strfree(fullname);
+       err = zfsctl_snapshot_unmount((char *)snapname, MNT_FORCE);
+       if (err != 0 && err != ENOENT)
+               return (SET_ERROR(err));
  
         return (0);
  }
@@ -3484,7 +3438,6 @@ zfs_ioc_destroy_snaps(const char *poolname, nvlist_t *innvl, nvlist_t *outnvl)
         for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL;
             pair = nvlist_next_nvpair(snaps, pair)) {
                 (void) zfs_unmount_snap(nvpair_name(pair));
-               (void) zvol_remove_minor(nvpair_name(pair));
         }
  
         return (dsl_destroy_snapshots_nvl(snaps, defer, outnvl));
@@ -3610,8 +3563,7 @@ zfs_ioc_destroy(zfs_cmd_t *zc)
                 err = dsl_destroy_snapshot(zc->zc_name, zc->zc_defer_destroy);
         else
                 err = dsl_destroy_head(zc->zc_name);
-       if (zc->zc_objset_type == DMU_OST_ZVOL && err == 0)
-               (void) zvol_remove_minor(zc->zc_name);
+
         return (err);
  }
  
@@ -3773,8 +3725,7 @@ zfs_check_settable(const char *dsname, nvpair_t *pair, cred_t *cr)
                  * the SPA supports it. We ignore any errors here since
                  * we'll catch them later.
                  */
-               if (nvpair_type(pair) == DATA_TYPE_UINT64 &&
-                   nvpair_value_uint64(pair, &intval) == 0) {
+               if (nvpair_value_uint64(pair, &intval) == 0) {
                         if (intval >= ZIO_COMPRESS_GZIP_1 &&
                             intval <= ZIO_COMPRESS_GZIP_9 &&
                             zfs_earlier_version(dsname,
@@ -3825,6 +3776,43 @@ zfs_check_settable(const char *dsname, nvpair_t *pair, cred_t *cr)
                         return (SET_ERROR(ENOTSUP));
                 break;
  
+       case ZFS_PROP_VOLBLOCKSIZE:
+       case ZFS_PROP_RECORDSIZE:
+               /* Record sizes above 128k need the feature to be enabled */
+               if (nvpair_value_uint64(pair, &intval) == 0 &&
+                   intval > SPA_OLD_MAXBLOCKSIZE) {
+                       spa_t *spa;
+
+                       /*
+                        * If this is a bootable dataset then
+                        * the we don't allow large (>128K) blocks,
+                        * because GRUB doesn't support them.
+                        */
+                       if (zfs_is_bootfs(dsname) &&
+                           intval > SPA_OLD_MAXBLOCKSIZE) {
+                               return (SET_ERROR(ERANGE));
+                       }
+
+                       /*
+                        * We don't allow setting the property above 1MB,
+                        * unless the tunable has been changed.
+                        */
+                       if (intval > zfs_max_recordsize ||
+                           intval > SPA_MAXBLOCKSIZE)
+                               return (SET_ERROR(ERANGE));
+
+                       if ((err = spa_open(dsname, &spa, FTAG)) != 0)
+                               return (err);
+
+                       if (!spa_feature_is_enabled(spa,
+                           SPA_FEATURE_LARGE_BLOCKS)) {
+                               spa_close(spa, FTAG);
+                               return (SET_ERROR(ENOTSUP));
+                       }
+                       spa_close(spa, FTAG);
+               }
+               break;
+
         case ZFS_PROP_SHARESMB:
                 if (zpl_earlier_version(dsname, ZPL_VERSION_FUID))
                         return (SET_ERROR(ENOTSUP));
@@ -4141,11 +4129,6 @@ zfs_ioc_recv(zfs_cmd_t *zc)
         }
  #endif
  
-#ifdef _KERNEL
-       if (error == 0)
-               zvol_create_minors(tofs);
-#endif
-
         /*
          * On error, restore the original props.
          */
@@ -4204,7 +4187,7 @@ out:
   * zc_fromobj  objsetid of incremental fromsnap (may be zero)
   * zc_guid     if set, estimate size of stream only.  zc_cookie is ignored.
   *             output size in zc_objset_type.
- * zc_flags    if =1, WRITE_EMBEDDED records are permitted
+ * zc_flags    lzc_send_flags
   *
   * outputs:
   * zc_objset_type      estimated size, if zc_guid is set
@@ -4216,6 +4199,7 @@ zfs_ioc_send(zfs_cmd_t *zc)
         offset_t off;
         boolean_t estimate = (zc->zc_guid != 0);
         boolean_t embedok = (zc->zc_flags & 0x1);
+       boolean_t large_block_ok = (zc->zc_flags & 0x2);
  
         if (zc->zc_obj != 0) {
                 dsl_pool_t *dp;
@@ -4232,7 +4216,8 @@ zfs_ioc_send(zfs_cmd_t *zc)
                 }
  
                 if (dsl_dir_is_clone(tosnap->ds_dir))
-                       zc->zc_fromobj = tosnap->ds_dir->dd_phys->dd_origin_obj;
+                       zc->zc_fromobj =
+                           dsl_dir_phys(tosnap->ds_dir)->dd_origin_obj;
                 dsl_dataset_rele(tosnap, FTAG);
                 dsl_pool_rele(dp, FTAG);
         }
@@ -4276,7 +4261,8 @@ zfs_ioc_send(zfs_cmd_t *zc)
  
                 off = fp->f_offset;
                 error = dmu_send_obj(zc->zc_name, zc->zc_sendobj,
-                   zc->zc_fromobj, embedok, zc->zc_cookie, fp->f_vnode, &off);
+                   zc->zc_fromobj, embedok, large_block_ok,
+                   zc->zc_cookie, fp->f_vnode, &off);
  
                 if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
                         fp->f_offset = off;
@@ -4669,8 +4655,7 @@ zfs_ioc_next_obj(zfs_cmd_t *zc)
         if (error != 0)
                 return (error);
  
-       error = dmu_object_next(os, &zc->zc_obj, B_FALSE,
-           os->os_dsl_dataset->ds_phys->ds_prev_snap_txg);
+       error = dmu_object_next(os, &zc->zc_obj, B_FALSE, 0);
  
         dmu_objset_rele(os, FTAG);
         return (error);
@@ -4859,6 +4844,7 @@ zfs_ioc_smb_acl(zfs_cmd_t *zc)
                 if ((error = get_nvlist(zc->zc_nvlist_src,
                     zc->zc_nvlist_src_size, zc->zc_iflags, &nvlist)) != 0) {
                         VN_RELE(vp);
+                       VN_RELE(ZTOV(sharedir));
                         ZFS_EXIT(zsb);
                         return (error);
                 }
@@ -4911,6 +4897,7 @@ zfs_ioc_smb_acl(zfs_cmd_t *zc)
  static int
  zfs_ioc_hold(const char *pool, nvlist_t *args, nvlist_t *errlist)
  {
+       nvpair_t *pair;
         nvlist_t *holds;
         int cleanup_fd = -1;
         int error;
@@ -4920,6 +4907,19 @@ zfs_ioc_hold(const char *pool, nvlist_t *args, nvlist_t *errlist)
         if (error != 0)
                 return (SET_ERROR(EINVAL));
  
+       /* make sure the user didn't pass us any invalid (empty) tags */
+       for (pair = nvlist_next_nvpair(holds, NULL); pair != NULL;
+           pair = nvlist_next_nvpair(holds, pair)) {
+               char *htag;
+
+               error = nvpair_value_string(pair, &htag);
+               if (error != 0)
+                       return (SET_ERROR(error));
+
+               if (strlen(htag) == 0)
+                       return (SET_ERROR(EINVAL));
+       }
+
         if (nvlist_lookup_int32(args, "cleanup_fd", &cleanup_fd) == 0) {
                 error = zfs_onexit_fd_hold(cleanup_fd, &minor);
                 if (error != 0)
@@ -5117,11 +5117,19 @@ zfs_ioc_space_snaps(const char *lastsnap, nvlist_t *innvl, nvlist_t *outnvl)
                 return (error);
  
         error = dsl_dataset_hold(dp, lastsnap, FTAG, &new);
+       if (error == 0 && !new->ds_is_snapshot) {
+               dsl_dataset_rele(new, FTAG);
+               error = SET_ERROR(EINVAL);
+       }
         if (error != 0) {
                 dsl_pool_rele(dp, FTAG);
                 return (error);
         }
         error = dsl_dataset_hold(dp, firstsnap, FTAG, &old);
+       if (error == 0 && !old->ds_is_snapshot) {
+               dsl_dataset_rele(old, FTAG);
+               error = SET_ERROR(EINVAL);
+       }
         if (error != 0) {
                 dsl_dataset_rele(new, FTAG);
                 dsl_pool_rele(dp, FTAG);
@@ -5142,6 +5150,8 @@ zfs_ioc_space_snaps(const char *lastsnap, nvlist_t *innvl, nvlist_t *outnvl)
   * innvl: {
   *     "fd" -> file descriptor to write stream to (int32)
   *     (optional) "fromsnap" -> full snap name to send an incremental from
+ *     (optional) "largeblockok" -> (value ignored)
+ *         indicates that blocks > 128KB are permitted
   *     (optional) "embedok" -> (value ignored)
   *         presence indicates DRR_WRITE_EMBEDDED records are permitted
   * }
@@ -5157,6 +5167,7 @@ zfs_ioc_send_new(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
         char *fromname = NULL;
         int fd;
         file_t *fp;
+       boolean_t largeblockok;
         boolean_t embedok;
  
         error = nvlist_lookup_int32(innvl, "fd", &fd);
@@ -5165,13 +5176,15 @@ zfs_ioc_send_new(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
  
         (void) nvlist_lookup_string(innvl, "fromsnap", &fromname);
  
+       largeblockok = nvlist_exists(innvl, "largeblockok");
         embedok = nvlist_exists(innvl, "embedok");
  
         if ((fp = getf(fd)) == NULL)
                 return (SET_ERROR(EBADF));
  
         off = fp->f_offset;
-       error = dmu_send(snapname, fromname, embedok, fd, fp->f_vnode, &off);
+       error = dmu_send(snapname, fromname, embedok, largeblockok,
+           fd, fp->f_vnode, &off);
  
         if (VOP_SEEK(fp->f_vnode, fp->f_offset, &off, NULL) == 0)
                 fp->f_offset = off;
@@ -5185,7 +5198,8 @@ zfs_ioc_send_new(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
   * of bytes that will be written to the fd supplied to zfs_ioc_send_new().
   *
   * innvl: {
- *     (optional) "fromsnap" -> full snap name to send an incremental from
+ *     (optional) "from" -> full snap or bookmark name to send an incremental
+ *                          from
   * }
   *
   * outnvl: {
@@ -5196,7 +5210,6 @@ static int
  zfs_ioc_send_space(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
  {
         dsl_pool_t *dp;
-       dsl_dataset_t *fromsnap = NULL;
         dsl_dataset_t *tosnap;
         int error;
         char *fromname;
@@ -5212,27 +5225,55 @@ zfs_ioc_send_space(const char *snapname, nvlist_t *innvl, nvlist_t *outnvl)
                 return (error);
         }
  
-       error = nvlist_lookup_string(innvl, "fromsnap", &fromname);
+       error = nvlist_lookup_string(innvl, "from", &fromname);
         if (error == 0) {
-               error = dsl_dataset_hold(dp, fromname, FTAG, &fromsnap);
-               if (error != 0) {
-                       dsl_dataset_rele(tosnap, FTAG);
-                       dsl_pool_rele(dp, FTAG);
-                       return (error);
+               if (strchr(fromname, '@') != NULL) {
+                       /*
+                        * If from is a snapshot, hold it and use the more
+                        * efficient dmu_send_estimate to estimate send space
+                        * size using deadlists.
+                        */
+                       dsl_dataset_t *fromsnap;
+                       error = dsl_dataset_hold(dp, fromname, FTAG, &fromsnap);
+                       if (error != 0)
+                               goto out;
+                       error = dmu_send_estimate(tosnap, fromsnap, &space);
+                       dsl_dataset_rele(fromsnap, FTAG);
+               } else if (strchr(fromname, '#') != NULL) {
+                       /*
+                        * If from is a bookmark, fetch the creation TXG of the
+                        * snapshot it was created from and use that to find
+                        * blocks that were born after it.
+                        */
+                       zfs_bookmark_phys_t frombm;
+
+                       error = dsl_bookmark_lookup(dp, fromname, tosnap,
+                           &frombm);
+                       if (error != 0)
+                               goto out;
+                       error = dmu_send_estimate_from_txg(tosnap,
+                           frombm.zbm_creation_txg, &space);
+               } else {
+                       /*
+                        * from is not properly formatted as a snapshot or
+                        * bookmark
+                        */
+                       error = SET_ERROR(EINVAL);
+                       goto out;
                 }
+       } else {
+               // If estimating the size of a full send, use dmu_send_estimate
+               error = dmu_send_estimate(tosnap, NULL, &space);
         }
  
-       error = dmu_send_estimate(tosnap, fromsnap, &space);
         fnvlist_add_uint64(outnvl, "space", space);
  
-       if (fromsnap != NULL)
-               dsl_dataset_rele(fromsnap, FTAG);
+out:
         dsl_dataset_rele(tosnap, FTAG);
         dsl_pool_rele(dp, FTAG);
         return (error);
  }
  
-
  static zfs_ioc_vec_t zfs_ioc_vec[ZFS_IOC_LAST - ZFS_IOC_FIRST];
  
  static void
@@ -5600,13 +5641,35 @@ zfsdev_get_state(minor_t minor, enum zfsdev_state_type which)
         return (ptr);
  }
  
-minor_t
-zfsdev_getminor(struct file *filp)
+int
+zfsdev_getminor(struct file *filp, minor_t *minorp)
  {
+       zfsdev_state_t *zs, *fpd;
+
         ASSERT(filp != NULL);
-       ASSERT(filp->private_data != NULL);
+       ASSERT(!MUTEX_HELD(&zfsdev_state_lock));
+
+       fpd = filp->private_data;
+       if (fpd == NULL)
+               return (EBADF);
+
+       mutex_enter(&zfsdev_state_lock);
  
-       return (((zfsdev_state_t *)filp->private_data)->zs_minor);
+       for (zs = zfsdev_state_list; zs != NULL; zs = zs->zs_next) {
+
+               if (zs->zs_minor == -1)
+                       continue;
+
+               if (fpd == zs) {
+                       *minorp = fpd->zs_minor;
+                       mutex_exit(&zfsdev_state_lock);
+                       return (0);
+               }
+       }
+
+       mutex_exit(&zfsdev_state_lock);
+
+       return (EBADF);
  }
  
  /*
@@ -5756,7 +5819,23 @@ zfsdev_ioctl(struct file *filp, unsigned cmd, unsigned long arg)
         }
  
         zc->zc_iflags = flag & FKIOCTL;
-       if (zc->zc_nvlist_src_size != 0) {
+       if (zc->zc_nvlist_src_size > MAX_NVLIST_SRC_SIZE) {
+               /*
+                * Make sure the user doesn't pass in an insane value for
+                * zc_nvlist_src_size.  We have to check, since we will end
+                * up allocating that much memory inside of get_nvlist().  This
+                * prevents a nefarious user from allocating tons of kernel
+                * memory.
+                *
+                * Also, we return EINVAL instead of ENOMEM here.  The reason
+                * being that returning ENOMEM from an ioctl() has a special
+                * connotation; that the user's size value is too small and
+                * needs to be expanded to hold the nvlist.  See
+                * zcmd_expand_dst_nvlist() for details.
+                */
+               error = SET_ERROR(EINVAL);      /* User's size too big */
+
+       } else if (zc->zc_nvlist_src_size != 0) {
                 error = get_nvlist(zc->zc_nvlist_src, zc->zc_nvlist_src_size,
                     zc->zc_iflags, &innvl);
                 if (error != 0)
@@ -5790,8 +5869,11 @@ zfsdev_ioctl(struct file *filp, unsigned cmd, unsigned long arg)
         }
  
  
-       if (error == 0 && !(flag & FKIOCTL))
+       if (error == 0 && !(flag & FKIOCTL)) {
+               cookie = spl_fstrans_mark();
                 error = vec->zvec_secpolicy(zc, innvl, CRED());
+               spl_fstrans_unmark(cookie);
+       }
  
         if (error != 0)
                 goto out;
@@ -5927,13 +6009,9 @@ zfs_attach(void)
  static void
  zfs_detach(void)
  {
-       int error;
         zfsdev_state_t *zs, *zsprev = NULL;
  
-       error = misc_deregister(&zfs_misc);
-       if (error != 0)
-               printk(KERN_INFO "ZFS: misc_deregister() failed %d\n", error);
-
+       misc_deregister(&zfs_misc);
         mutex_destroy(&zfsdev_state_lock);
  
         for (zs = zfsdev_state_list; zs != NULL; zs = zs->zs_next) {
@@ -5963,23 +6041,23 @@ _init(void)
  {
         int error;
  
-       error = vn_set_pwd("/");
+       error = -vn_set_pwd("/");
         if (error) {
                 printk(KERN_NOTICE
                     "ZFS: Warning unable to set pwd to '/': %d\n", error);
                 return (error);
         }
  
+       if ((error = -zvol_init()) != 0)
+               return (error);
+
         spa_init(FREAD | FWRITE);
         zfs_init();
  
-       if ((error = zvol_init()) != 0)
-               goto out1;
-
         zfs_ioctl_init();
  
         if ((error = zfs_attach()) != 0)
-               goto out2;
+               goto out;
  
         tsd_create(&zfs_fsyncer_key, NULL);
         tsd_create(&rrw_tsd_key, rrw_tsd_destroy);
@@ -5995,11 +6073,10 @@ _init(void)
  
         return (0);
  
-out2:
-       (void) zvol_fini();
-out1:
+out:
         zfs_fini();
         spa_fini();
+       (void) zvol_fini();
         printk(KERN_NOTICE "ZFS: Failed to Load ZFS Filesystem v%s-%s%s"
             ", rc = %d\n", ZFS_META_VERSION, ZFS_META_RELEASE,
             ZFS_DEBUG_STR, error);
@@ -6011,9 +6088,9 @@ static void __exit
  _fini(void)
  {
         zfs_detach();
-       zvol_fini();
         zfs_fini();
         spa_fini();
+       zvol_fini();
  
         tsd_destroy(&zfs_fsyncer_key);
         tsd_destroy(&rrw_tsd_key);