Add 'zpool split' coverage to the ZFS Test Suite

[mirror_zfs.git] / lib / libzfs / libzfs_pool.c
diff --git a/lib/libzfs/libzfs_pool.c b/lib/libzfs/libzfs_pool.c

index a5d2c28affe4f4a05bc615e85a891d4bc63c46d2..3fe0b9e0ee44c6968e1c0be1bc286eca1d6c2327 100644 (file)
--- a/lib/libzfs/libzfs_pool.c
+++ b/lib/libzfs/libzfs_pool.c
@@ -20,9 +20,12 @@
   */
  
  /*
+ * Copyright 2015 Nexenta Systems, Inc.  All rights reserved.
   * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
- * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
- * Copyright (c) 2013 by Delphix. All rights reserved.
+ * Copyright (c) 2011, 2014 by Delphix. All rights reserved.
+ * Copyright 2016 Igor Kozhukhov <ikozhukhov@gmail.com>
+ * Copyright (c) 2017 Datto Inc.
+ * Copyright (c) 2017 Open-E, Inc. All Rights Reserved.
   */
  
  #include <ctype.h>
@@ -38,6 +41,7 @@
  #include <zone.h>
  #include <sys/stat.h>
  #include <sys/efi_partition.h>
+#include <sys/systeminfo.h>
  #include <sys/vtoc.h>
  #include <sys/zfs_ioctl.h>
  #include <dlfcn.h>
@@ -49,6 +53,7 @@
  #include "zfeature_common.h"
  
  static int read_efi_label(nvlist_t *config, diskaddr_t *sb);
+static boolean_t zpool_vdev_is_interior(const char *name);
  
  typedef struct prop_flags {
         int create:1;   /* Validate property on creation */
@@ -108,7 +113,7 @@ zpool_props_refresh(zpool_handle_t *zhp)
         return (0);
  }
  
-static char *
+static const char *
  zpool_get_prop_string(zpool_handle_t *zhp, zpool_prop_t prop,
      zprop_source_t *src)
  {
@@ -176,12 +181,10 @@ zpool_get_prop_int(zpool_handle_t *zhp, zpool_prop_t prop, zprop_source_t *src)
  /*
   * Map VDEV STATE to printed strings.
   */
-char *
+const char *
  zpool_state_to_name(vdev_state_t state, vdev_aux_t aux)
  {
         switch (state) {
-       default:
-               break;
         case VDEV_STATE_CLOSED:
         case VDEV_STATE_OFFLINE:
                 return (gettext("OFFLINE"));
@@ -200,6 +203,9 @@ zpool_state_to_name(vdev_state_t state, vdev_aux_t aux)
                 return (gettext("DEGRADED"));
         case VDEV_STATE_HEALTHY:
                 return (gettext("ONLINE"));
+
+       default:
+               break;
         }
  
         return (gettext("UNKNOWN"));
@@ -235,22 +241,12 @@ zpool_pool_state_to_name(pool_state_t state)
         return (gettext("UNKNOWN"));
  }
  
-/*
- * API compatibility wrapper around zpool_get_prop_literal
- */
-int
-zpool_get_prop(zpool_handle_t *zhp, zpool_prop_t prop, char *buf, size_t len,
-    zprop_source_t *srctype)
-{
-       return (zpool_get_prop_literal(zhp, prop, buf, len, srctype, B_FALSE));
-}
-
  /*
   * Get a zpool property value for 'prop' and return the value in
   * a pre-allocated buffer.
   */
  int
-zpool_get_prop_literal(zpool_handle_t *zhp, zpool_prop_t prop, char *buf,
+zpool_get_prop(zpool_handle_t *zhp, zpool_prop_t prop, char *buf,
      size_t len, zprop_source_t *srctype, boolean_t literal)
  {
         uint64_t intval;
@@ -283,9 +279,7 @@ zpool_get_prop_literal(zpool_handle_t *zhp, zpool_prop_t prop, char *buf,
                                 (void) strlcpy(buf,
                                     zpool_get_prop_string(zhp, prop, &src),
                                     len);
-                               if (srctype != NULL)
-                                       *srctype = src;
-                               return (0);
+                               break;
                         }
                         /* FALLTHROUGH */
                 default:
@@ -316,24 +310,57 @@ zpool_get_prop_literal(zpool_handle_t *zhp, zpool_prop_t prop, char *buf,
                 case ZPOOL_PROP_ALLOCATED:
                 case ZPOOL_PROP_FREE:
                 case ZPOOL_PROP_FREEING:
-               case ZPOOL_PROP_EXPANDSZ:
+               case ZPOOL_PROP_LEAKED:
                 case ZPOOL_PROP_ASHIFT:
                         if (literal)
                                 (void) snprintf(buf, len, "%llu",
-                                       (u_longlong_t)intval);
+                                   (u_longlong_t)intval);
                         else
                                 (void) zfs_nicenum(intval, buf, len);
                         break;
  
+               case ZPOOL_PROP_EXPANDSZ:
+                       if (intval == 0) {
+                               (void) strlcpy(buf, "-", len);
+                       } else if (literal) {
+                               (void) snprintf(buf, len, "%llu",
+                                   (u_longlong_t)intval);
+                       } else {
+                               (void) zfs_nicebytes(intval, buf, len);
+                       }
+                       break;
+
                 case ZPOOL_PROP_CAPACITY:
-                       (void) snprintf(buf, len, "%llu%%",
-                           (u_longlong_t)intval);
+                       if (literal) {
+                               (void) snprintf(buf, len, "%llu",
+                                   (u_longlong_t)intval);
+                       } else {
+                               (void) snprintf(buf, len, "%llu%%",
+                                   (u_longlong_t)intval);
+                       }
+                       break;
+
+               case ZPOOL_PROP_FRAGMENTATION:
+                       if (intval == UINT64_MAX) {
+                               (void) strlcpy(buf, "-", len);
+                       } else if (literal) {
+                               (void) snprintf(buf, len, "%llu",
+                                   (u_longlong_t)intval);
+                       } else {
+                               (void) snprintf(buf, len, "%llu%%",
+                                   (u_longlong_t)intval);
+                       }
                         break;
  
                 case ZPOOL_PROP_DEDUPRATIO:
-                       (void) snprintf(buf, len, "%llu.%02llux",
-                           (u_longlong_t)(intval / 100),
-                           (u_longlong_t)(intval % 100));
+                       if (literal)
+                               (void) snprintf(buf, len, "%llu.%02llu",
+                                   (u_longlong_t)(intval / 100),
+                                   (u_longlong_t)(intval % 100));
+                       else
+                               (void) snprintf(buf, len, "%llu.%02llux",
+                                   (u_longlong_t)(intval / 100),
+                                   (u_longlong_t)(intval % 100));
                         break;
  
                 case ZPOOL_PROP_HEALTH:
@@ -383,6 +410,8 @@ static boolean_t
  bootfs_name_valid(const char *pool, char *bootfs)
  {
         int len = strlen(pool);
+       if (bootfs[0] == '\0')
+               return (B_TRUE);
  
         if (!zfs_name_valid(bootfs, ZFS_TYPE_FILESYSTEM|ZFS_TYPE_SNAPSHOT))
                 return (B_FALSE);
@@ -394,36 +423,13 @@ bootfs_name_valid(const char *pool, char *bootfs)
         return (B_FALSE);
  }
  
-#if defined(__sun__) || defined(__sun)
-/*
- * Inspect the configuration to determine if any of the devices contain
- * an EFI label.
- */
-static boolean_t
-pool_uses_efi(nvlist_t *config)
-{
-       nvlist_t **child;
-       uint_t c, children;
-
-       if (nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_CHILDREN,
-           &child, &children) != 0)
-               return (read_efi_label(config, NULL) >= 0);
-
-       for (c = 0; c < children; c++) {
-               if (pool_uses_efi(child[c]))
-                       return (B_TRUE);
-       }
-       return (B_FALSE);
-}
-#endif
-
  boolean_t
  zpool_is_bootable(zpool_handle_t *zhp)
  {
-       char bootfs[ZPOOL_MAXNAMELEN];
+       char bootfs[ZFS_MAX_DATASET_NAME_LEN];
  
         return (zpool_get_prop(zhp, ZPOOL_PROP_BOOTFS, bootfs,
-           sizeof (bootfs), NULL) == 0 && strncmp(bootfs, "-",
+           sizeof (bootfs), NULL, B_FALSE) == 0 && strncmp(bootfs, "-",
             sizeof (bootfs)) != 0);
  }
  
@@ -445,7 +451,6 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
         char *slash, *check;
         struct stat64 statbuf;
         zpool_handle_t *zhp;
-       nvlist_t *nvroot;
  
         if (nvlist_alloc(&retprops, NV_UNIQUE_NAME, 0) != 0) {
                 (void) no_memory(hdl);
@@ -457,7 +462,7 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                 const char *propname = nvpair_name(elem);
  
                 prop = zpool_name_to_prop(propname);
-               if (prop == ZPROP_INVAL && zpool_prop_feature(propname)) {
+               if (prop == ZPOOL_PROP_INVAL && zpool_prop_feature(propname)) {
                         int err;
                         char *fname = strchr(propname, '@') + 1;
  
@@ -478,10 +483,20 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                         }
  
                         (void) nvpair_value_string(elem, &strval);
-                       if (strcmp(strval, ZFS_FEATURE_ENABLED) != 0) {
+                       if (strcmp(strval, ZFS_FEATURE_ENABLED) != 0 &&
+                           strcmp(strval, ZFS_FEATURE_DISABLED) != 0) {
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "property '%s' can only be set to "
-                                   "'enabled'"), propname);
+                                   "'enabled' or 'disabled'"), propname);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+
+                       if (!flags.create &&
+                           strcmp(strval, ZFS_FEATURE_DISABLED) == 0) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "property '%s' can only be set to "
+                                   "'disabled' at creation time"), propname);
                                 (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
                                 goto error;
                         }
@@ -496,7 +511,7 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                 /*
                  * Make sure this property is valid and applies to this type.
                  */
-               if (prop == ZPROP_INVAL) {
+               if (prop == ZPOOL_PROP_INVAL) {
                         zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                             "invalid property '%s'"), propname);
                         (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
@@ -518,8 +533,6 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                  * Perform additional checking for specific properties.
                  */
                 switch (prop) {
-               default:
-                       break;
                 case ZPOOL_PROP_VERSION:
                         if (intval < version ||
                             !SPA_VERSION_IS_SUPPORTED(intval)) {
@@ -532,18 +545,13 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                         break;
  
                 case ZPOOL_PROP_ASHIFT:
-                       if (!flags.create) {
-                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "property '%s' can only be set at "
-                                   "creation time"), propname);
-                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
-                               goto error;
-                       }
-
-                       if (intval != 0 && (intval < 9 || intval > 13)) {
+                       if (intval != 0 &&
+                           (intval < ASHIFT_MIN || intval > ASHIFT_MAX)) {
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "property '%s' number %d is invalid."),
-                                   propname, intval);
+                                   "invalid '%s=%d' property: only values "
+                                   "between %" PRId32 " and %" PRId32 " "
+                                   "are allowed.\n"),
+                                   propname, intval, ASHIFT_MIN, ASHIFT_MAX);
                                 (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
                                 goto error;
                         }
@@ -570,8 +578,7 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                          * The bootfs property value must be a dataset name, and
                          * that dataset must reside in the pool the property is set on.
                          */
-                       if (strval[0] != '\0' && !bootfs_name_valid(poolname,
-                           strval)) {
+                       if (!bootfs_name_valid(poolname, strval)) {
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "'%s' "
                                     "is an invalid name"), strval);
                                 (void) zfs_error(hdl, EZFS_INVALIDNAME, errbuf);
@@ -584,23 +591,6 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                                 (void) zfs_error(hdl, EZFS_OPENFAILED, errbuf);
                                 goto error;
                         }
-                       verify(nvlist_lookup_nvlist(zpool_get_config(zhp, NULL),
-                           ZPOOL_CONFIG_VDEV_TREE, &nvroot) == 0);
-
-#if defined(__sun__) || defined(__sun)
-                       /*
-                        * bootfs property cannot be set on a disk which has
-                        * been EFI labeled.
-                        */
-                       if (pool_uses_efi(nvroot)) {
-                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "property '%s' not supported on "
-                                   "EFI labeled devices"), propname);
-                               (void) zfs_error(hdl, EZFS_POOL_NOTSUP, errbuf);
-                               zpool_close(zhp);
-                               goto error;
-                       }
-#endif
                         zpool_close(zhp);
                         break;
  
@@ -690,6 +680,27 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                                 goto error;
                         }
                         break;
+               case ZPOOL_PROP_TNAME:
+                       if (!flags.create) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "property '%s' can only be set at "
+                                   "creation time"), propname);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+                       break;
+               case ZPOOL_PROP_MULTIHOST:
+                       if (get_system_hostid() == 0) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "requires a non-zero system hostid"));
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+                       break;
+               default:
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "property '%s'(%d) not defined"), propname, prop);
+                       break;
                 }
         }
  
@@ -844,7 +855,7 @@ zpool_expand_proplist(zpool_handle_t *zhp, zprop_list_t **plp)
  
                 if (entry->pl_prop != ZPROP_INVAL &&
                     zpool_get_prop(zhp, entry->pl_prop, buf, sizeof (buf),
-                   NULL) == 0) {
+                   NULL, B_FALSE) == 0) {
                         if (strlen(buf) > entry->pl_width)
                                 entry->pl_width = strlen(buf);
                 }
@@ -871,7 +882,7 @@ zpool_prop_get_feature(zpool_handle_t *zhp, const char *propname, char *buf,
  
         /*
          * Convert from feature name to feature guid. This conversion is
-        * unecessary for unsupported@... properties because they already
+        * unnecessary for unsupported@... properties because they already
          * use guids.
          */
         if (supported) {
@@ -1000,14 +1011,21 @@ zpool_name_valid(libzfs_handle_t *hdl, boolean_t isopen, const char *pool)
                                     "trailing slash in name"));
                                 break;
  
-                       case NAME_ERR_MULTIPLE_AT:
+                       case NAME_ERR_MULTIPLE_DELIMITERS:
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "multiple '@' delimiters in name"));
+                                   "multiple '@' and/or '#' delimiters in "
+                                   "name"));
                                 break;
+
                         case NAME_ERR_NO_AT:
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "permission set is missing '@'"));
                                 break;
+
+                       default:
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "(%d) not defined"), why);
+                               break;
                         }
                 }
                 return (B_FALSE);
@@ -1117,12 +1135,9 @@ zpool_open(libzfs_handle_t *hdl, const char *pool)
  void
  zpool_close(zpool_handle_t *zhp)
  {
-       if (zhp->zpool_config)
-               nvlist_free(zhp->zpool_config);
-       if (zhp->zpool_old_config)
-               nvlist_free(zhp->zpool_old_config);
-       if (zhp->zpool_props)
-               nvlist_free(zhp->zpool_props);
+       nvlist_free(zhp->zpool_config);
+       nvlist_free(zhp->zpool_old_config);
+       nvlist_free(zhp->zpool_props);
         free(zhp);
  }
  
@@ -1157,6 +1172,9 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
         zfs_cmd_t zc = {"\0"};
         nvlist_t *zc_fsprops = NULL;
         nvlist_t *zc_props = NULL;
+       nvlist_t *hidden_args = NULL;
+       uint8_t *wkeydata = NULL;
+       uint_t wkeylen = 0;
         char msg[1024];
         int ret = -1;
  
@@ -1186,18 +1204,35 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                     zfs_prop_to_name(ZFS_PROP_ZONED), &zonestr) == 0) &&
                     strcmp(zonestr, "on") == 0);
  
-               if ((zc_fsprops = zfs_valid_proplist(hdl,
-                   ZFS_TYPE_FILESYSTEM, fsprops, zoned, NULL, msg)) == NULL) {
+               if ((zc_fsprops = zfs_valid_proplist(hdl, ZFS_TYPE_FILESYSTEM,
+                   fsprops, zoned, NULL, NULL, B_TRUE, msg)) == NULL) {
                         goto create_failed;
                 }
                 if (!zc_props &&
                     (nvlist_alloc(&zc_props, NV_UNIQUE_NAME, 0) != 0)) {
                         goto create_failed;
                 }
+               if (zfs_crypto_create(hdl, NULL, zc_fsprops, props,
+                   &wkeydata, &wkeylen) != 0) {
+                       zfs_error(hdl, EZFS_CRYPTOFAILED, msg);
+                       goto create_failed;
+               }
                 if (nvlist_add_nvlist(zc_props,
                     ZPOOL_ROOTFS_PROPS, zc_fsprops) != 0) {
                         goto create_failed;
                 }
+               if (wkeydata != NULL) {
+                       if (nvlist_alloc(&hidden_args, NV_UNIQUE_NAME, 0) != 0)
+                               goto create_failed;
+
+                       if (nvlist_add_uint8_array(hidden_args, "wkeydata",
+                           wkeydata, wkeylen) != 0)
+                               goto create_failed;
+
+                       if (nvlist_add_nvlist(zc_props, ZPOOL_HIDDEN_ARGS,
+                           hidden_args) != 0)
+                               goto create_failed;
+               }
         }
  
         if (zc_props && zcmd_write_src_nvlist(hdl, &zc, zc_props) != 0)
@@ -1210,6 +1245,9 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                 zcmd_free_nvlists(&zc);
                 nvlist_free(zc_props);
                 nvlist_free(zc_fsprops);
+               nvlist_free(hidden_args);
+               if (wkeydata != NULL)
+                       free(wkeydata);
  
                 switch (errno) {
                 case EBUSY:
@@ -1226,6 +1264,21 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                             "lvm device"));
                         return (zfs_error(hdl, EZFS_BADDEV, msg));
  
+               case ERANGE:
+                       /*
+                        * This happens if the record size is smaller or larger
+                        * than the allowed size range, or not a power of 2.
+                        *
+                        * NOTE: although zfs_valid_proplist is called earlier,
+                        * this case may have slipped through since the
+                        * pool does not exist yet and it is therefore
+                        * impossible to read properties e.g. max blocksize
+                        * from the pool.
+                        */
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "record size invalid"));
+                       return (zfs_error(hdl, EZFS_BADPROP, msg));
+
                 case EOVERFLOW:
                         /*
                          * This occurs when one of the devices is below
@@ -1236,7 +1289,8 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                         {
                                 char buf[64];
  
-                               zfs_nicenum(SPA_MINDEVSIZE, buf, sizeof (buf));
+                               zfs_nicebytes(SPA_MINDEVSIZE, buf,
+                                   sizeof (buf));
  
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "one or more devices is less than the "
@@ -1263,6 +1317,9 @@ create_failed:
         zcmd_free_nvlists(&zc);
         nvlist_free(zc_props);
         nvlist_free(zc_fsprops);
+       nvlist_free(hidden_args);
+       if (wkeydata != NULL)
+               free(wkeydata);
         return (ret);
  }
  
@@ -1336,27 +1393,6 @@ zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
                 return (zfs_error(hdl, EZFS_BADVERSION, msg));
         }
  
-#if defined(__sun__) || defined(__sun)
-       if (zpool_is_bootable(zhp) && nvlist_lookup_nvlist_array(nvroot,
-           ZPOOL_CONFIG_SPARES, &spares, &nspares) == 0) {
-               uint64_t s;
-
-               for (s = 0; s < nspares; s++) {
-                       char *path;
-
-                       if (nvlist_lookup_string(spares[s], ZPOOL_CONFIG_PATH,
-                           &path) == 0 && pool_uses_efi(spares[s])) {
-                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "device '%s' contains an EFI label and "
-                                   "cannot be used on root pools."),
-                                   zpool_vdev_name(hdl, NULL, spares[s],
-                                   B_FALSE));
-                               return (zfs_error(hdl, EZFS_POOL_NOTSUP, msg));
-                       }
-               }
-       }
-#endif
-
         if (zpool_get_prop_int(zhp, ZPOOL_PROP_VERSION, NULL) <
             SPA_VERSION_L2CACHE &&
             nvlist_lookup_nvlist_array(nvroot, ZPOOL_CONFIG_L2CACHE,
@@ -1394,7 +1430,8 @@ zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
                         {
                                 char buf[64];
  
-                               zfs_nicenum(SPA_MINDEVSIZE, buf, sizeof (buf));
+                               zfs_nicebytes(SPA_MINDEVSIZE, buf,
+                                   sizeof (buf));
  
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "device is less than the minimum "
@@ -1645,8 +1682,7 @@ zpool_import(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
  
         ret = zpool_import_props(hdl, config, newname, props,
             ZFS_IMPORT_NORMAL);
-       if (props)
-               nvlist_free(props);
+       nvlist_free(props);
         return (ret);
  }
  
@@ -1671,7 +1707,7 @@ print_vdev_tree(libzfs_handle_t *hdl, const char *name, nvlist_t *nv,
                 return;
  
         for (c = 0; c < children; c++) {
-               vname = zpool_vdev_name(hdl, NULL, child[c], B_TRUE);
+               vname = zpool_vdev_name(hdl, NULL, child[c], VDEV_NAME_TYPE_ID);
                 print_vdev_tree(hdl, vname, child[c], indent + 2);
                 free(vname);
         }
@@ -1739,7 +1775,7 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                 thename = origname;
         }
  
-       if (props) {
+       if (props != NULL) {
                 uint64_t version;
                 prop_flags_t flags = { .create = B_FALSE, .import = B_TRUE };
  
@@ -1747,12 +1783,13 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                     &version) == 0);
  
                 if ((props = zpool_valid_proplist(hdl, origname,
-                   props, version, flags, errbuf)) == NULL) {
+                   props, version, flags, errbuf)) == NULL)
                         return (-1);
-               } else if (zcmd_write_src_nvlist(hdl, &zc, props) != 0) {
+               if (zcmd_write_src_nvlist(hdl, &zc, props) != 0) {
                         nvlist_free(props);
                         return (-1);
                 }
+               nvlist_free(props);
         }
  
         (void) strlcpy(zc.zc_name, thename, sizeof (zc.zc_name));
@@ -1761,11 +1798,11 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
             &zc.zc_guid) == 0);
  
         if (zcmd_write_conf_nvlist(hdl, &zc, config) != 0) {
-               nvlist_free(props);
+               zcmd_free_nvlists(&zc);
                 return (-1);
         }
         if (zcmd_alloc_dst_nvlist(hdl, &zc, zc.zc_nvlist_conf_size * 2) != 0) {
-               nvlist_free(props);
+               zcmd_free_nvlists(&zc);
                 return (-1);
         }
  
@@ -1781,10 +1818,14 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                 error = errno;
  
         (void) zcmd_read_dst_nvlist(hdl, &zc, &nv);
+
+       zcmd_free_nvlists(&zc);
+
         zpool_get_rewind_policy(config, &policy);
  
         if (error) {
                 char desc[1024];
+               char aux[256];
  
                 /*
                  * Dry-run failed, but we print out what success
@@ -1830,6 +1871,47 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                         (void) zfs_error(hdl, EZFS_BADVERSION, desc);
                         break;
  
+               case EREMOTEIO:
+                       if (nv != NULL && nvlist_lookup_nvlist(nv,
+                           ZPOOL_CONFIG_LOAD_INFO, &nvinfo) == 0) {
+                               char *hostname = "<unknown>";
+                               uint64_t hostid = 0;
+                               mmp_state_t mmp_state;
+
+                               mmp_state = fnvlist_lookup_uint64(nvinfo,
+                                   ZPOOL_CONFIG_MMP_STATE);
+
+                               if (nvlist_exists(nvinfo,
+                                   ZPOOL_CONFIG_MMP_HOSTNAME))
+                                       hostname = fnvlist_lookup_string(nvinfo,
+                                           ZPOOL_CONFIG_MMP_HOSTNAME);
+
+                               if (nvlist_exists(nvinfo,
+                                   ZPOOL_CONFIG_MMP_HOSTID))
+                                       hostid = fnvlist_lookup_uint64(nvinfo,
+                                           ZPOOL_CONFIG_MMP_HOSTID);
+
+                               if (mmp_state == MMP_STATE_ACTIVE) {
+                                       (void) snprintf(aux, sizeof (aux),
+                                           dgettext(TEXT_DOMAIN, "pool is imp"
+                                           "orted on host '%s' (hostid=%lx).\n"
+                                           "Export the pool on the other "
+                                           "system, then run 'zpool import'."),
+                                           hostname, (unsigned long) hostid);
+                               } else if (mmp_state == MMP_STATE_NO_HOSTID) {
+                                       (void) snprintf(aux, sizeof (aux),
+                                           dgettext(TEXT_DOMAIN, "pool has "
+                                           "the multihost property on and "
+                                           "the\nsystem's hostid is not set. "
+                                           "Set a unique system hostid with "
+                                           "the zgenhostid(8) command.\n"));
+                               }
+
+                               (void) zfs_error_aux(hdl, aux);
+                       }
+                       (void) zfs_error(hdl, EZFS_ACTIVE_POOL, desc);
+                       break;
+
                 case EINVAL:
                         (void) zfs_error(hdl, EZFS_INVALCONFIG, desc);
                         break;
@@ -1863,7 +1945,12 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                             "one or more devices are already in use\n"));
                         (void) zfs_error(hdl, EZFS_BADDEV, desc);
                         break;
-
+               case ENAMETOOLONG:
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "new name of at least one dataset is longer than "
+                           "the maximum allowable length"));
+                       (void) zfs_error(hdl, EZFS_NAMETOOLONG, desc);
+                       break;
                 default:
                         (void) zpool_standard_error(hdl, error, desc);
                         zpool_explain_recover(hdl,
@@ -1892,9 +1979,6 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                 return (0);
         }
  
-       zcmd_free_nvlists(&zc);
-       nvlist_free(props);
-
         return (ret);
  }
  
@@ -1902,22 +1986,39 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
   * Scan the pool.
   */
  int
-zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func)
+zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func, pool_scrub_cmd_t cmd)
  {
         zfs_cmd_t zc = {"\0"};
         char msg[1024];
+       int err;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         zc.zc_cookie = func;
+       zc.zc_flags = cmd;
+
+       if (zfs_ioctl(hdl, ZFS_IOC_POOL_SCAN, &zc) == 0)
+               return (0);
+
+       err = errno;
  
-       if (zfs_ioctl(hdl, ZFS_IOC_POOL_SCAN, &zc) == 0 ||
-           (errno == ENOENT && func != POOL_SCAN_NONE))
+       /* ECANCELED on a scrub means we resumed a paused scrub */
+       if (err == ECANCELED && func == POOL_SCAN_SCRUB &&
+           cmd == POOL_SCRUB_NORMAL)
+               return (0);
+
+       if (err == ENOENT && func != POOL_SCAN_NONE && cmd == POOL_SCRUB_NORMAL)
                 return (0);
  
         if (func == POOL_SCAN_SCRUB) {
-               (void) snprintf(msg, sizeof (msg),
-                   dgettext(TEXT_DOMAIN, "cannot scrub %s"), zc.zc_name);
+               if (cmd == POOL_SCRUB_PAUSE) {
+                       (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
+                           "cannot pause scrubbing %s"), zc.zc_name);
+               } else {
+                       assert(cmd == POOL_SCRUB_NORMAL);
+                       (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
+                           "cannot scrub %s"), zc.zc_name);
+               }
         } else if (func == POOL_SCAN_NONE) {
                 (void) snprintf(msg, sizeof (msg),
                     dgettext(TEXT_DOMAIN, "cannot cancel scrubbing %s"),
@@ -1926,7 +2027,7 @@ zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func)
                 assert(!"unexpected result");
         }
  
-       if (errno == EBUSY) {
+       if (err == EBUSY) {
                 nvlist_t *nvroot;
                 pool_scan_stat_t *ps = NULL;
                 uint_t psc;
@@ -1935,14 +2036,18 @@ zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func)
                     ZPOOL_CONFIG_VDEV_TREE, &nvroot) == 0);
                 (void) nvlist_lookup_uint64_array(nvroot,
                     ZPOOL_CONFIG_SCAN_STATS, (uint64_t **)&ps, &psc);
-               if (ps && ps->pss_func == POOL_SCAN_SCRUB)
-                       return (zfs_error(hdl, EZFS_SCRUBBING, msg));
-               else
+               if (ps && ps->pss_func == POOL_SCAN_SCRUB) {
+                       if (cmd == POOL_SCRUB_PAUSE)
+                               return (zfs_error(hdl, EZFS_SCRUB_PAUSED, msg));
+                       else
+                               return (zfs_error(hdl, EZFS_SCRUBBING, msg));
+               } else {
                         return (zfs_error(hdl, EZFS_RESILVERING, msg));
-       } else if (errno == ENOENT) {
+               }
+       } else if (err == ENOENT) {
                 return (zfs_error(hdl, EZFS_NO_SCRUB, msg));
         } else {
-               return (zpool_standard_error(hdl, errno, msg));
+               return (zpool_standard_error(hdl, err, msg));
         }
  }
  
@@ -2037,10 +2142,7 @@ vdev_to_nvlist_iter(nvlist_t *nv, nvlist_t *search, boolean_t *avail_spare,
                                 break;
                         }
  
-                       verify(strncmp(type, VDEV_TYPE_RAIDZ,
-                           strlen(VDEV_TYPE_RAIDZ)) == 0 ||
-                           strncmp(type, VDEV_TYPE_MIRROR,
-                           strlen(VDEV_TYPE_MIRROR)) == 0);
+                       verify(zpool_vdev_is_interior(type));
                         verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_ID,
                             &id) == 0);
  
@@ -2147,10 +2249,13 @@ zpool_find_vdev_by_physpath(zpool_handle_t *zhp, const char *ppath,
  /*
   * Determine if we have an "interior" top-level vdev (i.e mirror/raidz).
   */
-boolean_t
+static boolean_t
  zpool_vdev_is_interior(const char *name)
  {
         if (strncmp(name, VDEV_TYPE_RAIDZ, strlen(VDEV_TYPE_RAIDZ)) == 0 ||
+           strncmp(name, VDEV_TYPE_SPARE, strlen(VDEV_TYPE_SPARE)) == 0 ||
+           strncmp(name,
+           VDEV_TYPE_REPLACING, strlen(VDEV_TYPE_REPLACING)) == 0 ||
             strncmp(name, VDEV_TYPE_MIRROR, strlen(VDEV_TYPE_MIRROR)) == 0)
                 return (B_TRUE);
         return (B_FALSE);
@@ -2189,7 +2294,7 @@ zpool_find_vdev(zpool_handle_t *zhp, const char *path, boolean_t *avail_spare,
  }
  
  static int
-vdev_online(nvlist_t *nv)
+vdev_is_online(nvlist_t *nv)
  {
         uint64_t ival;
  
@@ -2257,12 +2362,13 @@ vdev_get_physpaths(nvlist_t *nv, char *physpath, size_t phypath_size,
                                 return (EZFS_INVALCONFIG);
                 }
  
-               if (vdev_online(nv)) {
+               if (vdev_is_online(nv)) {
                         if ((ret = vdev_get_one_physpath(nv, physpath,
                             phypath_size, rsz)) != 0)
                                 return (ret);
                 }
         } else if (strcmp(type, VDEV_TYPE_MIRROR) == 0 ||
+           strcmp(type, VDEV_TYPE_RAIDZ) == 0 ||
             strcmp(type, VDEV_TYPE_REPLACING) == 0 ||
             (is_spare = (strcmp(type, VDEV_TYPE_SPARE) == 0))) {
                 nvlist_t **child;
@@ -2308,15 +2414,11 @@ zpool_get_config_physpath(nvlist_t *config, char *physpath, size_t phypath_size)
             &child, &count) != 0)
                 return (EZFS_INVALCONFIG);
  
-#if defined(__sun__) || defined(__sun)
         /*
-        * root pool can not have EFI labeled disks and can only have
-        * a single top-level vdev.
+        * root pool can only have a single top-level vdev.
          */
-       if (strcmp(type, VDEV_TYPE_ROOT) != 0 || count != 1 ||
-           pool_uses_efi(vdev_root))
+       if (strcmp(type, VDEV_TYPE_ROOT) != 0 || count != 1)
                 return (EZFS_POOL_INVALARG);
-#endif
  
         (void) vdev_get_physpaths(child[0], physpath, phypath_size, &rsz,
             B_FALSE);
@@ -2363,15 +2465,58 @@ zpool_relabel_disk(libzfs_handle_t *hdl, const char *path, const char *msg)
          * The module will do it for us in vdev_disk_open().
          */
         error = efi_use_whole_disk(fd);
+
+       /* Flush the buffers to disk and invalidate the page cache. */
+       (void) fsync(fd);
+       (void) ioctl(fd, BLKFLSBUF);
+
         (void) close(fd);
         if (error && error != VT_ENOSPC) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "cannot "
                     "relabel '%s': unable to read disk capacity"), path);
                 return (zfs_error(hdl, EZFS_NOCAP, msg));
         }
+
         return (0);
  }
  
+/*
+ * Look up the vdev named by 'path' with zpool_find_vdev() and return its
+ * GUID.  Returns 0 when the vdev cannot be found.
+ *
+ * is_spare, is_l2cache and is_log are optional outputs: each non-NULL
+ * pointer receives the matching flag reported by zpool_find_vdev(), and a
+ * NULL pointer is simply skipped.  Nothing is stored when the lookup fails.
+ */
+static uint64_t
+zpool_vdev_path_to_guid_impl(zpool_handle_t *zhp, const char *path,
+    boolean_t *is_spare, boolean_t *is_l2cache, boolean_t *is_log)
+{
+       boolean_t found_spare = B_FALSE;
+       boolean_t found_l2cache = B_FALSE;
+       boolean_t found_log = B_FALSE;
+       uint64_t vdev_guid;
+       nvlist_t *vdev;
+
+       vdev = zpool_find_vdev(zhp, path, &found_spare, &found_l2cache,
+           &found_log);
+       if (vdev == NULL)
+               return (0);
+
+       /* The GUID lookup on a vdev that was found is verified to succeed. */
+       verify(nvlist_lookup_uint64(vdev, ZPOOL_CONFIG_GUID,
+           &vdev_guid) == 0);
+
+       /* Report the vdev class only to callers that asked for it. */
+       if (is_spare != NULL)
+               *is_spare = found_spare;
+       if (is_l2cache != NULL)
+               *is_l2cache = found_l2cache;
+       if (is_log != NULL)
+               *is_log = found_log;
+
+       return (vdev_guid);
+}
+
+/*
+ * Convert a vdev path to a GUID for callers that do not need to know whether
+ * the vdev is a spare, l2cache, or log device.  Returns the GUID, or 0 on
+ * error.
+ */
+uint64_t
+zpool_vdev_path_to_guid(zpool_handle_t *zhp, const char *path)
+{
+       uint64_t guid;
+
+       guid = zpool_vdev_path_to_guid_impl(zhp, path, NULL, NULL, NULL);
+       return (guid);
+}
+
  /*
   * Bring the specified vdev online.   The 'flags' parameter is a set of the
   * ZFS_ONLINE_* flags.
@@ -2382,6 +2527,7 @@ zpool_vdev_online(zpool_handle_t *zhp, const char *path, int flags,
  {
         zfs_cmd_t zc = {"\0"};
         char msg[1024];
+       char *pathname;
         nvlist_t *tgt;
         boolean_t avail_spare, l2cache, islog;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
@@ -2405,8 +2551,9 @@ zpool_vdev_online(zpool_handle_t *zhp, const char *path, int flags,
         if (avail_spare)
                 return (zfs_error(hdl, EZFS_ISSPARE, msg));
  
-       if (flags & ZFS_ONLINE_EXPAND ||
-           zpool_get_prop_int(zhp, ZPOOL_PROP_AUTOEXPAND, NULL)) {
+       if ((flags & ZFS_ONLINE_EXPAND ||
+           zpool_get_prop_int(zhp, ZPOOL_PROP_AUTOEXPAND, NULL)) &&
+           nvlist_lookup_string(tgt, ZPOOL_CONFIG_PATH, &pathname) == 0) {
                 uint64_t wholedisk = 0;
  
                 (void) nvlist_lookup_uint64(tgt, ZPOOL_CONFIG_WHOLE_DISK,
@@ -2623,18 +2770,6 @@ zpool_vdev_attach(zpool_handle_t *zhp,
                 (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
                     "cannot attach %s to %s"), new_disk, old_disk);
  
-#if defined(__sun__) || defined(__sun)
-       /*
-        * If this is a root pool, make sure that we're not attaching an
-        * EFI labeled device.
-        */
-       if (rootpool && pool_uses_efi(nvroot)) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "EFI labeled devices are not supported on root pools."));
-               return (zfs_error(hdl, EZFS_POOL_NOTSUP, msg));
-       }
-#endif
-
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         if ((tgt = zpool_find_vdev(zhp, old_disk, &avail_spare, &l2cache,
             &islog)) == 0)
@@ -2659,7 +2794,7 @@ zpool_vdev_attach(zpool_handle_t *zhp,
         verify(nvlist_lookup_nvlist(zpool_get_config(zhp, NULL),
             ZPOOL_CONFIG_VDEV_TREE, &config_root) == 0);
  
-       if ((newname = zpool_vdev_name(NULL, NULL, child[0], B_FALSE)) == NULL)
+       if ((newname = zpool_vdev_name(NULL, NULL, child[0], 0)) == NULL)
                 return (-1);
  
         /*
@@ -2850,11 +2985,11 @@ find_vdev_entry(zpool_handle_t *zhp, nvlist_t **mchild, uint_t mchildren,
         for (mc = 0; mc < mchildren; mc++) {
                 uint_t sc;
                 char *mpath = zpool_vdev_name(zhp->zpool_hdl, zhp,
-                   mchild[mc], B_FALSE);
+                   mchild[mc], 0);
  
                 for (sc = 0; sc < schildren; sc++) {
                         char *spath = zpool_vdev_name(zhp->zpool_hdl, zhp,
-                           schild[sc], B_FALSE);
+                           schild[sc], 0);
                         boolean_t result = (strcmp(mpath, spath) == 0);
  
                         free(spath);
@@ -2884,7 +3019,7 @@ zpool_vdev_split(zpool_handle_t *zhp, char *newname, nvlist_t **newroot,
         nvlist_t **varray = NULL, *zc_props = NULL;
         uint_t c, children, newchildren, lastlog = 0, vcount, found = 0;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
-       uint64_t vers;
+       uint64_t vers, readonly = B_FALSE;
         boolean_t freelist = B_FALSE, memory_err = B_TRUE;
         int retval = 0;
  
@@ -2909,14 +3044,21 @@ zpool_vdev_split(zpool_handle_t *zhp, char *newname, nvlist_t **newroot,
                 if ((zc_props = zpool_valid_proplist(hdl, zhp->zpool_name,
                     props, vers, flags, msg)) == NULL)
                         return (-1);
+               (void) nvlist_lookup_uint64(zc_props,
+                   zpool_prop_to_name(ZPOOL_PROP_READONLY), &readonly);
+               if (readonly) {
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "property %s can only be set at import time"),
+                           zpool_prop_to_name(ZPOOL_PROP_READONLY));
+                       return (-1);
+               }
         }
  
         if (nvlist_lookup_nvlist_array(tree, ZPOOL_CONFIG_CHILDREN, &child,
             &children) != 0) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                     "Source pool is missing vdev tree"));
-               if (zc_props)
-                       nvlist_free(zc_props);
+               nvlist_free(zc_props);
                 return (-1);
         }
  
@@ -3064,10 +3206,8 @@ out:
                 free(varray);
         }
         zcmd_free_nvlists(&zc);
-       if (zc_props)
-               nvlist_free(zc_props);
-       if (newconfig)
-               nvlist_free(newconfig);
+       nvlist_free(zc_props);
+       nvlist_free(newconfig);
         if (freelist) {
                 nvlist_free(*newroot);
                 *newroot = NULL;
@@ -3083,8 +3223,8 @@ out:
  }
  
  /*
- * Remove the given device.  Currently, this is supported only for hot spares
- * and level 2 cache devices.
+ * Remove the given device.  Currently, this is supported only for hot spares,
+ * cache, and log devices.
   */
  int
  zpool_vdev_remove(zpool_handle_t *zhp, const char *path)
@@ -3108,7 +3248,7 @@ zpool_vdev_remove(zpool_handle_t *zhp, const char *path)
          */
         if (!avail_spare && !l2cache && !islog) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "only inactive hot spares, cache, top-level, "
+                   "only inactive hot spares, cache, "
                     "or log devices can be removed"));
                 return (zfs_error(hdl, EZFS_NODEVICE, msg));
         }
@@ -3252,22 +3392,44 @@ zpool_reguid(zpool_handle_t *zhp)
   * Reopen the pool.
   */
  int
-zpool_reopen(zpool_handle_t *zhp)
+zpool_reopen_one(zpool_handle_t *zhp, void *data)
  {
-       zfs_cmd_t zc = {"\0"};
-       char msg[1024];
-       libzfs_handle_t *hdl = zhp->zpool_hdl;
+       libzfs_handle_t *hdl = zpool_get_handle(zhp);
+       const char *pool_name = zpool_get_name(zhp);
+       boolean_t *scrub_restart = data;
+       int error;
  
-       (void) snprintf(msg, sizeof (msg),
-           dgettext(TEXT_DOMAIN, "cannot reopen '%s'"),
-           zhp->zpool_name);
+       error = lzc_reopen(pool_name, *scrub_restart);
+       if (error) {
+               return (zpool_standard_error_fmt(hdl, error,
+                   dgettext(TEXT_DOMAIN, "cannot reopen '%s'"), pool_name));
+       }
  
-       (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
-       if (zfs_ioctl(hdl, ZFS_IOC_POOL_REOPEN, &zc) == 0)
-               return (0);
-       return (zpool_standard_error(hdl, errno, msg));
+       return (0);
  }
  
+/*
+ * Call into libzfs_core to execute the sync ioctl on one pool.  'data' must
+ * point to a boolean_t; its value is passed along as the "force" entry of
+ * the request nvlist.  Returns 0 on success, otherwise the result of
+ * zpool_standard_error_fmt() for the error returned by lzc_sync().
+ */
+int
+zpool_sync_one(zpool_handle_t *zhp, void *data)
+{
+       libzfs_handle_t *hdl = zpool_get_handle(zhp);
+       const char *pool_name = zpool_get_name(zhp);
+       boolean_t *force = data;
+       nvlist_t *args = fnvlist_alloc();
+       int error;
+
+       fnvlist_add_boolean_value(args, "force", *force);
+       error = lzc_sync(pool_name, args, NULL);
+
+       /* The request nvlist is not needed again, whatever the outcome. */
+       nvlist_free(args);
+
+       if (error == 0)
+               return (0);
+
+       return (zpool_standard_error_fmt(hdl, error,
+           dgettext(TEXT_DOMAIN, "sync '%s' failed"), pool_name));
+}
+
+#if defined(__sun__) || defined(__sun)
  /*
   * Convert from a devid string to a path.
   */
@@ -3291,8 +3453,10 @@ devid_to_path(char *devid_str)
         if (ret != 0)
                 return (NULL);
  
-       if ((path = strdup(list[0].devname)) == NULL)
-               return (NULL);
+       /*
+        * If strdup() fails, we will just return NULL below.
+        */
+       path = strdup(list[0].devname);
  
         devid_free_nmlist(list);
  
@@ -3343,36 +3507,82 @@ set_path(zpool_handle_t *zhp, nvlist_t *nv, const char *path)
  
         (void) ioctl(zhp->zpool_hdl->libzfs_fd, ZFS_IOC_VDEV_SETPATH, &zc);
  }
+#endif /* sun */
  
  /*
   * Remove partition suffix from a vdev path.  Partition suffixes may take three
   * forms: "-partX", "pX", or "X", where X is a string of digits.  The second
   * case only occurs when the suffix is preceded by a digit, i.e. "md0p0" The
   * third case only occurs when preceded by a string matching the regular
- * expression "^[hs]d[a-z]+", i.e. a scsi or ide disk.
+ * expression "^([hsv]|xv)d[a-z]+", i.e. a scsi, ide, virtio or xen disk.
+ *
+ * caller must free the returned string
   */
-static char *
-strip_partition(libzfs_handle_t *hdl, char *path)
+char *
+zfs_strip_partition(char *path)
  {
-       char *tmp = zfs_strdup(hdl, path);
+       char *tmp = strdup(path);
         char *part = NULL, *d = NULL;
+       if (!tmp)
+               return (NULL);
  
         if ((part = strstr(tmp, "-part")) && part != tmp) {
                 d = part + 5;
         } else if ((part = strrchr(tmp, 'p')) &&
             part > tmp + 1 && isdigit(*(part-1))) {
                 d = part + 1;
-       } else if ((tmp[0] == 'h' || tmp[0] == 's') && tmp[1] == 'd') {
-               for (d = &tmp[2]; isalpha(*d); part = ++d);
+       } else if ((tmp[0] == 'h' || tmp[0] == 's' || tmp[0] == 'v') &&
+           tmp[1] == 'd') {
+               for (d = &tmp[2]; isalpha(*d); part = ++d) { }
+       } else if (strncmp("xvd", tmp, 3) == 0) {
+               for (d = &tmp[3]; isalpha(*d); part = ++d) { }
         }
         if (part && d && *d != '\0') {
-               for (; isdigit(*d); d++);
+               for (; isdigit(*d); d++) { }
                 if (*d == '\0')
                         *part = '\0';
         }
+
         return (tmp);
  }
  
+/*
+ * Same as zfs_strip_partition, but allows a leading directory such as
+ * "/dev/" to be in the pathname.  Only the final path component is
+ * stripped; a path without any '/' is handled as a bare device name.
+ *
+ * path:       /dev/sda1
+ * returns:    /dev/sda
+ *
+ * Returns NULL if memory cannot be allocated.  The returned string must be
+ * freed by the caller.
+ */
+char *
+zfs_strip_partition_path(char *path)
+{
+       char *newpath = strdup(path);
+       char *sd_offset;
+       char *new_sd;
+
+       if (!newpath)
+               return (NULL);
+
+       /*
+        * Point to the "sda1" part of "/dev/sda1".  strrchr() returns NULL
+        * when there is no '/', in which case the whole string is the name.
+        */
+       sd_offset = strrchr(newpath, '/');
+       sd_offset = (sd_offset != NULL) ? sd_offset + 1 : newpath;
+
+       /* Get our new name "sda" */
+       new_sd = zfs_strip_partition(sd_offset);
+       if (!new_sd) {
+               free(newpath);
+               return (NULL);
+       }
+
+       /*
+        * Paste the "sda" where "sda1" was.  The stripped name is never
+        * longer than the original, so it always fits in place.
+        */
+       (void) strlcpy(sd_offset, new_sd, strlen(sd_offset) + 1);
+
+       /* Free temporary "sda" */
+       free(new_sd);
+
+       return (newpath);
+}
+
  #define        PATH_BUF_LEN    64
  
  /*
@@ -3392,23 +3602,51 @@ strip_partition(libzfs_handle_t *hdl, char *path)
   */
  char *
  zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
-    boolean_t verbose)
+    int name_flags)
  {
-       char *path, *devid, *type;
+       char *path, *type, *env;
         uint64_t value;
         char buf[PATH_BUF_LEN];
         char tmpbuf[PATH_BUF_LEN];
-       vdev_stat_t *vs;
-       uint_t vsc;
  
-       if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_NOT_PRESENT,
-           &value) == 0) {
-               verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_GUID,
-                   &value) == 0);
-               (void) snprintf(buf, sizeof (buf), "%llu",
-                   (u_longlong_t)value);
+       /*
+        * vdev_name will be "root"/"root-0" for the root vdev, but it is the
+        * zpool name that will be displayed to the user.
+        */
+       verify(nvlist_lookup_string(nv, ZPOOL_CONFIG_TYPE, &type) == 0);
+       if (zhp != NULL && strcmp(type, "root") == 0)
+               return (zfs_strdup(hdl, zpool_get_name(zhp)));
+
+       env = getenv("ZPOOL_VDEV_NAME_PATH");
+       if (env && (strtoul(env, NULL, 0) > 0 ||
+           !strncasecmp(env, "YES", 3) || !strncasecmp(env, "ON", 2)))
+               name_flags |= VDEV_NAME_PATH;
+
+       env = getenv("ZPOOL_VDEV_NAME_GUID");
+       if (env && (strtoul(env, NULL, 0) > 0 ||
+           !strncasecmp(env, "YES", 3) || !strncasecmp(env, "ON", 2)))
+               name_flags |= VDEV_NAME_GUID;
+
+       env = getenv("ZPOOL_VDEV_NAME_FOLLOW_LINKS");
+       if (env && (strtoul(env, NULL, 0) > 0 ||
+           !strncasecmp(env, "YES", 3) || !strncasecmp(env, "ON", 2)))
+               name_flags |= VDEV_NAME_FOLLOW_LINKS;
+
+       if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_NOT_PRESENT, &value) == 0 ||
+           name_flags & VDEV_NAME_GUID) {
+               (void) nvlist_lookup_uint64(nv, ZPOOL_CONFIG_GUID, &value);
+               (void) snprintf(buf, sizeof (buf), "%llu", (u_longlong_t)value);
                 path = buf;
         } else if (nvlist_lookup_string(nv, ZPOOL_CONFIG_PATH, &path) == 0) {
+#if defined(__sun__) || defined(__sun)
+               /*
+                * Live VDEV path updates to a kernel VDEV during a
+                * zpool_vdev_name lookup are not supported on Linux.
+                */
+               char *devid;
+               vdev_stat_t *vs;
+               uint_t vsc;
+
                 /*
                  * If the device is dead (faulted, offline, etc) then don't
                  * bother opening it.  Otherwise we may be forcing the user to
@@ -3446,12 +3684,22 @@ zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
                         if (newdevid)
                                 devid_str_free(newdevid);
                 }
+#endif /* sun */
+
+               if (name_flags & VDEV_NAME_FOLLOW_LINKS) {
+                       char *rp = realpath(path, NULL);
+                       if (rp) {
+                               strlcpy(buf, rp, sizeof (buf));
+                               path = buf;
+                               free(rp);
+                       }
+               }
  
                 /*
                  * For a block device only use the name.
                  */
-               verify(nvlist_lookup_string(nv, ZPOOL_CONFIG_TYPE, &type) == 0);
-               if (strcmp(type, VDEV_TYPE_DISK) == 0) {
+               if ((strcmp(type, VDEV_TYPE_DISK) == 0) &&
+                   !(name_flags & VDEV_NAME_PATH)) {
                         path = strrchr(path, '/');
                         path++;
                 }
@@ -3459,18 +3707,17 @@ zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
                 /*
                  * Remove the partition from the path if this is a whole disk.
                  */
-               if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_WHOLE_DISK,
-                   &value) == 0 && value) {
-                       return (strip_partition(hdl, path));
+               if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_WHOLE_DISK, &value)
+                   == 0 && value && !(name_flags & VDEV_NAME_PATH)) {
+                       return (zfs_strip_partition(path));
                 }
         } else {
-               verify(nvlist_lookup_string(nv, ZPOOL_CONFIG_TYPE, &path) == 0);
+               path = type;
  
                 /*
                  * If it's a raidz device, we need to stick in the parity level.
                  */
                 if (strcmp(path, VDEV_TYPE_RAIDZ) == 0) {
-
                         verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_NPARITY,
                             &value) == 0);
                         (void) snprintf(buf, sizeof (buf), "%s%llu", path,
@@ -3482,9 +3729,8 @@ zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
                  * We identify each top-level vdev by using a <type-id>
                  * naming convention.
                  */
-               if (verbose) {
+               if (name_flags & VDEV_NAME_TYPE_ID) {
                         uint64_t id;
-
                         verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_ID,
                             &id) == 0);
                         (void) snprintf(tmpbuf, sizeof (tmpbuf), "%s-%llu",
@@ -3497,9 +3743,9 @@ zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
  }
  
  static int
-zbookmark_compare(const void *a, const void *b)
+zbookmark_mem_compare(const void *a, const void *b)
  {
-       return (memcmp(a, b, sizeof (zbookmark_t)));
+       return (memcmp(a, b, sizeof (zbookmark_phys_t)));
  }
  
  /*
@@ -3510,8 +3756,9 @@ int
  zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
  {
         zfs_cmd_t zc = {"\0"};
+       libzfs_handle_t *hdl = zhp->zpool_hdl;
         uint64_t count;
-       zbookmark_t *zb = NULL;
+       zbookmark_phys_t *zb = NULL;
         int i;
  
         /*
@@ -3523,9 +3770,8 @@ zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
             &count) == 0);
         if (count == 0)
                 return (0);
-       if ((zc.zc_nvlist_dst = (uintptr_t)zfs_alloc(zhp->zpool_hdl,
-           count * sizeof (zbookmark_t))) == (uintptr_t)NULL)
-               return (-1);
+       zc.zc_nvlist_dst = (uintptr_t)zfs_alloc(zhp->zpool_hdl,
+           count * sizeof (zbookmark_phys_t));
         zc.zc_nvlist_dst_size = count;
         (void) strcpy(zc.zc_name, zhp->zpool_name);
         for (;;) {
@@ -3533,13 +3779,16 @@ zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
                     &zc) != 0) {
                         free((void *)(uintptr_t)zc.zc_nvlist_dst);
                         if (errno == ENOMEM) {
+                               void *dst;
+
                                 count = zc.zc_nvlist_dst_size;
-                               if ((zc.zc_nvlist_dst = (uintptr_t)
-                                   zfs_alloc(zhp->zpool_hdl, count *
-                                   sizeof (zbookmark_t))) == (uintptr_t)NULL)
-                                       return (-1);
+                               dst = zfs_alloc(zhp->zpool_hdl, count *
+                                   sizeof (zbookmark_phys_t));
+                               zc.zc_nvlist_dst = (uintptr_t)dst;
                         } else {
-                               return (-1);
+                               return (zpool_standard_error_fmt(hdl, errno,
+                                   dgettext(TEXT_DOMAIN, "errors: List of "
+                                   "errors unavailable")));
                         }
                 } else {
                         break;
@@ -3553,11 +3802,11 @@ zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
          * _not_ copied as part of the process.  So we point the start of our
          * array appropriate and decrement the total number of elements.
          */
-       zb = ((zbookmark_t *)(uintptr_t)zc.zc_nvlist_dst) +
+       zb = ((zbookmark_phys_t *)(uintptr_t)zc.zc_nvlist_dst) +
             zc.zc_nvlist_dst_size;
         count -= zc.zc_nvlist_dst_size;
  
-       qsort(zb, count, sizeof (zbookmark_t), zbookmark_compare);
+       qsort(zb, count, sizeof (zbookmark_phys_t), zbookmark_mem_compare);
  
         verify(nvlist_alloc(nverrlistp, 0, KM_SLEEP) == 0);
  
@@ -3708,6 +3957,7 @@ zpool_history_unpack(char *buf, uint64_t bytes_read, uint64_t *leftover,
         uint64_t reclen;
         nvlist_t *nv;
         int i;
+       void *tmp;
  
         while (bytes_read > sizeof (reclen)) {
  
@@ -3727,8 +3977,14 @@ zpool_history_unpack(char *buf, uint64_t bytes_read, uint64_t *leftover,
                 /* add record to nvlist array */
                 (*numrecords)++;
                 if (ISP2(*numrecords + 1)) {
-                       *records = realloc(*records,
+                       tmp = realloc(*records,
                             *numrecords * 2 * sizeof (nvlist_t *));
+                       if (tmp == NULL) {
+                               nvlist_free(nv);
+                               (*numrecords)--;
+                               return (ENOMEM);
+                       }
+                       *records = tmp;
                 }
                 (*records)[*numrecords - 1] = nv;
         }
@@ -3737,22 +3993,24 @@ zpool_history_unpack(char *buf, uint64_t bytes_read, uint64_t *leftover,
         return (0);
  }
  
-#define        HIS_BUF_LEN     (128*1024)
-
  /*
   * Retrieve the command history of a pool.
   */
  int
  zpool_get_history(zpool_handle_t *zhp, nvlist_t **nvhisp)
  {
-       char buf[HIS_BUF_LEN];
+       char *buf;
+       int buflen = 128 * 1024;
         uint64_t off = 0;
         nvlist_t **records = NULL;
         uint_t numrecords = 0;
         int err, i;
  
+       buf = malloc(buflen);
+       if (buf == NULL)
+               return (ENOMEM);
         do {
-               uint64_t bytes_read = sizeof (buf);
+               uint64_t bytes_read = buflen;
                 uint64_t leftover;
  
                 if ((err = get_history(zhp, buf, &off, &bytes_read)) != 0)
@@ -3766,10 +4024,23 @@ zpool_get_history(zpool_handle_t *zhp, nvlist_t **nvhisp)
                     &leftover, &records, &numrecords)) != 0)
                         break;
                 off -= leftover;
+               if (leftover == bytes_read) {
+                       /*
+                        * no progress made, because buffer is not big enough
+                        * to hold this record; resize and retry.
+                        */
+                       buflen *= 2;
+                       free(buf);
+                       buf = malloc(buflen);
+                       if (buf == NULL)
+                               return (ENOMEM);
+               }
  
                 /* CONSTCOND */
         } while (1);
  
+       free(buf);
+
         if (!err) {
                 verify(nvlist_alloc(nvhisp, NV_UNIQUE_NAME, 0) == 0);
                 verify(nvlist_add_nvlist_array(*nvhisp, ZPOOL_HIST_RECORD,
@@ -3914,7 +4185,7 @@ zpool_obj_to_path(zpool_handle_t *zhp, uint64_t dsobj, uint64_t obj,
         zfs_cmd_t zc = {"\0"};
         boolean_t mounted = B_FALSE;
         char *mntpnt = NULL;
-       char dsname[MAXNAMELEN];
+       char dsname[ZFS_MAX_DATASET_NAME_LEN];
  
         if (dsobj == 0) {
                 /* special case for the MOS */
@@ -3976,7 +4247,7 @@ read_efi_label(nvlist_t *config, diskaddr_t *sb)
  
         (void) snprintf(diskname, sizeof (diskname), "%s%s", DISK_ROOT,
             strrchr(path, '/'));
-       if ((fd = open(diskname, O_RDWR|O_DIRECT)) >= 0) {
+       if ((fd = open(diskname, O_RDONLY|O_DIRECT)) >= 0) {
                 struct dk_gpt *vtoc;
  
                 if ((err = efi_alloc_and_read(fd, &vtoc)) >= 0) {
@@ -4022,36 +4293,13 @@ find_start_block(nvlist_t *config)
         return (MAXOFFSET_T);
  }
  
-int
-zpool_label_disk_wait(char *path, int timeout)
-{
-       struct stat64 statbuf;
-       int i;
-
-       /*
-        * Wait timeout miliseconds for a newly created device to be available
-        * from the given path.  There is a small window when a /dev/ device
-        * will exist and the udev link will not, so we must wait for the
-        * symlink.  Depending on the udev rules this may take a few seconds.
-        */
-       for (i = 0; i < timeout; i++) {
-               usleep(1000);
-
-               errno = 0;
-               if ((stat64(path, &statbuf) == 0) && (errno == 0))
-                       return (0);
-       }
-
-       return (ENOENT);
-}
-
-int
+static int
  zpool_label_disk_check(char *path)
  {
         struct dk_gpt *vtoc;
         int fd, err;
  
-       if ((fd = open(path, O_RDWR|O_DIRECT)) < 0)
+       if ((fd = open(path, O_RDONLY|O_DIRECT)) < 0)
                 return (errno);
  
         if ((err = efi_alloc_and_read(fd, &vtoc)) != 0) {
@@ -4070,6 +4318,32 @@ zpool_label_disk_check(char *path)
         return (0);
  }
  
+/*
+ * Generate a unique partition name for the ZFS member.  Partitions must
+ * have unique names to ensure udev will be able to create symlinks under
+ * /dev/disk/by-partlabel/ for all pool members.  The name written to
+ * label_name has the form zfs-<unique-id>, where <unique-id> is a 64-bit
+ * value printed as 16 hexadecimal digits.
+ */
+static void
+zpool_label_name(char *label_name, int label_size)
+{
+       uint64_t unique = 0;
+       int urandom = open("/dev/urandom", O_RDONLY);
+
+       if (urandom >= 0) {
+               /* A short or failed read leaves no usable value. */
+               if (read(urandom, &unique, sizeof (unique)) !=
+                   sizeof (unique))
+                       unique = 0;
+
+               close(urandom);
+       }
+
+       /* Fall back to rand() when /dev/urandom gave nothing (or zero). */
+       if (unique == 0) {
+               unique = (((uint64_t)rand()) << 32) | (uint64_t)rand();
+       }
+
+       snprintf(label_name, label_size, "zfs-%016llx", (u_longlong_t)unique);
+}
+
  /*
   * Label an individual disk.  The name provided is the short name,
   * stripped of any leading /dev path.
@@ -4092,15 +4366,6 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
         if (zhp) {
                 nvlist_t *nvroot;
  
-#if defined(__sun__) || defined(__sun)
-               if (zpool_is_bootable(zhp)) {
-                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                           "EFI labeled devices are not supported on root "
-                           "pools."));
-                       return (zfs_error(hdl, EZFS_POOL_NOTSUP, errbuf));
-               }
-#endif
-
                 verify(nvlist_lookup_nvlist(zhp->zpool_config,
                     ZPOOL_CONFIG_VDEV_TREE, &nvroot) == 0);
  
@@ -4116,7 +4381,7 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
  
         (void) snprintf(path, sizeof (path), "%s/%s", DISK_ROOT, name);
  
-       if ((fd = open(path, O_RDWR|O_DIRECT)) < 0) {
+       if ((fd = open(path, O_RDWR|O_DIRECT|O_EXCL)) < 0) {
                 /*
                  * This shouldn't happen.  We've long since verified that this
                  * is a valid device.
@@ -4160,19 +4425,27 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
          * can get, in the absence of V_OTHER.
          */
         vtoc->efi_parts[0].p_tag = V_USR;
-       (void) strcpy(vtoc->efi_parts[0].p_name, "zfs");
+       zpool_label_name(vtoc->efi_parts[0].p_name, EFI_PART_NAME_LEN);
  
         vtoc->efi_parts[8].p_start = slice_size + start_block;
         vtoc->efi_parts[8].p_size = resv;
         vtoc->efi_parts[8].p_tag = V_RESERVED;
  
-       if ((rval = efi_write(fd, vtoc)) != 0 || (rval = efi_rescan(fd)) != 0) {
-               /*
-                * Some block drivers (like pcata) may not support EFI
-                * GPT labels.  Print out a helpful error message dir-
-                * ecting the user to manually label the disk and give
-                * a specific slice.
-                */
+       rval = efi_write(fd, vtoc);
+
+       /* Flush the buffers to disk and invalidate the page cache. */
+       (void) fsync(fd);
+       (void) ioctl(fd, BLKFLSBUF);
+
+       if (rval == 0)
+               rval = efi_rescan(fd);
+
+       /*
+        * Some block drivers (like pcata) may not support EFI GPT labels.
+        * Print out a helpful error message directing the user to manually
+        * label the disk and give a specific slice.
+        */
+       if (rval != 0) {
                 (void) close(fd);
                 efi_free(vtoc);
  
@@ -4184,12 +4457,11 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
         (void) close(fd);
         efi_free(vtoc);
  
-       /* Wait for the first expected partition to appear. */
-
         (void) snprintf(path, sizeof (path), "%s/%s", DISK_ROOT, name);
         (void) zfs_append_partition(path, MAXPATHLEN);
  
-       rval = zpool_label_disk_wait(path, 3000);
+       /* Wait for udev to signal that the device has settled. */
+       rval = zpool_label_disk_wait(path, DISK_LABEL_WAIT);
         if (rval) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "failed to "
                     "detect device partitions on '%s': %d"), path, rval);
@@ -4209,3 +4481,281 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
  
         return (0);
  }
+
+/*
+ * Allocate and return the underlying device name for a device mapper device.
+ * If a device mapper device maps to multiple devices, return the first device
+ * listed in its sysfs "slaves" directory.
+ *
+ * For example, dm_name = "/dev/dm-0" could return "/dev/sda". Symlinks to a
+ * DM device (like /dev/disk/by-vdev/A0) are also allowed.
+ *
+ * Returns device name, or NULL on error or no match.  If dm_name is NULL,
+ * cannot be resolved, or has no /sys/block/<name>/slaves/ directory (i.e. it
+ * is not a DM device) then return NULL.
+ *
+ * NOTE: The returned name string must be *freed*.
+ */
+char *
+dm_get_underlying_path(char *dm_name)
+{
+       DIR *dp = NULL;
+       struct dirent *ep;
+       char *realp;
+       char *slash;
+       char *slaves_dir = NULL;
+       char *path = NULL;
+       const char *dev_str;
+
+       if (dm_name == NULL)
+               return (NULL);
+
+       /* dm name may be a symlink (like /dev/disk/by-vdev/A0) */
+       realp = realpath(dm_name, NULL);
+       if (realp == NULL)
+               return (NULL);
+
+       /*
+        * If they preface 'dev' with a path (like "/dev") then strip it off.
+        * We just want the 'dm-N' part.  Without any '/' the whole string is
+        * already the device name.
+        */
+       slash = strrchr(realp, '/');
+       dev_str = (slash != NULL) ? slash + 1 : realp;
+
+       /*
+        * The sysfs path gets its own pointer so that a failed asprintf(),
+        * which leaves its output undefined, can never cause a pointer into
+        * the middle of 'realp' to be passed to free() below.
+        */
+       if (asprintf(&slaves_dir, "/sys/block/%s/slaves/", dev_str) == -1) {
+               slaves_dir = NULL;
+               goto end;
+       }
+
+       dp = opendir(slaves_dir);
+       if (dp == NULL)
+               goto end;
+
+       /* Return the first non-directory entry in /sys/block/dm-N/slaves/ */
+       while ((ep = readdir(dp)) != NULL) {
+               /*
+                * Skip directories, and skip "." and ".." by name as well in
+                * case d_type is not filled in for them.
+                */
+               if (ep->d_type == DT_DIR || strcmp(ep->d_name, ".") == 0 ||
+                   strcmp(ep->d_name, "..") == 0)
+                       continue;
+
+               /* If asprintf() fails, 'path' is undefined */
+               if (asprintf(&path, "/dev/%s", ep->d_name) == -1)
+                       path = NULL;
+               break;
+       }
+
+end:
+       if (dp != NULL)
+               (void) closedir(dp);
+       free(slaves_dir);
+       free(realp);
+       return (path);
+}
+
+/*
+ * Report whether dev_name is a device mapper or multipath device.
+ *
+ * The answer is derived from dm_get_underlying_path(): a non-NULL result
+ * yields 1, a NULL result yields 0.
+ */
+int
+zfs_dev_is_dm(char *dev_name)
+{
+       char *underlying = dm_get_underlying_path(dev_name);
+       int is_dm = (underlying != NULL) ? 1 : 0;
+
+       /* Only the existence of the name matters; free(NULL) is a no-op. */
+       free(underlying);
+
+       return (is_dm);
+}
+
+/*
+ * By "whole disk" we mean an entire physical disk (something we can
+ * label, toggle the write cache on, etc.) as opposed to the full
+ * capacity of a pseudo-device such as lofi or did.  We act as if we
+ * are labeling the disk, which should be a pretty good test of whether
+ * it's a viable device or not.
+ *
+ * The device is opened read-only with O_DIRECT and handed to
+ * efi_alloc_and_init(); the label it allocates is released again right
+ * away.  Returns 1 if both steps succeed and 0 otherwise.
+ */
+int
+zfs_dev_is_whole_disk(char *dev_name)
+{
+       struct dk_gpt *label;
+       int whole_disk = 0;
+       int fd;
+
+       fd = open(dev_name, O_RDONLY | O_DIRECT);
+       if (fd < 0)
+               return (0);
+
+       if (efi_alloc_and_init(fd, EFI_NUMPAR, &label) == 0) {
+               efi_free(label);
+               whole_disk = 1;
+       }
+
+       (void) close(fd);
+
+       return (whole_disk);
+}
+
+/*
+ * Resolve a device name to the device that sits underneath it.
+ *
+ * dev_name may be a symlink to a device, a partition device, or a
+ * device mapper / multipath device.  A DM device is replaced by the
+ * first device it maps to; anything else is resolved with realpath().
+ * The result is then passed through zfs_strip_partition_path().  A name
+ * that already is the underlying device comes back as a copy of itself.
+ *
+ * For example:
+ *
+ * 1. /dev/disk/by-id/ata-QEMU_HARDDISK_QM00001 -> ../../sda
+ * dev_name:   /dev/disk/by-id/ata-QEMU_HARDDISK_QM00001
+ * returns:    /dev/sda
+ *
+ * 2. /dev/mapper/mpatha (made up of /dev/sda and /dev/sdb)
+ * dev_name:   /dev/mapper/mpatha
+ * returns:    /dev/sda (first device)
+ *
+ * 3. /dev/sda (already the underlying device)
+ * dev_name:   /dev/sda
+ * returns:    /dev/sda
+ *
+ * 4. /dev/dm-3 (mapped to /dev/sda)
+ * dev_name:   /dev/dm-3
+ * returns:    /dev/sda
+ *
+ * 5. /dev/disk/by-id/scsi-0QEMU_drive-scsi0-0-0-0-part9 -> ../../sdb9
+ * dev_name:   /dev/disk/by-id/scsi-0QEMU_drive-scsi0-0-0-0-part9
+ * returns:    /dev/sdb
+ *
+ * 6. /dev/disk/by-uuid/5df030cf-3cd9-46e4-8e99-3ccb462a4e9a -> ../../sda2
+ * dev_name:   /dev/disk/by-uuid/5df030cf-3cd9-46e4-8e99-3ccb462a4e9a
+ * returns:    /dev/sda
+ *
+ * Returns underlying device name, or NULL on error or no match.
+ *
+ * NOTE: The returned name string must be *freed*.
+ */
+char *
+zfs_get_underlying_path(char *dev_name)
+{
+       char *resolved;
+       char *stripped;
+
+       if (dev_name == NULL)
+               return (NULL);
+
+       /* Try the device mapper lookup first ... */
+       resolved = dm_get_underlying_path(dev_name);
+
+       /* ... and fall back to plain symlink resolution for non-DM names. */
+       if (resolved == NULL)
+               resolved = realpath(dev_name, NULL);
+
+       if (resolved == NULL)
+               return (NULL);
+
+       stripped = zfs_strip_partition_path(resolved);
+       free(resolved);
+
+       return (stripped);
+}
+
+/*
+ * Given a dev name like "sda", return the full enclosure sysfs path to
+ * the disk.  You can also pass in the name with "/dev" prepended
+ * to it (like /dev/sda).
+ *
+ * For example, disk "sda" in enclosure slot 1:
+ *     dev:            "sda"
+ *     returns:        "/sys/class/enclosure/1:0:3:0/Slot 1"
+ *
+ * 'dev' must be a non-devicemapper device.
+ *
+ * Returns NULL if dev_name is NULL, if /sys/block/<dev>/device cannot be
+ * opened, if no usable "enclosure_device" link is found there, or if memory
+ * allocation fails.  If several entries match, the last one that resolved
+ * successfully is returned.
+ *
+ * Returned string must be freed.
+ */
+char *
+zfs_get_enclosure_sysfs_path(char *dev_name)
+{
+       DIR *dp = NULL;
+       struct dirent *ep;
+       char buf[MAXPATHLEN];
+       char *slash;
+       char *devdir = NULL;
+       char *linkpath = NULL;
+       char *encl;
+       char *path = NULL;
+       ssize_t size;
+
+       if (dev_name == NULL)
+               return (NULL);
+
+       /* If they preface 'dev' with a path (like "/dev") then strip it off */
+       slash = strrchr(dev_name, '/');
+       if (slash != NULL)
+               dev_name = slash + 1;   /* +1 since we want the chr after '/' */
+
+       if (asprintf(&devdir, "/sys/block/%s/device", dev_name) == -1) {
+               /* If asprintf() fails, 'devdir' is undefined */
+               devdir = NULL;
+               goto end;
+       }
+
+       /* On failure 'devdir' stays set so it is released at 'end'. */
+       dp = opendir(devdir);
+       if (dp == NULL)
+               goto end;
+
+       /*
+        * Look through all sysfs entries in /sys/block/<dev>/device for
+        * the enclosure symlink.
+        */
+       while ((ep = readdir(dp)) != NULL) {
+               /* Ignore everything that's not our enclosure_device link */
+               if (strstr(ep->d_name, "enclosure_device") == NULL)
+                       continue;
+
+               /* Release the link name left over from an earlier match. */
+               free(linkpath);
+               if (asprintf(&linkpath, "%s/%s", devdir, ep->d_name) == -1) {
+                       /* If asprintf() fails, 'linkpath' is undefined */
+                       linkpath = NULL;
+                       break;
+               }
+
+               size = readlink(linkpath, buf, sizeof (buf));
+
+               /* Did readlink fail or crop the link name? */
+               if (size < 0 || (size_t)size >= sizeof (buf))
+                       break;
+
+               /*
+                * We got a valid link.  readlink() doesn't terminate strings
+                * so we have to do it.
+                */
+               buf[size] = '\0';
+
+               /*
+                * Our link will look like:
+                *
+                * "../../../../port-11:1:2/..STUFF../enclosure/1:0:3:0/SLOT 1"
+                *
+                * We want to grab the "enclosure/1:0:3:0/SLOT 1" part
+                */
+               encl = strstr(buf, "enclosure");
+               if (encl == NULL)
+                       break;
+
+               /* A later match replaces, rather than leaks, an earlier one. */
+               free(path);
+               if (asprintf(&path, "/sys/class/%s", encl) == -1) {
+                       /* If asprintf() fails, 'path' is undefined */
+                       path = NULL;
+                       break;
+               }
+       }
+
+end:
+       free(linkpath);
+       free(devdir);
+
+       if (dp != NULL)
+               (void) closedir(dp);
+
+       return (path);
+}