Add libtpool (thread pools)

[mirror_zfs.git] / lib / libzfs / libzfs_pool.c
diff --git a/lib/libzfs/libzfs_pool.c b/lib/libzfs/libzfs_pool.c

index 7836e587354c0526ab6e4ac698dc087f8086702e..d3363809d2b179ef54fc07557563972e821da07c 100644 (file)
--- a/lib/libzfs/libzfs_pool.c
+++ b/lib/libzfs/libzfs_pool.c
@@ -20,7 +20,11 @@
   */
  
  /*
+ * Copyright 2015 Nexenta Systems, Inc.  All rights reserved.
   * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
+ * Copyright (c) 2011, 2014 by Delphix. All rights reserved.
+ * Copyright 2016 Igor Kozhukhov <ikozhukhov@gmail.com>
+ * Copyright (c) 2017 Datto Inc.
   */
  
  #include <ctype.h>
@@ -32,7 +36,11 @@
  #include <stdlib.h>
  #include <strings.h>
  #include <unistd.h>
+#include <libgen.h>
+#include <zone.h>
+#include <sys/stat.h>
  #include <sys/efi_partition.h>
+#include <sys/systeminfo.h>
  #include <sys/vtoc.h>
  #include <sys/zfs_ioctl.h>
  #include <dlfcn.h>
@@ -41,18 +49,14 @@
  #include "zfs_prop.h"
  #include "libzfs_impl.h"
  #include "zfs_comutil.h"
+#include "zfeature_common.h"
  
  static int read_efi_label(nvlist_t *config, diskaddr_t *sb);
  
-#if defined(__i386) || defined(__amd64)
-#define        BOOTCMD "installgrub(1M)"
-#else
-#define        BOOTCMD "installboot(1M)"
-#endif
-
-#define        DISK_ROOT       "/dev/dsk"
-#define        RDISK_ROOT      "/dev/rdsk"
-#define        BACKUP_SLICE    "s2"
+/*
+ * Flags describing the context in which a pool property list is being
+ * validated.  The fields are declared unsigned so that a set one-bit flag
+ * reads back as 1; a signed one-bit field can only represent 0 and -1.
+ */
+typedef struct prop_flags {
+       unsigned int create:1;  /* Validate property on creation */
+       unsigned int import:1;  /* Validate property on import */
+} prop_flags_t;
  
  /*
   * ====================================================================
@@ -63,7 +67,7 @@ static int read_efi_label(nvlist_t *config, diskaddr_t *sb);
  static int
  zpool_get_all_props(zpool_handle_t *zhp)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
@@ -197,6 +201,39 @@ zpool_state_to_name(vdev_state_t state, vdev_aux_t aux)
                 return (gettext("DEGRADED"));
         case VDEV_STATE_HEALTHY:
                 return (gettext("ONLINE"));
+
+       default:
+               break;
+       }
+
+       return (gettext("UNKNOWN"));
+}
+
+/*
+ * Map POOL STATE to printed strings.
+ */
+const char *
+zpool_pool_state_to_name(pool_state_t state)
+{
+       switch (state) {
+       default:
+               break;
+       case POOL_STATE_ACTIVE:
+               return (gettext("ACTIVE"));
+       case POOL_STATE_EXPORTED:
+               return (gettext("EXPORTED"));
+       case POOL_STATE_DESTROYED:
+               return (gettext("DESTROYED"));
+       case POOL_STATE_SPARE:
+               return (gettext("SPARE"));
+       case POOL_STATE_L2CACHE:
+               return (gettext("L2CACHE"));
+       case POOL_STATE_UNINITIALIZED:
+               return (gettext("UNINITIALIZED"));
+       case POOL_STATE_UNAVAIL:
+               return (gettext("UNAVAIL"));
+       case POOL_STATE_POTENTIALLY_ACTIVE:
+               return (gettext("POTENTIALLY_ACTIVE"));
         }
  
         return (gettext("UNKNOWN"));
@@ -207,8 +244,8 @@ zpool_state_to_name(vdev_state_t state, vdev_aux_t aux)
   * a pre-allocated buffer.
   */
  int
-zpool_get_prop(zpool_handle_t *zhp, zpool_prop_t prop, char *buf, size_t len,
-    zprop_source_t *srctype)
+zpool_get_prop(zpool_handle_t *zhp, zpool_prop_t prop, char *buf,
+    size_t len, zprop_source_t *srctype, boolean_t literal)
  {
         uint64_t intval;
         const char *strval;
@@ -229,19 +266,18 @@ zpool_get_prop(zpool_handle_t *zhp, zpool_prop_t prop, char *buf, size_t len,
  
                 case ZPOOL_PROP_GUID:
                         intval = zpool_get_prop_int(zhp, prop, &src);
-                       (void) snprintf(buf, len, "%llu", intval);
+                       (void) snprintf(buf, len, "%llu", (u_longlong_t)intval);
                         break;
  
                 case ZPOOL_PROP_ALTROOT:
                 case ZPOOL_PROP_CACHEFILE:
+               case ZPOOL_PROP_COMMENT:
                         if (zhp->zpool_props != NULL ||
                             zpool_get_all_props(zhp) == 0) {
                                 (void) strlcpy(buf,
                                     zpool_get_prop_string(zhp, prop, &src),
                                     len);
-                               if (srctype != NULL)
-                                       *srctype = src;
-                               return (0);
+                               break;
                         }
                         /* FALLTHROUGH */
                 default:
@@ -271,18 +307,58 @@ zpool_get_prop(zpool_handle_t *zhp, zpool_prop_t prop, char *buf, size_t len,
                 case ZPOOL_PROP_SIZE:
                 case ZPOOL_PROP_ALLOCATED:
                 case ZPOOL_PROP_FREE:
-                       (void) zfs_nicenum(intval, buf, len);
+               case ZPOOL_PROP_FREEING:
+               case ZPOOL_PROP_LEAKED:
+               case ZPOOL_PROP_ASHIFT:
+                       if (literal)
+                               (void) snprintf(buf, len, "%llu",
+                                   (u_longlong_t)intval);
+                       else
+                               (void) zfs_nicenum(intval, buf, len);
+                       break;
+
+               case ZPOOL_PROP_EXPANDSZ:
+                       if (intval == 0) {
+                               (void) strlcpy(buf, "-", len);
+                       } else if (literal) {
+                               (void) snprintf(buf, len, "%llu",
+                                   (u_longlong_t)intval);
+                       } else {
+                               (void) zfs_nicebytes(intval, buf, len);
+                       }
                         break;
  
                 case ZPOOL_PROP_CAPACITY:
-                       (void) snprintf(buf, len, "%llu%%",
-                           (u_longlong_t)intval);
+                       if (literal) {
+                               (void) snprintf(buf, len, "%llu",
+                                   (u_longlong_t)intval);
+                       } else {
+                               (void) snprintf(buf, len, "%llu%%",
+                                   (u_longlong_t)intval);
+                       }
+                       break;
+
+               case ZPOOL_PROP_FRAGMENTATION:
+                       if (intval == UINT64_MAX) {
+                               (void) strlcpy(buf, "-", len);
+                       } else if (literal) {
+                               (void) snprintf(buf, len, "%llu",
+                                   (u_longlong_t)intval);
+                       } else {
+                               (void) snprintf(buf, len, "%llu%%",
+                                   (u_longlong_t)intval);
+                       }
                         break;
  
                 case ZPOOL_PROP_DEDUPRATIO:
-                       (void) snprintf(buf, len, "%llu.%02llux",
-                           (u_longlong_t)(intval / 100),
-                           (u_longlong_t)(intval % 100));
+                       if (literal)
+                               (void) snprintf(buf, len, "%llu.%02llu",
+                                   (u_longlong_t)(intval / 100),
+                                   (u_longlong_t)(intval % 100));
+                       else
+                               (void) snprintf(buf, len, "%llu.%02llux",
+                                   (u_longlong_t)(intval / 100),
+                                   (u_longlong_t)(intval % 100));
                         break;
  
                 case ZPOOL_PROP_HEALTH:
@@ -295,8 +371,14 @@ zpool_get_prop(zpool_handle_t *zhp, zpool_prop_t prop, char *buf, size_t len,
                         (void) strlcpy(buf, zpool_state_to_name(intval,
                             vs->vs_aux), len);
                         break;
+               case ZPOOL_PROP_VERSION:
+                       if (intval >= SPA_VERSION_FEATURES) {
+                               (void) snprintf(buf, len, "-");
+                               break;
+                       }
+                       /* FALLTHROUGH */
                 default:
-                       (void) snprintf(buf, len, "%llu", intval);
+                       (void) snprintf(buf, len, "%llu", (u_longlong_t)intval);
                 }
                 break;
  
@@ -337,34 +419,13 @@ bootfs_name_valid(const char *pool, char *bootfs)
         return (B_FALSE);
  }
  
-/*
- * Inspect the configuration to determine if any of the devices contain
- * an EFI label.
- */
-static boolean_t
-pool_uses_efi(nvlist_t *config)
-{
-       nvlist_t **child;
-       uint_t c, children;
-
-       if (nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_CHILDREN,
-           &child, &children) != 0)
-               return (read_efi_label(config, NULL) >= 0);
-
-       for (c = 0; c < children; c++) {
-               if (pool_uses_efi(child[c]))
-                       return (B_TRUE);
-       }
-       return (B_FALSE);
-}
-
-static boolean_t
-pool_is_bootable(zpool_handle_t *zhp)
+boolean_t
+zpool_is_bootable(zpool_handle_t *zhp)
  {
-       char bootfs[ZPOOL_MAXNAMELEN];
+       char bootfs[ZFS_MAX_DATASET_NAME_LEN];
  
         return (zpool_get_prop(zhp, ZPOOL_PROP_BOOTFS, bootfs,
-           sizeof (bootfs), NULL) == 0 && strncmp(bootfs, "-",
+           sizeof (bootfs), NULL, B_FALSE) == 0 && strncmp(bootfs, "-",
             sizeof (bootfs)) != 0);
  }
  
@@ -376,17 +437,16 @@ pool_is_bootable(zpool_handle_t *zhp)
   */
  static nvlist_t *
  zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
-    nvlist_t *props, uint64_t version, boolean_t create_or_import, char *errbuf)
+    nvlist_t *props, uint64_t version, prop_flags_t flags, char *errbuf)
  {
         nvpair_t *elem;
         nvlist_t *retprops;
         zpool_prop_t prop;
         char *strval;
         uint64_t intval;
-       char *slash;
+       char *slash, *check;
         struct stat64 statbuf;
         zpool_handle_t *zhp;
-       nvlist_t *nvroot;
  
         if (nvlist_alloc(&retprops, NV_UNIQUE_NAME, 0) != 0) {
                 (void) no_memory(hdl);
@@ -397,10 +457,48 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
         while ((elem = nvlist_next_nvpair(props, elem)) != NULL) {
                 const char *propname = nvpair_name(elem);
  
+               prop = zpool_name_to_prop(propname);
+               if (prop == ZPROP_INVAL && zpool_prop_feature(propname)) {
+                       int err;
+                       char *fname = strchr(propname, '@') + 1;
+
+                       err = zfeature_lookup_name(fname, NULL);
+                       if (err != 0) {
+                               ASSERT3U(err, ==, ENOENT);
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "invalid feature '%s'"), fname);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+
+                       if (nvpair_type(elem) != DATA_TYPE_STRING) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "'%s' must be a string"), propname);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+
+                       (void) nvpair_value_string(elem, &strval);
+                       if (strcmp(strval, ZFS_FEATURE_ENABLED) != 0 &&
+                           strcmp(strval, ZFS_FEATURE_DISABLED) != 0) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "property '%s' can only be set to "
+                                   "'enabled' or 'disabled'"), propname);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+
+                       if (nvlist_add_uint64(retprops, propname, 0) != 0) {
+                               (void) no_memory(hdl);
+                               goto error;
+                       }
+                       continue;
+               }
+
                 /*
                  * Make sure this property is valid and applies to this type.
                  */
-               if ((prop = zpool_name_to_prop(propname)) == ZPROP_INVAL) {
+               if (prop == ZPROP_INVAL) {
                         zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                             "invalid property '%s'"), propname);
                         (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
@@ -423,7 +521,8 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                  */
                 switch (prop) {
                 case ZPOOL_PROP_VERSION:
-                       if (intval < version || intval > SPA_VERSION) {
+                       if (intval < version ||
+                           !SPA_VERSION_IS_SUPPORTED(intval)) {
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "property '%s' number %d is invalid."),
                                     propname, intval);
@@ -432,8 +531,21 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                         }
                         break;
  
+               case ZPOOL_PROP_ASHIFT:
+                       if (intval != 0 &&
+                           (intval < ASHIFT_MIN || intval > ASHIFT_MAX)) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "invalid '%s=%d' property: only values "
+                                   "between %" PRId32 " and %" PRId32 " "
+                                   "are allowed.\n"),
+                                   propname, intval, ASHIFT_MIN, ASHIFT_MAX);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+                       break;
+
                 case ZPOOL_PROP_BOOTFS:
-                       if (create_or_import) {
+                       if (flags.create || flags.import) {
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "property '%s' cannot be set at creation "
                                     "or import time"), propname);
@@ -467,26 +579,11 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
                                 (void) zfs_error(hdl, EZFS_OPENFAILED, errbuf);
                                 goto error;
                         }
-                       verify(nvlist_lookup_nvlist(zpool_get_config(zhp, NULL),
-                           ZPOOL_CONFIG_VDEV_TREE, &nvroot) == 0);
-
-                       /*
-                        * bootfs property cannot be set on a disk which has
-                        * been EFI labeled.
-                        */
-                       if (pool_uses_efi(nvroot)) {
-                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "property '%s' not supported on "
-                                   "EFI labeled devices"), propname);
-                               (void) zfs_error(hdl, EZFS_POOL_NOTSUP, errbuf);
-                               zpool_close(zhp);
-                               goto error;
-                       }
                         zpool_close(zhp);
                         break;
  
                 case ZPOOL_PROP_ALTROOT:
-                       if (!create_or_import) {
+                       if (!flags.create && !flags.import) {
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "property '%s' can only be set during pool "
                                     "creation or import"), propname);
@@ -541,6 +638,57 @@ zpool_valid_proplist(libzfs_handle_t *hdl, const char *poolname,
  
                         *slash = '/';
                         break;
+
+               case ZPOOL_PROP_COMMENT:
+                       for (check = strval; *check != '\0'; check++) {
+                               if (!isprint(*check)) {
+                                       zfs_error_aux(hdl,
+                                           dgettext(TEXT_DOMAIN,
+                                           "comment may only have printable "
+                                           "characters"));
+                                       (void) zfs_error(hdl, EZFS_BADPROP,
+                                           errbuf);
+                                       goto error;
+                               }
+                       }
+                       if (strlen(strval) > ZPROP_MAX_COMMENT) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "comment must not exceed %d characters"),
+                                   ZPROP_MAX_COMMENT);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+                       break;
+               case ZPOOL_PROP_READONLY:
+                       if (!flags.import) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "property '%s' can only be set at "
+                                   "import time"), propname);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+                       break;
+               case ZPOOL_PROP_TNAME:
+                       if (!flags.create) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "property '%s' can only be set at "
+                                   "creation time"), propname);
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+                       break;
+               case ZPOOL_PROP_MULTIHOST:
+                       if (get_system_hostid() == 0) {
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "requires a non-zero system hostid"));
+                               (void) zfs_error(hdl, EZFS_BADPROP, errbuf);
+                               goto error;
+                       }
+                       break;
+               default:
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "property '%s'(%d) not defined"), propname, prop);
+                       break;
                 }
         }
  
@@ -556,12 +704,13 @@ error:
  int
  zpool_set_prop(zpool_handle_t *zhp, const char *propname, const char *propval)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         int ret = -1;
         char errbuf[1024];
         nvlist_t *nvl = NULL;
         nvlist_t *realprops;
         uint64_t version;
+       prop_flags_t flags = { 0 };
  
         (void) snprintf(errbuf, sizeof (errbuf),
             dgettext(TEXT_DOMAIN, "cannot set property for '%s'"),
@@ -577,7 +726,7 @@ zpool_set_prop(zpool_handle_t *zhp, const char *propname, const char *propval)
  
         version = zpool_get_prop_int(zhp, ZPOOL_PROP_VERSION, NULL);
         if ((realprops = zpool_valid_proplist(zhp->zpool_hdl,
-           zhp->zpool_name, nvl, version, B_FALSE, errbuf)) == NULL) {
+           zhp->zpool_name, nvl, version, flags, errbuf)) == NULL) {
                 nvlist_free(nvl);
                 return (-1);
         }
@@ -614,10 +763,79 @@ zpool_expand_proplist(zpool_handle_t *zhp, zprop_list_t **plp)
         libzfs_handle_t *hdl = zhp->zpool_hdl;
         zprop_list_t *entry;
         char buf[ZFS_MAXPROPLEN];
+       nvlist_t *features = NULL;
+       nvpair_t *nvp;
+       zprop_list_t **last;
+       boolean_t firstexpand = (NULL == *plp);
+       int i;
  
         if (zprop_expand_list(hdl, plp, ZFS_TYPE_POOL) != 0)
                 return (-1);
  
+       last = plp;
+       while (*last != NULL)
+               last = &(*last)->pl_next;
+
+       if ((*plp)->pl_all)
+               features = zpool_get_features(zhp);
+
+       if ((*plp)->pl_all && firstexpand) {
+               for (i = 0; i < SPA_FEATURES; i++) {
+                       zprop_list_t *entry = zfs_alloc(hdl,
+                           sizeof (zprop_list_t));
+                       entry->pl_prop = ZPROP_INVAL;
+                       entry->pl_user_prop = zfs_asprintf(hdl, "feature@%s",
+                           spa_feature_table[i].fi_uname);
+                       entry->pl_width = strlen(entry->pl_user_prop);
+                       entry->pl_all = B_TRUE;
+
+                       *last = entry;
+                       last = &entry->pl_next;
+               }
+       }
+
+       /* add any unsupported features */
+       for (nvp = nvlist_next_nvpair(features, NULL);
+           nvp != NULL; nvp = nvlist_next_nvpair(features, nvp)) {
+               char *propname;
+               boolean_t found;
+               zprop_list_t *entry;
+
+               if (zfeature_is_supported(nvpair_name(nvp)))
+                       continue;
+
+               propname = zfs_asprintf(hdl, "unsupported@%s",
+                   nvpair_name(nvp));
+
+               /*
+                * Before adding the property to the list make sure that no
+                * other pool already added the same property.
+                */
+               found = B_FALSE;
+               entry = *plp;
+               while (entry != NULL) {
+                       if (entry->pl_user_prop != NULL &&
+                           strcmp(propname, entry->pl_user_prop) == 0) {
+                               found = B_TRUE;
+                               break;
+                       }
+                       entry = entry->pl_next;
+               }
+               if (found) {
+                       free(propname);
+                       continue;
+               }
+
+               entry = zfs_alloc(hdl, sizeof (zprop_list_t));
+               entry->pl_prop = ZPROP_INVAL;
+               entry->pl_user_prop = propname;
+               entry->pl_width = strlen(entry->pl_user_prop);
+               entry->pl_all = B_TRUE;
+
+               *last = entry;
+               last = &entry->pl_next;
+       }
+
         for (entry = *plp; entry != NULL; entry = entry->pl_next) {
  
                 if (entry->pl_fixed)
@@ -625,7 +843,7 @@ zpool_expand_proplist(zpool_handle_t *zhp, zprop_list_t **plp)
  
                 if (entry->pl_prop != ZPROP_INVAL &&
                     zpool_get_prop(zhp, entry->pl_prop, buf, sizeof (buf),
-                   NULL) == 0) {
+                   NULL, B_FALSE) == 0) {
                         if (strlen(buf) > entry->pl_width)
                                 entry->pl_width = strlen(buf);
                 }
@@ -634,12 +852,77 @@ zpool_expand_proplist(zpool_handle_t *zhp, zprop_list_t **plp)
         return (0);
  }
  
+/*
+ * Get the state for the given feature on the given ZFS pool.
+ *
+ * 'propname' is either a "feature@..." or an "unsupported@..." property
+ * name; the text following the '@' selects the feature.  The resulting
+ * state string is written into 'buf', which is 'len' bytes long; every
+ * write is bounded by 'len'.
+ *
+ * Returns 0 on success.  Returns ENOTSUP, with "-" stored in 'buf', when a
+ * feature@ name is rejected by zfeature_lookup_name() or when an
+ * unsupported@ entry is not present in the pool's feature list.
+ */
+int
+zpool_prop_get_feature(zpool_handle_t *zhp, const char *propname, char *buf,
+    size_t len)
+{
+       uint64_t refcount;
+       boolean_t found = B_FALSE;
+       nvlist_t *features = zpool_get_features(zhp);
+       boolean_t supported;
+       const char *feature = strchr(propname, '@') + 1;
+
+       supported = zpool_prop_feature(propname);
+       ASSERT(supported || zpool_prop_unsupported(propname));
+
+       /*
+        * Convert from feature name to feature guid. This conversion is
+        * unnecessary for unsupported@... properties because they already
+        * use guids.
+        */
+       if (supported) {
+               int ret;
+               spa_feature_t fid;
+
+               ret = zfeature_lookup_name(feature, &fid);
+               if (ret != 0) {
+                       (void) strlcpy(buf, "-", len);
+                       return (ENOTSUP);
+               }
+               feature = spa_feature_table[fid].fi_guid;
+       }
+
+       /* The feature list maps each guid to its reference count. */
+       if (nvlist_lookup_uint64(features, feature, &refcount) == 0)
+               found = B_TRUE;
+
+       if (supported) {
+               /* A known feature missing from the list is disabled. */
+               if (!found) {
+                       (void) strlcpy(buf, ZFS_FEATURE_DISABLED, len);
+               } else  {
+                       if (refcount == 0)
+                               (void) strlcpy(buf, ZFS_FEATURE_ENABLED, len);
+                       else
+                               (void) strlcpy(buf, ZFS_FEATURE_ACTIVE, len);
+               }
+       } else {
+               if (found) {
+                       /*
+                        * Use strlcpy() like every other write to 'buf' so
+                        * that a short caller buffer is truncated rather
+                        * than overrun.
+                        */
+                       if (refcount == 0) {
+                               (void) strlcpy(buf, ZFS_UNSUPPORTED_INACTIVE,
+                                   len);
+                       } else {
+                               (void) strlcpy(buf, ZFS_UNSUPPORTED_READONLY,
+                                   len);
+                       }
+               } else {
+                       (void) strlcpy(buf, "-", len);
+                       return (ENOTSUP);
+               }
+       }
+
+       return (0);
+}
  
  /*
   * Don't start the slice at the default block of 34; many storage
- * devices will use a stripe width of 128k, so start there instead.
+ * devices will use a stripe width of 128k, other vendors prefer a 1m
+ * alignment.  It is best to play it safe and ensure a 1m alignment
+ * given 512B blocks.  When the block size is larger by a power of 2
+ * we will still be 1m aligned.  Some devices are sensitive to the
+ * partition ending alignment as well.
   */
-#define        NEW_START_BLOCK 256
+#define        NEW_START_BLOCK         2048
+#define        PARTITION_END_ALIGNMENT 2048
  
  /*
   * Validate the given pool name, optionally putting an extended error message in
@@ -716,11 +999,21 @@ zpool_name_valid(libzfs_handle_t *hdl, boolean_t isopen, const char *pool)
                                     "trailing slash in name"));
                                 break;
  
-                       case NAME_ERR_MULTIPLE_AT:
+                       case NAME_ERR_MULTIPLE_DELIMITERS:
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "multiple '@' and/or '#' delimiters in "
+                                   "name"));
+                               break;
+
+                       case NAME_ERR_NO_AT:
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "multiple '@' delimiters in name"));
+                                   "permission set is missing '@'"));
                                 break;
  
+                       default:
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "(%d) not defined"), why);
+                               break;
                         }
                 }
                 return (B_FALSE);
@@ -830,12 +1123,9 @@ zpool_open(libzfs_handle_t *hdl, const char *pool)
  void
  zpool_close(zpool_handle_t *zhp)
  {
-       if (zhp->zpool_config)
-               nvlist_free(zhp->zpool_config);
-       if (zhp->zpool_old_config)
-               nvlist_free(zhp->zpool_old_config);
-       if (zhp->zpool_props)
-               nvlist_free(zhp->zpool_props);
+       nvlist_free(zhp->zpool_config);
+       nvlist_free(zhp->zpool_old_config);
+       nvlist_free(zhp->zpool_props);
         free(zhp);
  }
  
@@ -867,11 +1157,10 @@ int
  zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
      nvlist_t *props, nvlist_t *fsprops)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         nvlist_t *zc_fsprops = NULL;
         nvlist_t *zc_props = NULL;
         char msg[1024];
-       char *altroot;
         int ret = -1;
  
         (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
@@ -884,8 +1173,10 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                 return (-1);
  
         if (props) {
+               prop_flags_t flags = { .create = B_TRUE, .import = B_FALSE };
+
                 if ((zc_props = zpool_valid_proplist(hdl, pool, props,
-                   SPA_VERSION_1, B_TRUE, msg)) == NULL) {
+                   SPA_VERSION_1, flags, msg)) == NULL) {
                         goto create_failed;
                 }
         }
@@ -898,8 +1189,8 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                     zfs_prop_to_name(ZFS_PROP_ZONED), &zonestr) == 0) &&
                     strcmp(zonestr, "on") == 0);
  
-               if ((zc_fsprops = zfs_valid_proplist(hdl,
-                   ZFS_TYPE_FILESYSTEM, fsprops, zoned, NULL, msg)) == NULL) {
+               if ((zc_fsprops = zfs_valid_proplist(hdl, ZFS_TYPE_FILESYSTEM,
+                   fsprops, zoned, NULL, NULL, msg)) == NULL) {
                         goto create_failed;
                 }
                 if (!zc_props &&
@@ -929,12 +1220,30 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                          * This can happen if the user has specified the same
                          * device multiple times.  We can't reliably detect this
                          * until we try to add it and see we already have a
-                        * label.
+                        * label.  This can also happen if the device is
+                        * part of an active md or lvm device.
                          */
                         zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                           "one or more vdevs refer to the same device"));
+                           "one or more vdevs refer to the same device, or "
+                           "one of\nthe devices is part of an active md or "
+                           "lvm device"));
                         return (zfs_error(hdl, EZFS_BADDEV, msg));
  
+               case ERANGE:
+                       /*
+                        * This happens if the record size is smaller or larger
+                        * than the allowed size range, or not a power of 2.
+                        *
+                        * NOTE: although zfs_valid_proplist is called earlier,
+                        * this case may have slipped through since the
+                        * pool does not exist yet and it is therefore
+                        * impossible to read properties e.g. max blocksize
+                        * from the pool.
+                        */
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "record size invalid"));
+                       return (zfs_error(hdl, EZFS_BADPROP, msg));
+
                 case EOVERFLOW:
                         /*
                          * This occurs when one of the devices is below
@@ -945,7 +1254,8 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                         {
                                 char buf[64];
  
-                               zfs_nicenum(SPA_MINDEVSIZE, buf, sizeof (buf));
+                               zfs_nicebytes(SPA_MINDEVSIZE, buf,
+                                   sizeof (buf));
  
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "one or more devices is less than the "
@@ -968,21 +1278,6 @@ zpool_create(libzfs_handle_t *hdl, const char *pool, nvlist_t *nvroot,
                 }
         }
  
-       /*
-        * If this is an alternate root pool, then we automatically set the
-        * mountpoint of the root dataset to be '/'.
-        */
-       if (nvlist_lookup_string(props, zpool_prop_to_name(ZPOOL_PROP_ALTROOT),
-           &altroot) == 0) {
-               zfs_handle_t *zhp;
-
-               verify((zhp = zfs_open(hdl, pool, ZFS_TYPE_DATASET)) != NULL);
-               verify(zfs_prop_set(zhp, zfs_prop_to_name(ZFS_PROP_MOUNTPOINT),
-                   "/") == 0);
-
-               zfs_close(zhp);
-       }
-
  create_failed:
         zcmd_free_nvlists(&zc);
         nvlist_free(zc_props);
@@ -995,21 +1290,21 @@ create_failed:
   * datasets left in the pool.
   */
  int
-zpool_destroy(zpool_handle_t *zhp)
+zpool_destroy(zpool_handle_t *zhp, const char *log_str)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         zfs_handle_t *zfp = NULL;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
         char msg[1024];
  
         if (zhp->zpool_state == POOL_STATE_ACTIVE &&
-           (zfp = zfs_open(zhp->zpool_hdl, zhp->zpool_name,
-           ZFS_TYPE_FILESYSTEM)) == NULL)
+           (zfp = zfs_open(hdl, zhp->zpool_name, ZFS_TYPE_FILESYSTEM)) == NULL)
                 return (-1);
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
+       zc.zc_history = (uint64_t)(uintptr_t)log_str;
  
-       if (zfs_ioctl(zhp->zpool_hdl, ZFS_IOC_POOL_DESTROY, &zc) != 0) {
+       if (zfs_ioctl(hdl, ZFS_IOC_POOL_DESTROY, &zc) != 0) {
                 (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
                     "cannot destroy '%s'"), zhp->zpool_name);
  
@@ -1041,7 +1336,7 @@ zpool_destroy(zpool_handle_t *zhp)
  int
  zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         int ret;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
         char msg[1024];
@@ -1060,25 +1355,6 @@ zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
                 return (zfs_error(hdl, EZFS_BADVERSION, msg));
         }
  
-       if (pool_is_bootable(zhp) && nvlist_lookup_nvlist_array(nvroot,
-           ZPOOL_CONFIG_SPARES, &spares, &nspares) == 0) {
-               uint64_t s;
-
-               for (s = 0; s < nspares; s++) {
-                       char *path;
-
-                       if (nvlist_lookup_string(spares[s], ZPOOL_CONFIG_PATH,
-                           &path) == 0 && pool_uses_efi(spares[s])) {
-                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                                   "device '%s' contains an EFI label and "
-                                   "cannot be used on root pools."),
-                                   zpool_vdev_name(hdl, NULL, spares[s],
-                                   B_FALSE));
-                               return (zfs_error(hdl, EZFS_POOL_NOTSUP, msg));
-                       }
-               }
-       }
-
         if (zpool_get_prop_int(zhp, ZPOOL_PROP_VERSION, NULL) <
             SPA_VERSION_L2CACHE &&
             nvlist_lookup_nvlist_array(nvroot, ZPOOL_CONFIG_L2CACHE,
@@ -1092,7 +1368,7 @@ zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
                 return (-1);
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
  
-       if (zfs_ioctl(zhp->zpool_hdl, ZFS_IOC_VDEV_ADD, &zc) != 0) {
+       if (zfs_ioctl(hdl, ZFS_IOC_VDEV_ADD, &zc) != 0) {
                 switch (errno) {
                 case EBUSY:
                         /*
@@ -1116,7 +1392,8 @@ zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
                         {
                                 char buf[64];
  
-                               zfs_nicenum(SPA_MINDEVSIZE, buf, sizeof (buf));
+                               zfs_nicebytes(SPA_MINDEVSIZE, buf,
+                                   sizeof (buf));
  
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "device is less than the minimum "
@@ -1131,13 +1408,6 @@ zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
                         (void) zfs_error(hdl, EZFS_BADVERSION, msg);
                         break;
  
-               case EDOM:
-                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                           "root pool can not have multiple vdevs"
-                           " or separate logs"));
-                       (void) zfs_error(hdl, EZFS_POOL_NOTSUP, msg);
-                       break;
-
                 case ENOTBLK:
                         zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                             "cache device must be a disk or disk slice"));
@@ -1162,10 +1432,11 @@ zpool_add(zpool_handle_t *zhp, nvlist_t *nvroot)
   * Exports the pool from the system.  The caller must ensure that there are no
   * mounted datasets in the pool.
   */
-int
-zpool_export_common(zpool_handle_t *zhp, boolean_t force, boolean_t hardforce)
+static int
+zpool_export_common(zpool_handle_t *zhp, boolean_t force, boolean_t hardforce,
+    const char *log_str)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
  
         (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
@@ -1174,6 +1445,7 @@ zpool_export_common(zpool_handle_t *zhp, boolean_t force, boolean_t hardforce)
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         zc.zc_cookie = force;
         zc.zc_guid = hardforce;
+       zc.zc_history = (uint64_t)(uintptr_t)log_str;
  
         if (zfs_ioctl(zhp->zpool_hdl, ZFS_IOC_POOL_EXPORT, &zc) != 0) {
                 switch (errno) {
@@ -1195,35 +1467,41 @@ zpool_export_common(zpool_handle_t *zhp, boolean_t force, boolean_t hardforce)
  }
  
  int
-zpool_export(zpool_handle_t *zhp, boolean_t force)
+zpool_export(zpool_handle_t *zhp, boolean_t force, const char *log_str)
  {
-       return (zpool_export_common(zhp, force, B_FALSE));
+       return (zpool_export_common(zhp, force, B_FALSE, log_str));
  }
  
  int
-zpool_export_force(zpool_handle_t *zhp)
+zpool_export_force(zpool_handle_t *zhp, const char *log_str)
  {
-       return (zpool_export_common(zhp, B_TRUE, B_TRUE));
+       return (zpool_export_common(zhp, B_TRUE, B_TRUE, log_str));
  }
  
  static void
  zpool_rewind_exclaim(libzfs_handle_t *hdl, const char *name, boolean_t dryrun,
-    nvlist_t *rbi)
+    nvlist_t *config)
  {
+       nvlist_t *nv = NULL;
         uint64_t rewindto;
         int64_t loss = -1;
         struct tm t;
         char timestr[128];
  
-       if (!hdl->libzfs_printerr || rbi == NULL)
+       if (!hdl->libzfs_printerr || config == NULL)
                 return;
  
-       if (nvlist_lookup_uint64(rbi, ZPOOL_CONFIG_LOAD_TIME, &rewindto) != 0)
+       if (nvlist_lookup_nvlist(config, ZPOOL_CONFIG_LOAD_INFO, &nv) != 0 ||
+           nvlist_lookup_nvlist(nv, ZPOOL_CONFIG_REWIND_INFO, &nv) != 0) {
                 return;
-       (void) nvlist_lookup_int64(rbi, ZPOOL_CONFIG_REWIND_TIME, &loss);
+       }
+
+       if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_LOAD_TIME, &rewindto) != 0)
+               return;
+       (void) nvlist_lookup_int64(nv, ZPOOL_CONFIG_REWIND_TIME, &loss);
  
         if (localtime_r((time_t *)&rewindto, &t) != NULL &&
-           strftime(timestr, 128, 0, &t) != 0) {
+           strftime(timestr, 128, "%c", &t) != 0) {
                 if (dryrun) {
                         (void) printf(dgettext(TEXT_DOMAIN,
                             "Would be able to return %s "
@@ -1238,13 +1516,14 @@ zpool_rewind_exclaim(libzfs_handle_t *hdl, const char *name, boolean_t dryrun,
                         (void) printf(dgettext(TEXT_DOMAIN,
                             "%s approximately %lld "),
                             dryrun ? "Would discard" : "Discarded",
-                           (loss + 30) / 60);
+                           ((longlong_t)loss + 30) / 60);
                         (void) printf(dgettext(TEXT_DOMAIN,
                             "minutes of transactions.\n"));
                 } else if (loss > 0) {
                         (void) printf(dgettext(TEXT_DOMAIN,
                             "%s approximately %lld "),
-                           dryrun ? "Would discard" : "Discarded", loss);
+                           dryrun ? "Would discard" : "Discarded",
+                           (longlong_t)loss);
                         (void) printf(dgettext(TEXT_DOMAIN,
                             "seconds of transactions.\n"));
                 }
@@ -1255,6 +1534,7 @@ void
  zpool_explain_recover(libzfs_handle_t *hdl, const char *name, int reason,
      nvlist_t *config)
  {
+       nvlist_t *nv = NULL;
         int64_t loss = -1;
         uint64_t edata = UINT64_MAX;
         uint64_t rewindto;
@@ -1270,19 +1550,20 @@ zpool_explain_recover(libzfs_handle_t *hdl, const char *name, int reason,
                 (void) printf(dgettext(TEXT_DOMAIN, "\t"));
  
         /* All attempted rewinds failed if ZPOOL_CONFIG_LOAD_TIME missing */
-       if (nvlist_lookup_uint64(config,
-           ZPOOL_CONFIG_LOAD_TIME, &rewindto) != 0)
+       if (nvlist_lookup_nvlist(config, ZPOOL_CONFIG_LOAD_INFO, &nv) != 0 ||
+           nvlist_lookup_nvlist(nv, ZPOOL_CONFIG_REWIND_INFO, &nv) != 0 ||
+           nvlist_lookup_uint64(nv, ZPOOL_CONFIG_LOAD_TIME, &rewindto) != 0)
                 goto no_info;
  
-       (void) nvlist_lookup_int64(config, ZPOOL_CONFIG_REWIND_TIME, &loss);
-       (void) nvlist_lookup_uint64(config, ZPOOL_CONFIG_LOAD_DATA_ERRORS,
+       (void) nvlist_lookup_int64(nv, ZPOOL_CONFIG_REWIND_TIME, &loss);
+       (void) nvlist_lookup_uint64(nv, ZPOOL_CONFIG_LOAD_DATA_ERRORS,
             &edata);
  
         (void) printf(dgettext(TEXT_DOMAIN,
             "Recovery is possible, but will result in some data loss.\n"));
  
         if (localtime_r((time_t *)&rewindto, &t) != NULL &&
-           strftime(timestr, 128, 0, &t) != 0) {
+           strftime(timestr, 128, "%c", &t) != 0) {
                 (void) printf(dgettext(TEXT_DOMAIN,
                     "\tReturning the pool to its state as of %s\n"
                     "\tshould correct the problem.  "),
@@ -1296,11 +1577,13 @@ zpool_explain_recover(libzfs_handle_t *hdl, const char *name, int reason,
         if (loss > 120) {
                 (void) printf(dgettext(TEXT_DOMAIN,
                     "Approximately %lld minutes of data\n"
-                   "\tmust be discarded, irreversibly.  "), (loss + 30) / 60);
+                   "\tmust be discarded, irreversibly.  "),
+                   ((longlong_t)loss + 30) / 60);
         } else if (loss > 0) {
                 (void) printf(dgettext(TEXT_DOMAIN,
                     "Approximately %lld seconds of data\n"
-                   "\tmust be discarded, irreversibly.  "), loss);
+                   "\tmust be discarded, irreversibly.  "),
+                   (longlong_t)loss);
         }
         if (edata != 0 && edata != UINT64_MAX) {
                 if (edata == 1) {
@@ -1359,12 +1642,64 @@ zpool_import(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                 }
         }
  
-       ret = zpool_import_props(hdl, config, newname, props, B_FALSE);
-       if (props)
-               nvlist_free(props);
+       ret = zpool_import_props(hdl, config, newname, props,
+           ZFS_IMPORT_NORMAL);
+       nvlist_free(props);
         return (ret);
  }
  
+static void
+print_vdev_tree(libzfs_handle_t *hdl, const char *name, nvlist_t *nv,
+    int indent)
+{
+       nvlist_t **child;
+       uint_t c, children;
+       char *vname;
+       uint64_t is_log = 0;
+
+       (void) nvlist_lookup_uint64(nv, ZPOOL_CONFIG_IS_LOG,
+           &is_log);
+
+       if (name != NULL)
+               (void) printf("\t%*s%s%s\n", indent, "", name,
+                   is_log ? " [log]" : "");
+
+       if (nvlist_lookup_nvlist_array(nv, ZPOOL_CONFIG_CHILDREN,
+           &child, &children) != 0)
+               return;
+
+       for (c = 0; c < children; c++) {
+               vname = zpool_vdev_name(hdl, NULL, child[c], VDEV_NAME_TYPE_ID);
+               print_vdev_tree(hdl, vname, child[c], indent + 2);
+               free(vname);
+       }
+}
+
+void
+zpool_print_unsup_feat(nvlist_t *config)
+{
+       nvlist_t *nvinfo, *unsup_feat;
+       nvpair_t *nvp;
+
+       verify(nvlist_lookup_nvlist(config, ZPOOL_CONFIG_LOAD_INFO, &nvinfo) ==
+           0);
+       verify(nvlist_lookup_nvlist(nvinfo, ZPOOL_CONFIG_UNSUP_FEAT,
+           &unsup_feat) == 0);
+
+       for (nvp = nvlist_next_nvpair(unsup_feat, NULL); nvp != NULL;
+           nvp = nvlist_next_nvpair(unsup_feat, nvp)) {
+               char *desc;
+
+               verify(nvpair_type(nvp) == DATA_TYPE_STRING);
+               verify(nvpair_value_string(nvp, &desc) == 0);
+
+               if (strlen(desc) > 0)
+                       (void) printf("\t%s (%s)\n", nvpair_name(nvp), desc);
+               else
+                       (void) printf("\t%s\n", nvpair_name(nvp));
+       }
+}
+
  /*
   * Import the given pool using the known configuration and a list of
   * properties to be set. The configuration should have come from
@@ -1373,15 +1708,17 @@ zpool_import(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
   */
  int
  zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
-    nvlist_t *props, boolean_t importfaulted)
+    nvlist_t *props, int flags)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         zpool_rewind_policy_t policy;
-       nvlist_t *nvi = NULL;
+       nvlist_t *nv = NULL;
+       nvlist_t *nvinfo = NULL;
+       nvlist_t *missing = NULL;
         char *thename;
         char *origname;
-       uint64_t returned_size;
         int ret;
+       int error = 0;
         char errbuf[1024];
  
         verify(nvlist_lookup_string(config, ZPOOL_CONFIG_POOL_NAME,
@@ -1400,19 +1737,21 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                 thename = origname;
         }
  
-       if (props) {
+       if (props != NULL) {
                 uint64_t version;
+               prop_flags_t flags = { .create = B_FALSE, .import = B_TRUE };
  
                 verify(nvlist_lookup_uint64(config, ZPOOL_CONFIG_VERSION,
                     &version) == 0);
  
                 if ((props = zpool_valid_proplist(hdl, origname,
-                   props, version, B_TRUE, errbuf)) == NULL) {
+                   props, version, flags, errbuf)) == NULL)
                         return (-1);
-               } else if (zcmd_write_src_nvlist(hdl, &zc, props) != 0) {
+               if (zcmd_write_src_nvlist(hdl, &zc, props) != 0) {
                         nvlist_free(props);
                         return (-1);
                 }
+               nvlist_free(props);
         }
  
         (void) strlcpy(zc.zc_name, thename, sizeof (zc.zc_name));
@@ -1421,30 +1760,43 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
             &zc.zc_guid) == 0);
  
         if (zcmd_write_conf_nvlist(hdl, &zc, config) != 0) {
-               nvlist_free(props);
+               zcmd_free_nvlists(&zc);
                 return (-1);
         }
-       returned_size =  zc.zc_nvlist_conf_size + 512;
-       if (zcmd_alloc_dst_nvlist(hdl, &zc, returned_size) != 0) {
-               nvlist_free(props);
+       if (zcmd_alloc_dst_nvlist(hdl, &zc, zc.zc_nvlist_conf_size * 2) != 0) {
+               zcmd_free_nvlists(&zc);
                 return (-1);
         }
  
-       zc.zc_cookie = (uint64_t)importfaulted;
-       ret = 0;
-       if (zfs_ioctl(hdl, ZFS_IOC_POOL_IMPORT, &zc) != 0) {
+       zc.zc_cookie = flags;
+       while ((ret = zfs_ioctl(hdl, ZFS_IOC_POOL_IMPORT, &zc)) != 0 &&
+           errno == ENOMEM) {
+               if (zcmd_expand_dst_nvlist(hdl, &zc) != 0) {
+                       zcmd_free_nvlists(&zc);
+                       return (-1);
+               }
+       }
+       if (ret != 0)
+               error = errno;
+
+       (void) zcmd_read_dst_nvlist(hdl, &zc, &nv);
+
+       zcmd_free_nvlists(&zc);
+
+       zpool_get_rewind_policy(config, &policy);
+
+       if (error) {
                 char desc[1024];
+               char aux[256];
  
-               (void) zcmd_read_dst_nvlist(hdl, &zc, &nvi);
-               zpool_get_rewind_policy(config, &policy);
                 /*
                  * Dry-run failed, but we print out what success
                  * looks like if we found a best txg
                  */
-               if ((policy.zrp_request & ZPOOL_TRY_REWIND) && nvi) {
+               if (policy.zrp_request & ZPOOL_TRY_REWIND) {
                         zpool_rewind_exclaim(hdl, newname ? origname : thename,
-                           B_TRUE, nvi);
-                       nvlist_free(nvi);
+                           B_TRUE, nv);
+                       nvlist_free(nv);
                         return (-1);
                 }
  
@@ -1457,14 +1809,71 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                             dgettext(TEXT_DOMAIN, "cannot import '%s' as '%s'"),
                             origname, thename);
  
-               switch (errno) {
+               switch (error) {
                 case ENOTSUP:
+                       if (nv != NULL && nvlist_lookup_nvlist(nv,
+                           ZPOOL_CONFIG_LOAD_INFO, &nvinfo) == 0 &&
+                           nvlist_exists(nvinfo, ZPOOL_CONFIG_UNSUP_FEAT)) {
+                               (void) printf(dgettext(TEXT_DOMAIN, "This "
+                                   "pool uses the following feature(s) not "
+                                   "supported by this system:\n"));
+                               zpool_print_unsup_feat(nv);
+                               if (nvlist_exists(nvinfo,
+                                   ZPOOL_CONFIG_CAN_RDONLY)) {
+                                       (void) printf(dgettext(TEXT_DOMAIN,
+                                           "All unsupported features are only "
+                                           "required for writing to the pool."
+                                           "\nThe pool can be imported using "
+                                           "'-o readonly=on'.\n"));
+                               }
+                       }
                         /*
                          * Unsupported version.
                          */
                         (void) zfs_error(hdl, EZFS_BADVERSION, desc);
                         break;
  
+               case EREMOTEIO:
+                       if (nv != NULL && nvlist_lookup_nvlist(nv,
+                           ZPOOL_CONFIG_LOAD_INFO, &nvinfo) == 0) {
+                               char *hostname = "<unknown>";
+                               uint64_t hostid = 0;
+                               mmp_state_t mmp_state;
+
+                               mmp_state = fnvlist_lookup_uint64(nvinfo,
+                                   ZPOOL_CONFIG_MMP_STATE);
+
+                               if (nvlist_exists(nvinfo,
+                                   ZPOOL_CONFIG_MMP_HOSTNAME))
+                                       hostname = fnvlist_lookup_string(nvinfo,
+                                           ZPOOL_CONFIG_MMP_HOSTNAME);
+
+                               if (nvlist_exists(nvinfo,
+                                   ZPOOL_CONFIG_MMP_HOSTID))
+                                       hostid = fnvlist_lookup_uint64(nvinfo,
+                                           ZPOOL_CONFIG_MMP_HOSTID);
+
+                               if (mmp_state == MMP_STATE_ACTIVE) {
+                                       (void) snprintf(aux, sizeof (aux),
+                                           dgettext(TEXT_DOMAIN, "pool is imp"
+                                           "orted on host '%s' (hostid=%lx).\n"
+                                           "Export the pool on the other "
+                                           "system, then run 'zpool import'."),
+                                           hostname, (unsigned long) hostid);
+                               } else if (mmp_state == MMP_STATE_NO_HOSTID) {
+                                       (void) snprintf(aux, sizeof (aux),
+                                           dgettext(TEXT_DOMAIN, "pool has "
+                                           "the multihost property on and "
+                                           "the\nsystem's hostid is not set. "
+                                           "Set a unique system hostid with "
+                                           "the zgenhostid(8) command.\n"));
+                               }
+
+                               (void) zfs_error_aux(hdl, aux);
+                       }
+                       (void) zfs_error(hdl, EZFS_ACTIVE_POOL, desc);
+                       break;
+
                 case EINVAL:
                         (void) zfs_error(hdl, EZFS_INVALCONFIG, desc);
                         break;
@@ -1475,18 +1884,46 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                         (void) zfs_error(hdl, EZFS_BADDEV, desc);
                         break;
  
-               default:
-                       (void) zcmd_read_dst_nvlist(hdl, &zc, &nvi);
-                       (void) zpool_standard_error(hdl, errno, desc);
-                       zpool_explain_recover(hdl,
-                           newname ? origname : thename, -errno, nvi);
-                       nvlist_free(nvi);
+               case ENXIO:
+                       if (nv && nvlist_lookup_nvlist(nv,
+                           ZPOOL_CONFIG_LOAD_INFO, &nvinfo) == 0 &&
+                           nvlist_lookup_nvlist(nvinfo,
+                           ZPOOL_CONFIG_MISSING_DEVICES, &missing) == 0) {
+                               (void) printf(dgettext(TEXT_DOMAIN,
+                                   "The devices below are missing, use "
+                                   "'-m' to import the pool anyway:\n"));
+                               print_vdev_tree(hdl, NULL, missing, 2);
+                               (void) printf("\n");
+                       }
+                       (void) zpool_standard_error(hdl, error, desc);
                         break;
-               }
  
-               ret = -1;
-       } else {
-               zpool_handle_t *zhp;
+               case EEXIST:
+                       (void) zpool_standard_error(hdl, error, desc);
+                       break;
+
+               case EBUSY:
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "one or more devices are already in use\n"));
+                       (void) zfs_error(hdl, EZFS_BADDEV, desc);
+                       break;
+               case ENAMETOOLONG:
+                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                           "new name of at least one dataset is longer than "
+                           "the maximum allowable length"));
+                       (void) zfs_error(hdl, EZFS_NAMETOOLONG, desc);
+                       break;
+               default:
+                       (void) zpool_standard_error(hdl, error, desc);
+                       zpool_explain_recover(hdl,
+                           newname ? origname : thename, -error, nv);
+                       break;
+               }
+
+               nvlist_free(nv);
+               ret = -1;
+       } else {
+               zpool_handle_t *zhp;
  
                 /*
                  * This should never fail, but play it safe anyway.
@@ -1495,21 +1932,15 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
                         ret = -1;
                 else if (zhp != NULL)
                         zpool_close(zhp);
-               (void) zcmd_read_dst_nvlist(hdl, &zc, &nvi);
-               zpool_get_rewind_policy(config, &policy);
                 if (policy.zrp_request &
                     (ZPOOL_DO_REWIND | ZPOOL_TRY_REWIND)) {
                         zpool_rewind_exclaim(hdl, newname ? origname : thename,
-                           ((policy.zrp_request & ZPOOL_TRY_REWIND) != 0),
-                           nvi);
+                           ((policy.zrp_request & ZPOOL_TRY_REWIND) != 0), nv);
                 }
-               nvlist_free(nvi);
+               nvlist_free(nv);
                 return (0);
         }
  
-       zcmd_free_nvlists(&zc);
-       nvlist_free(props);
-
         return (ret);
  }
  
@@ -1517,22 +1948,39 @@ zpool_import_props(libzfs_handle_t *hdl, nvlist_t *config, const char *newname,
   * Scan the pool.
   */
  int
-zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func)
+zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func, pool_scrub_cmd_t cmd)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
+       int err;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         zc.zc_cookie = func;
+       zc.zc_flags = cmd;
  
-       if (zfs_ioctl(zhp->zpool_hdl, ZFS_IOC_POOL_SCAN, &zc) == 0 ||
-           (errno == ENOENT && func != POOL_SCAN_NONE))
+       if (zfs_ioctl(hdl, ZFS_IOC_POOL_SCAN, &zc) == 0)
+               return (0);
+
+       err = errno;
+
+       /* ECANCELED on a scrub means we resumed a paused scrub */
+       if (err == ECANCELED && func == POOL_SCAN_SCRUB &&
+           cmd == POOL_SCRUB_NORMAL)
+               return (0);
+
+       if (err == ENOENT && func != POOL_SCAN_NONE && cmd == POOL_SCRUB_NORMAL)
                 return (0);
  
         if (func == POOL_SCAN_SCRUB) {
-               (void) snprintf(msg, sizeof (msg),
-                   dgettext(TEXT_DOMAIN, "cannot scrub %s"), zc.zc_name);
+               if (cmd == POOL_SCRUB_PAUSE) {
+                       (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
+                           "cannot pause scrubbing %s"), zc.zc_name);
+               } else {
+                       assert(cmd == POOL_SCRUB_NORMAL);
+                       (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
+                           "cannot scrub %s"), zc.zc_name);
+               }
         } else if (func == POOL_SCAN_NONE) {
                 (void) snprintf(msg, sizeof (msg),
                     dgettext(TEXT_DOMAIN, "cannot cancel scrubbing %s"),
@@ -1541,7 +1989,7 @@ zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func)
                 assert(!"unexpected result");
         }
  
-       if (errno == EBUSY) {
+       if (err == EBUSY) {
                 nvlist_t *nvroot;
                 pool_scan_stat_t *ps = NULL;
                 uint_t psc;
@@ -1550,49 +1998,21 @@ zpool_scan(zpool_handle_t *zhp, pool_scan_func_t func)
                     ZPOOL_CONFIG_VDEV_TREE, &nvroot) == 0);
                 (void) nvlist_lookup_uint64_array(nvroot,
                     ZPOOL_CONFIG_SCAN_STATS, (uint64_t **)&ps, &psc);
-               if (ps && ps->pss_func == POOL_SCAN_SCRUB)
-                       return (zfs_error(hdl, EZFS_SCRUBBING, msg));
-               else
+               if (ps && ps->pss_func == POOL_SCAN_SCRUB) {
+                       if (cmd == POOL_SCRUB_PAUSE)
+                               return (zfs_error(hdl, EZFS_SCRUB_PAUSED, msg));
+                       else
+                               return (zfs_error(hdl, EZFS_SCRUBBING, msg));
+               } else {
                         return (zfs_error(hdl, EZFS_RESILVERING, msg));
-       } else if (errno == ENOENT) {
+               }
+       } else if (err == ENOENT) {
                 return (zfs_error(hdl, EZFS_NO_SCRUB, msg));
         } else {
-               return (zpool_standard_error(hdl, errno, msg));
+               return (zpool_standard_error(hdl, err, msg));
         }
  }
  
-/*
- * This provides a very minimal check whether a given string is likely a
- * c#t#d# style string.  Users of this are expected to do their own
- * verification of the s# part.
- */
-#define        CTD_CHECK(str)  (str && str[0] == 'c' && isdigit(str[1]))
-
-/*
- * More elaborate version for ones which may start with "/dev/dsk/"
- * and the like.
- */
-static int
-ctd_check_path(char *str) {
-       /*
-        * If it starts with a slash, check the last component.
-        */
-       if (str && str[0] == '/') {
-               char *tmp = strrchr(str, '/');
-
-               /*
-                * If it ends in "/old", check the second-to-last
-                * component of the string instead.
-                */
-               if (tmp != str && strcmp(tmp, "/old") == 0) {
-                       for (tmp--; *tmp != '/'; tmp--)
-                               ;
-               }
-               str = tmp + 1;
-       }
-       return (CTD_CHECK(str));
-}
-
  /*
   * Find a vdev that matches the search criteria specified. We use the
   * the nvpair name to determine how we should look for the device.
@@ -1618,26 +2038,17 @@ vdev_to_nvlist_iter(nvlist_t *nv, nvlist_t *search, boolean_t *avail_spare,
         srchkey = nvpair_name(pair);
  
         switch (nvpair_type(pair)) {
-       case DATA_TYPE_UINT64: {
-               uint64_t srchval, theguid, present;
-
-               verify(nvpair_value_uint64(pair, &srchval) == 0);
+       case DATA_TYPE_UINT64:
                 if (strcmp(srchkey, ZPOOL_CONFIG_GUID) == 0) {
-                       if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_NOT_PRESENT,
-                           &present) == 0) {
-                               /*
-                                * If the device has never been present since
-                                * import, the only reliable way to match the
-                                * vdev is by GUID.
-                                */
-                               verify(nvlist_lookup_uint64(nv,
-                                   ZPOOL_CONFIG_GUID, &theguid) == 0);
-                               if (theguid == srchval)
-                                       return (nv);
-                       }
+                       uint64_t srchval, theguid;
+
+                       verify(nvpair_value_uint64(pair, &srchval) == 0);
+                       verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_GUID,
+                           &theguid) == 0);
+                       if (theguid == srchval)
+                               return (nv);
                 }
                 break;
-       }
  
         case DATA_TYPE_STRING: {
                 char *srchval, *val;
@@ -1650,50 +2061,22 @@ vdev_to_nvlist_iter(nvlist_t *nv, nvlist_t *search, boolean_t *avail_spare,
                  * Search for the requested value. Special cases:
                  *
                  * - ZPOOL_CONFIG_PATH for whole disk entries.  These end in
-                *   "s0" or "s0/old".  The "s0" part is hidden from the user,
+                *   "-part1", or "p1".  The suffix is hidden from the user,
                  *   but included in the string, so this matches around it.
+                * - ZPOOL_CONFIG_PATH for short names zfs_strcmp_shortname()
+                *   is used to check all possible expanded paths.
                  * - looking for a top-level vdev name (i.e. ZPOOL_CONFIG_TYPE).
                  *
                  * Otherwise, all other searches are simple string compares.
                  */
-               if (strcmp(srchkey, ZPOOL_CONFIG_PATH) == 0 &&
-                   ctd_check_path(val)) {
+               if (strcmp(srchkey, ZPOOL_CONFIG_PATH) == 0) {
                         uint64_t wholedisk = 0;
  
                         (void) nvlist_lookup_uint64(nv, ZPOOL_CONFIG_WHOLE_DISK,
                             &wholedisk);
-                       if (wholedisk) {
-                               int slen = strlen(srchval);
-                               int vlen = strlen(val);
-
-                               if (slen != vlen - 2)
-                                       break;
-
-                               /*
-                                * make_leaf_vdev() should only set
-                                * wholedisk for ZPOOL_CONFIG_PATHs which
-                                * will include "/dev/dsk/", giving plenty of
-                                * room for the indices used next.
-                                */
-                               ASSERT(vlen >= 6);
-
-                               /*
-                                * strings identical except trailing "s0"
-                                */
-                               if (strcmp(&val[vlen - 2], "s0") == 0 &&
-                                   strncmp(srchval, val, slen) == 0)
-                                       return (nv);
-
-                               /*
-                                * strings identical except trailing "s0/old"
-                                */
-                               if (strcmp(&val[vlen - 6], "s0/old") == 0 &&
-                                   strcmp(&srchval[slen - 4], "/old") == 0 &&
-                                   strncmp(srchval, val, slen - 4) == 0)
-                                       return (nv);
+                       if (zfs_strcmp_pathname(srchval, val, wholedisk) == 0)
+                               return (nv);
  
-                               break;
-                       }
                 } else if (strcmp(srchkey, ZPOOL_CONFIG_TYPE) == 0 && val) {
                         char *type, *idx, *end, *p;
                         uint64_t id, vdev_id;
@@ -1819,6 +2202,9 @@ zpool_find_vdev_by_physpath(zpool_handle_t *zhp, const char *ppath,
             &nvroot) == 0);
  
         *avail_spare = B_FALSE;
+       *l2cache = B_FALSE;
+       if (log != NULL)
+               *log = B_FALSE;
         ret = vdev_to_nvlist_iter(nvroot, search, avail_spare, l2cache, log);
         nvlist_free(search);
  
@@ -1841,21 +2227,17 @@ nvlist_t *
  zpool_find_vdev(zpool_handle_t *zhp, const char *path, boolean_t *avail_spare,
      boolean_t *l2cache, boolean_t *log)
  {
-       char buf[MAXPATHLEN];
         char *end;
         nvlist_t *nvroot, *search, *ret;
         uint64_t guid;
  
         verify(nvlist_alloc(&search, NV_UNIQUE_NAME, KM_SLEEP) == 0);
  
-       guid = strtoull(path, &end, 10);
+       guid = strtoull(path, &end, 0);
         if (guid != 0 && *end == '\0') {
                 verify(nvlist_add_uint64(search, ZPOOL_CONFIG_GUID, guid) == 0);
         } else if (zpool_vdev_is_interior(path)) {
                 verify(nvlist_add_string(search, ZPOOL_CONFIG_TYPE, path) == 0);
-       } else if (path[0] != '/') {
-               (void) snprintf(buf, sizeof (buf), "%s%s", "/dev/dsk/", path);
-               verify(nvlist_add_string(search, ZPOOL_CONFIG_PATH, buf) == 0);
         } else {
                 verify(nvlist_add_string(search, ZPOOL_CONFIG_PATH, path) == 0);
         }
@@ -1874,7 +2256,7 @@ zpool_find_vdev(zpool_handle_t *zhp, const char *path, boolean_t *avail_spare,
  }
  
  static int
-vdev_online(nvlist_t *nv)
+vdev_is_online(nvlist_t *nv)
  {
         uint64_t ival;
  
@@ -1942,12 +2324,13 @@ vdev_get_physpaths(nvlist_t *nv, char *physpath, size_t phypath_size,
                                 return (EZFS_INVALCONFIG);
                 }
  
-               if (vdev_online(nv)) {
+               if (vdev_is_online(nv)) {
                         if ((ret = vdev_get_one_physpath(nv, physpath,
                             phypath_size, rsz)) != 0)
                                 return (ret);
                 }
         } else if (strcmp(type, VDEV_TYPE_MIRROR) == 0 ||
+           strcmp(type, VDEV_TYPE_RAIDZ) == 0 ||
             strcmp(type, VDEV_TYPE_REPLACING) == 0 ||
             (is_spare = (strcmp(type, VDEV_TYPE_SPARE) == 0))) {
                 nvlist_t **child;
@@ -1994,11 +2377,9 @@ zpool_get_config_physpath(nvlist_t *config, char *physpath, size_t phypath_size)
                 return (EZFS_INVALCONFIG);
  
         /*
-        * root pool can not have EFI labeled disks and can only have
-        * a single top-level vdev.
+        * root pool can only have a single top-level vdev.
          */
-       if (strcmp(type, VDEV_TYPE_ROOT) != 0 || count != 1 ||
-           pool_uses_efi(vdev_root))
+       if (strcmp(type, VDEV_TYPE_ROOT) != 0 || count != 1)
                 return (EZFS_POOL_INVALARG);
  
         (void) vdev_get_physpaths(child[0], physpath, phypath_size, &rsz,
@@ -2027,40 +2408,77 @@ zpool_get_physpath(zpool_handle_t *zhp, char *physpath, size_t phypath_size)
   * the disk to use the new unallocated space.
   */
  static int
-zpool_relabel_disk(libzfs_handle_t *hdl, const char *name)
+zpool_relabel_disk(libzfs_handle_t *hdl, const char *path, const char *msg)
  {
-       char path[MAXPATHLEN];
-       char errbuf[1024];
+       /*
+        * 'path' is handed to open() unchanged and 'msg' is the message
+        * given to zfs_error() on failure.  Returns 0 on success, otherwise
+        * the result of zfs_error().
+        */
         int fd, error;
-       int (*_efi_use_whole_disk)(int);
-
-       if ((_efi_use_whole_disk = (int (*)(int))dlsym(RTLD_DEFAULT,
-           "efi_use_whole_disk")) == NULL)
-               return (-1);
-
-       (void) snprintf(path, sizeof (path), "%s/%s", RDISK_ROOT, name);
  
-       if ((fd = open(path, O_RDWR | O_NDELAY)) < 0) {
+       if ((fd = open(path, O_RDWR|O_DIRECT)) < 0) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "cannot "
-                   "relabel '%s': unable to open device"), name);
-               return (zfs_error(hdl, EZFS_OPENFAILED, errbuf));
+                   "relabel '%s': unable to open device: %d"), path, errno);
+               return (zfs_error(hdl, EZFS_OPENFAILED, msg));
         }
  
         /*
          * It's possible that we might encounter an error if the device
          * does not have any unallocated space left. If so, we simply
          * ignore that error and continue on.
+        *
+        * Also, we don't call efi_rescan() - that would just return EBUSY.
+        * The module will do it for us in vdev_disk_open().
          */
-       error = _efi_use_whole_disk(fd);
+       error = efi_use_whole_disk(fd);
+
+       /* Flush the buffers to disk and invalidate the page cache. */
+       (void) fsync(fd);
+       (void) ioctl(fd, BLKFLSBUF);
+
         (void) close(fd);
+       /*
+        * VT_ENOSPC is tolerated here -- presumably it is the "no unallocated
+        * space left" case described above; any other error is reported.
+        */
         if (error && error != VT_ENOSPC) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "cannot "
-                   "relabel '%s': unable to read disk capacity"), name);
-               return (zfs_error(hdl, EZFS_NOCAP, errbuf));
+                   "relabel '%s': unable to read disk capacity"), path);
+               return (zfs_error(hdl, EZFS_NOCAP, msg));
         }
+
         return (0);
  }
  
+/*
+ * Look up the vdev named by 'path' with zpool_find_vdev() and return its
+ * GUID, or 0 when no such vdev is found.
+ *
+ * is_spare, is_l2cache and is_log are each optional.  A non-NULL pointer
+ * receives the matching flag reported by zpool_find_vdev(); a NULL pointer
+ * means the caller is not interested in that flag.  Nothing is stored when
+ * the lookup fails.
+ */
+static uint64_t
+zpool_vdev_path_to_guid_impl(zpool_handle_t *zhp, const char *path,
+    boolean_t *is_spare, boolean_t *is_l2cache, boolean_t *is_log)
+{
+       boolean_t found_spare = B_FALSE;
+       boolean_t found_l2cache = B_FALSE;
+       boolean_t found_log = B_FALSE;
+       uint64_t vdev_guid;
+       nvlist_t *vdev;
+
+       vdev = zpool_find_vdev(zhp, path, &found_spare, &found_l2cache,
+           &found_log);
+       if (vdev == NULL)
+               return (0);
+
+       verify(nvlist_lookup_uint64(vdev, ZPOOL_CONFIG_GUID,
+           &vdev_guid) == 0);
+
+       /* Hand back only the flags the caller asked for. */
+       if (is_spare != NULL)
+               *is_spare = found_spare;
+       if (is_l2cache != NULL)
+               *is_l2cache = found_l2cache;
+       if (is_log != NULL)
+               *is_log = found_log;
+
+       return (vdev_guid);
+}
+
+/*
+ * Resolve a vdev path to its GUID without reporting whether the vdev is a
+ * spare, l2cache or log device.  Returns the GUID, or 0 on error.
+ */
+uint64_t
+zpool_vdev_path_to_guid(zpool_handle_t *zhp, const char *path)
+{
+       uint64_t guid;
+
+       guid = zpool_vdev_path_to_guid_impl(zhp, path, NULL, NULL, NULL);
+
+       return (guid);
+}
+
  /*
   * Bring the specified vdev online.   The 'flags' parameter is a set of the
   * ZFS_ONLINE_* flags.
@@ -2069,11 +2487,12 @@ int
  zpool_vdev_online(zpool_handle_t *zhp, const char *path, int flags,
      vdev_state_t *newstate)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         nvlist_t *tgt;
         boolean_t avail_spare, l2cache, islog;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
+       int error;
  
         if (flags & ZFS_ONLINE_EXPAND) {
                 (void) snprintf(msg, sizeof (msg),
@@ -2095,13 +2514,10 @@ zpool_vdev_online(zpool_handle_t *zhp, const char *path, int flags,
  
         if (flags & ZFS_ONLINE_EXPAND ||
             zpool_get_prop_int(zhp, ZPOOL_PROP_AUTOEXPAND, NULL)) {
-               char *pathname = NULL;
                 uint64_t wholedisk = 0;
  
                 (void) nvlist_lookup_uint64(tgt, ZPOOL_CONFIG_WHOLE_DISK,
                     &wholedisk);
-               verify(nvlist_lookup_string(tgt, ZPOOL_CONFIG_PATH,
-                   &pathname) == 0);
  
                 /*
                  * XXX - L2ARC 1.0 devices can't support expansion.
@@ -2113,15 +2529,29 @@ zpool_vdev_online(zpool_handle_t *zhp, const char *path, int flags,
                 }
  
                 if (wholedisk) {
-                       pathname += strlen(DISK_ROOT) + 1;
-                       (void) zpool_relabel_disk(zhp->zpool_hdl, pathname);
+                       const char *fullpath = path;
+                       char buf[MAXPATHLEN];
+
+                       if (path[0] != '/') {
+                               error = zfs_resolve_shortname(path, buf,
+                                   sizeof (buf));
+                               if (error != 0)
+                                       return (zfs_error(hdl, EZFS_NODEVICE,
+                                           msg));
+
+                               fullpath = buf;
+                       }
+
+                       error = zpool_relabel_disk(hdl, fullpath, msg);
+                       if (error != 0)
+                               return (error);
                 }
         }
  
         zc.zc_cookie = VDEV_STATE_ONLINE;
         zc.zc_obj = flags;
  
-       if (zfs_ioctl(zhp->zpool_hdl, ZFS_IOC_VDEV_SET_STATE, &zc) != 0) {
+       if (zfs_ioctl(hdl, ZFS_IOC_VDEV_SET_STATE, &zc) != 0) {
                 if (errno == EINVAL) {
                         zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "was split "
                             "from this pool into a new one.  Use '%s' "
@@ -2141,7 +2571,7 @@ zpool_vdev_online(zpool_handle_t *zhp, const char *path, int flags,
  int
  zpool_vdev_offline(zpool_handle_t *zhp, const char *path, boolean_t istmp)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         nvlist_t *tgt;
         boolean_t avail_spare, l2cache;
@@ -2163,7 +2593,7 @@ zpool_vdev_offline(zpool_handle_t *zhp, const char *path, boolean_t istmp)
         zc.zc_cookie = VDEV_STATE_OFFLINE;
         zc.zc_obj = istmp ? ZFS_OFFLINE_TEMPORARY : 0;
  
-       if (zfs_ioctl(zhp->zpool_hdl, ZFS_IOC_VDEV_SET_STATE, &zc) == 0)
+       if (zfs_ioctl(hdl, ZFS_IOC_VDEV_SET_STATE, &zc) == 0)
                 return (0);
  
         switch (errno) {
@@ -2191,19 +2621,19 @@ zpool_vdev_offline(zpool_handle_t *zhp, const char *path, boolean_t istmp)
  int
  zpool_vdev_fault(zpool_handle_t *zhp, uint64_t guid, vdev_aux_t aux)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) snprintf(msg, sizeof (msg),
-           dgettext(TEXT_DOMAIN, "cannot fault %llu"), guid);
+           dgettext(TEXT_DOMAIN, "cannot fault %llu"), (u_longlong_t)guid);
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         zc.zc_guid = guid;
         zc.zc_cookie = VDEV_STATE_FAULTED;
         zc.zc_obj = aux;
  
-       if (ioctl(zhp->zpool_hdl->libzfs_fd, ZFS_IOC_VDEV_SET_STATE, &zc) == 0)
+       if (ioctl(hdl->libzfs_fd, ZFS_IOC_VDEV_SET_STATE, &zc) == 0)
                 return (0);
  
         switch (errno) {
@@ -2226,19 +2656,19 @@ zpool_vdev_fault(zpool_handle_t *zhp, uint64_t guid, vdev_aux_t aux)
  int
  zpool_vdev_degrade(zpool_handle_t *zhp, uint64_t guid, vdev_aux_t aux)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) snprintf(msg, sizeof (msg),
-           dgettext(TEXT_DOMAIN, "cannot degrade %llu"), guid);
+           dgettext(TEXT_DOMAIN, "cannot degrade %llu"), (u_longlong_t)guid);
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         zc.zc_guid = guid;
         zc.zc_cookie = VDEV_STATE_DEGRADED;
         zc.zc_obj = aux;
  
-       if (ioctl(zhp->zpool_hdl->libzfs_fd, ZFS_IOC_VDEV_SET_STATE, &zc) == 0)
+       if (ioctl(hdl->libzfs_fd, ZFS_IOC_VDEV_SET_STATE, &zc) == 0)
                 return (0);
  
         return (zpool_standard_error(hdl, errno, msg));
@@ -2280,18 +2710,18 @@ int
  zpool_vdev_attach(zpool_handle_t *zhp,
      const char *old_disk, const char *new_disk, nvlist_t *nvroot, int replacing)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         int ret;
         nvlist_t *tgt;
         boolean_t avail_spare, l2cache, islog;
         uint64_t val;
-       char *path, *newname;
+       char *newname;
         nvlist_t **child;
         uint_t children;
         nvlist_t *config_root;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
-       boolean_t rootpool = pool_is_bootable(zhp);
+       boolean_t rootpool = zpool_is_bootable(zhp);
  
         if (replacing)
                 (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
@@ -2300,16 +2730,6 @@ zpool_vdev_attach(zpool_handle_t *zhp,
                 (void) snprintf(msg, sizeof (msg), dgettext(TEXT_DOMAIN,
                     "cannot attach %s to %s"), new_disk, old_disk);
  
-       /*
-        * If this is a root pool, make sure that we're not attaching an
-        * EFI labeled device.
-        */
-       if (rootpool && pool_uses_efi(nvroot)) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "EFI labeled devices are not supported on root pools."));
-               return (zfs_error(hdl, EZFS_POOL_NOTSUP, msg));
-       }
-
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         if ((tgt = zpool_find_vdev(zhp, old_disk, &avail_spare, &l2cache,
             &islog)) == 0)
@@ -2334,7 +2754,7 @@ zpool_vdev_attach(zpool_handle_t *zhp,
         verify(nvlist_lookup_nvlist(zpool_get_config(zhp, NULL),
             ZPOOL_CONFIG_VDEV_TREE, &config_root) == 0);
  
-       if ((newname = zpool_vdev_name(NULL, NULL, child[0], B_FALSE)) == NULL)
+       if ((newname = zpool_vdev_name(NULL, NULL, child[0], 0)) == NULL)
                 return (-1);
  
         /*
@@ -2352,41 +2772,17 @@ zpool_vdev_attach(zpool_handle_t *zhp,
                 return (zfs_error(hdl, EZFS_BADTARGET, msg));
         }
  
-       /*
-        * If we are attempting to replace a spare, it canot be applied to an
-        * already spared device.
-        */
-       if (replacing &&
-           nvlist_lookup_string(child[0], ZPOOL_CONFIG_PATH, &path) == 0 &&
-           zpool_find_vdev(zhp, newname, &avail_spare,
-           &l2cache, NULL) != NULL && avail_spare &&
-           is_replacing_spare(config_root, tgt, 0)) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "device has already been replaced with a spare"));
-               free(newname);
-               return (zfs_error(hdl, EZFS_BADTARGET, msg));
-       }
-
         free(newname);
  
         if (zcmd_write_conf_nvlist(hdl, &zc, nvroot) != 0)
                 return (-1);
  
-       ret = zfs_ioctl(zhp->zpool_hdl, ZFS_IOC_VDEV_ATTACH, &zc);
+       ret = zfs_ioctl(hdl, ZFS_IOC_VDEV_ATTACH, &zc);
  
         zcmd_free_nvlists(&zc);
  
         if (ret == 0) {
                 if (rootpool) {
-                       /*
-                        * XXX - This should be removed once we can
-                        * automatically install the bootblocks on the
-                        * newly attached disk.
-                        */
-                       (void) fprintf(stderr, dgettext(TEXT_DOMAIN, "Please "
-                           "be sure to invoke %s to make '%s' bootable.\n"),
-                           BOOTCMD, new_disk);
-
                         /*
                          * XXX need a better way to prevent user from
                          * booting up a half-baked vdev.
@@ -2404,9 +2800,16 @@ zpool_vdev_attach(zpool_handle_t *zhp,
                  * Can't attach to or replace this type of vdev.
                  */
                 if (replacing) {
+                       uint64_t version = zpool_get_prop_int(zhp,
+                           ZPOOL_PROP_VERSION, NULL);
+
                         if (islog)
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "cannot replace a log with a spare"));
+                       else if (version >= SPA_VERSION_MULTI_REPLACE)
+                               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
+                                   "already in replacing/spare config; wait "
+                                   "for completion or use 'zpool detach'"));
                         else
                                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                                     "cannot replace a replacing device"));
@@ -2444,10 +2847,11 @@ zpool_vdev_attach(zpool_handle_t *zhp,
  
         case EDOM:
                 /*
-                * The new device has a different alignment requirement.
+                * The new device has a different optimal sector size.
                  */
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "devices have different sector alignment"));
+                   "new device has a different optimal sector size; use the "
+                   "option '-o ashift=N' to override the optimal size"));
                 (void) zfs_error(hdl, EZFS_BADDEV, msg);
                 break;
  
@@ -2471,7 +2875,7 @@ zpool_vdev_attach(zpool_handle_t *zhp,
  int
  zpool_vdev_detach(zpool_handle_t *zhp, const char *path)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         nvlist_t *tgt;
         boolean_t avail_spare, l2cache;
@@ -2504,7 +2908,7 @@ zpool_vdev_detach(zpool_handle_t *zhp, const char *path)
                  */
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "only "
                     "applicable to mirror and replacing vdevs"));
-               (void) zfs_error(zhp->zpool_hdl, EZFS_BADTARGET, msg);
+               (void) zfs_error(hdl, EZFS_BADTARGET, msg);
                 break;
  
         case EBUSY:
@@ -2541,11 +2945,11 @@ find_vdev_entry(zpool_handle_t *zhp, nvlist_t **mchild, uint_t mchildren,
         for (mc = 0; mc < mchildren; mc++) {
                 uint_t sc;
                 char *mpath = zpool_vdev_name(zhp->zpool_hdl, zhp,
-                   mchild[mc], B_FALSE);
+                   mchild[mc], 0);
  
                 for (sc = 0; sc < schildren; sc++) {
                         char *spath = zpool_vdev_name(zhp->zpool_hdl, zhp,
-                           schild[sc], B_FALSE);
+                           schild[sc], 0);
                         boolean_t result = (strcmp(mpath, spath) == 0);
  
                         free(spath);
@@ -2569,7 +2973,7 @@ int
  zpool_vdev_split(zpool_handle_t *zhp, char *newname, nvlist_t **newroot,
      nvlist_t *props, splitflags_t flags)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         nvlist_t *tree, *config, **child, **newchild, *newconfig = NULL;
         nvlist_t **varray = NULL, *zc_props = NULL;
@@ -2596,8 +3000,9 @@ zpool_vdev_split(zpool_handle_t *zhp, char *newname, nvlist_t **newroot,
         verify(nvlist_lookup_uint64(config, ZPOOL_CONFIG_VERSION, &vers) == 0);
  
         if (props) {
+               prop_flags_t flags = { .create = B_FALSE, .import = B_TRUE };
                 if ((zc_props = zpool_valid_proplist(hdl, zhp->zpool_name,
-                   props, vers, B_TRUE, msg)) == NULL)
+                   props, vers, flags, msg)) == NULL)
                         return (-1);
         }
  
@@ -2605,8 +3010,7 @@ zpool_vdev_split(zpool_handle_t *zhp, char *newname, nvlist_t **newroot,
             &children) != 0) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
                     "Source pool is missing vdev tree"));
-               if (zc_props)
-                       nvlist_free(zc_props);
+               nvlist_free(zc_props);
                 return (-1);
         }
  
@@ -2754,10 +3158,8 @@ out:
                 free(varray);
         }
         zcmd_free_nvlists(&zc);
-       if (zc_props)
-               nvlist_free(zc_props);
-       if (newconfig)
-               nvlist_free(newconfig);
+       nvlist_free(zc_props);
+       nvlist_free(newconfig);
         if (freelist) {
                 nvlist_free(*newroot);
                 *newroot = NULL;
@@ -2773,13 +3175,13 @@ out:
  }
  
  /*
- * Remove the given device.  Currently, this is supported only for hot spares
- * and level 2 cache devices.
+ * Remove the given device.  Currently, this is supported only for hot spares,
+ * cache, and log devices.
   */
  int
  zpool_vdev_remove(zpool_handle_t *zhp, const char *path)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         nvlist_t *tgt;
         boolean_t avail_spare, l2cache, islog;
@@ -2798,7 +3200,7 @@ zpool_vdev_remove(zpool_handle_t *zhp, const char *path)
          */
         if (!avail_spare && !l2cache && !islog) {
                 zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "only inactive hot spares, cache, top-level, "
+                   "only inactive hot spares, cache, "
                     "or log devices can be removed"));
                 return (zfs_error(hdl, EZFS_NODEVICE, msg));
         }
@@ -2824,13 +3226,14 @@ zpool_vdev_remove(zpool_handle_t *zhp, const char *path)
  int
  zpool_clear(zpool_handle_t *zhp, const char *path, nvlist_t *rewindnvl)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         nvlist_t *tgt;
         zpool_rewind_policy_t policy;
         boolean_t avail_spare, l2cache;
         libzfs_handle_t *hdl = zhp->zpool_hdl;
         nvlist_t *nvi = NULL;
+       int error;
  
         if (path)
                 (void) snprintf(msg, sizeof (msg),
@@ -2861,14 +3264,21 @@ zpool_clear(zpool_handle_t *zhp, const char *path, nvlist_t *rewindnvl)
         zpool_get_rewind_policy(rewindnvl, &policy);
         zc.zc_cookie = policy.zrp_request;
  
-       if (zcmd_alloc_dst_nvlist(hdl, &zc, 8192) != 0)
+       if (zcmd_alloc_dst_nvlist(hdl, &zc, zhp->zpool_config_size * 2) != 0)
                 return (-1);
  
-       if (zcmd_write_src_nvlist(zhp->zpool_hdl, &zc, rewindnvl) != 0)
+       if (zcmd_write_src_nvlist(hdl, &zc, rewindnvl) != 0)
                 return (-1);
  
-       if (zfs_ioctl(hdl, ZFS_IOC_CLEAR, &zc) == 0 ||
-           ((policy.zrp_request & ZPOOL_TRY_REWIND) &&
+       while ((error = zfs_ioctl(hdl, ZFS_IOC_CLEAR, &zc)) != 0 &&
+           errno == ENOMEM) {
+               if (zcmd_expand_dst_nvlist(hdl, &zc) != 0) {
+                       zcmd_free_nvlists(&zc);
+                       return (-1);
+               }
+       }
+
+       if (!error || ((policy.zrp_request & ZPOOL_TRY_REWIND) &&
             errno != EPERM && errno != EACCES)) {
                 if (policy.zrp_request &
                     (ZPOOL_DO_REWIND | ZPOOL_TRY_REWIND)) {
@@ -2892,13 +3302,13 @@ zpool_clear(zpool_handle_t *zhp, const char *path, nvlist_t *rewindnvl)
  int
  zpool_vdev_clear(zpool_handle_t *zhp, uint64_t guid)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         char msg[1024];
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) snprintf(msg, sizeof (msg),
             dgettext(TEXT_DOMAIN, "cannot clear errors for %llx"),
-           guid);
+           (u_longlong_t)guid);
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         zc.zc_guid = guid;
@@ -2910,6 +3320,68 @@ zpool_vdev_clear(zpool_handle_t *zhp, uint64_t guid)
         return (zpool_standard_error(hdl, errno, msg));
  }
  
+/*
+ * Change the GUID of the pool behind 'zhp' via the ZFS_IOC_POOL_REGUID
+ * ioctl.
+ *
+ * Returns 0 when the ioctl succeeds; otherwise returns whatever
+ * zpool_standard_error() produces for the failing errno.
+ */
+int
+zpool_reguid(zpool_handle_t *zhp)
+{
+       libzfs_handle_t *hdl = zhp->zpool_hdl;
+       zfs_cmd_t cmd = {"\0"};
+       char errbuf[1024];
+
+       (void) strlcpy(cmd.zc_name, zhp->zpool_name, sizeof (cmd.zc_name));
+
+       /*
+        * Format the error prefix first so that nothing runs between a
+        * failed ioctl and the read of errno.
+        */
+       (void) snprintf(errbuf, sizeof (errbuf),
+           dgettext(TEXT_DOMAIN, "cannot reguid '%s'"), zhp->zpool_name);
+
+       if (zfs_ioctl(hdl, ZFS_IOC_POOL_REGUID, &cmd) != 0)
+               return (zpool_standard_error(hdl, errno, errbuf));
+
+       return (0);
+}
+
+/*
+ * Reopen the pool behind 'zhp' via the ZFS_IOC_POOL_REOPEN ioctl.
+ *
+ * Returns 0 when the ioctl succeeds; otherwise returns whatever
+ * zpool_standard_error() produces for the failing errno.
+ */
+int
+zpool_reopen(zpool_handle_t *zhp)
+{
+       libzfs_handle_t *hdl = zhp->zpool_hdl;
+       zfs_cmd_t cmd = {"\0"};
+       char errbuf[1024];
+
+       (void) strlcpy(cmd.zc_name, zhp->zpool_name, sizeof (cmd.zc_name));
+
+       /*
+        * Format the error prefix first so that nothing runs between a
+        * failed ioctl and the read of errno.
+        */
+       (void) snprintf(errbuf, sizeof (errbuf),
+           dgettext(TEXT_DOMAIN, "cannot reopen '%s'"),
+           zhp->zpool_name);
+
+       if (zfs_ioctl(hdl, ZFS_IOC_POOL_REOPEN, &cmd) != 0)
+               return (zpool_standard_error(hdl, errno, errbuf));
+
+       return (0);
+}
+
+/*
+ * Issue the sync request for one pool through libzfs_core (lzc_sync()).
+ *
+ * 'data' must point to a boolean_t; its value is sent as the "force" entry
+ * of the input nvlist.  Returns 0 on success, or the result of
+ * zpool_standard_error_fmt() when lzc_sync() reports an error.
+ */
+int
+zpool_sync_one(zpool_handle_t *zhp, void *data)
+{
+       libzfs_handle_t *hdl = zpool_get_handle(zhp);
+       const char *name = zpool_get_name(zhp);
+       boolean_t *forcep = data;
+       nvlist_t *args = fnvlist_alloc();
+       int err;
+
+       fnvlist_add_boolean_value(args, "force", *forcep);
+       err = lzc_sync(name, args, NULL);
+
+       /* The input nvlist is no longer needed, whatever the outcome. */
+       nvlist_free(args);
+
+       if (err == 0)
+               return (0);
+
+       return (zpool_standard_error_fmt(hdl, err,
+           dgettext(TEXT_DOMAIN, "sync '%s' failed"), name));
+}
+
+#if defined(__sun__) || defined(__sun)
  /*
   * Convert from a devid string to a path.
   */
@@ -2933,8 +3405,10 @@ devid_to_path(char *devid_str)
         if (ret != 0)
                 return (NULL);
  
-       if ((path = strdup(list[0].devname)) == NULL)
-               return (NULL);
+       /*
+        * If strdup() fails, we will just return NULL below.
+        */
+       path = strdup(list[0].devname);
  
         devid_free_nmlist(list);
  
@@ -2976,7 +3450,7 @@ path_to_devid(const char *path)
  static void
  set_path(zpool_handle_t *zhp, nvlist_t *nv, const char *path)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
  
         (void) strncpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
         (void) strncpy(zc.zc_value, path, sizeof (zc.zc_value));
@@ -2985,6 +3459,83 @@ set_path(zpool_handle_t *zhp, nvlist_t *nv, const char *path)
  
         (void) ioctl(zhp->zpool_hdl->libzfs_fd, ZFS_IOC_VDEV_SETPATH, &zc);
  }
+#endif /* sun */
+
+/*
+ * Remove partition suffix from a vdev path.  Partition suffixes may take three
+ * forms: "-partX", "pX", or "X", where X is a string of digits.  The second
+ * case only occurs when the suffix is preceded by a digit, i.e. "md0p0".  The
+ * third case only occurs when preceded by a string matching the regular
+ * expression "^([hsv]|xv)d[a-z]+", i.e. a scsi, ide, virtio or xen disk.
+ *
+ * 'path' itself is never modified; the result is a fresh copy.  A name that
+ * carries no recognised suffix is returned as an unmodified copy.  Returns
+ * NULL when 'path' is NULL or the copy cannot be allocated.
+ *
+ * caller must free the returned string
+ */
+char *
+zfs_strip_partition(char *path)
+{
+       char *tmp;
+       char *part = NULL, *d = NULL;
+
+       if (path == NULL)
+               return (NULL);
+
+       if ((tmp = strdup(path)) == NULL)
+               return (NULL);
+
+       /*
+        * The <ctype.h> classifiers require a value representable as an
+        * unsigned char (or EOF), so every plain char is cast before being
+        * tested; a byte >= 0x80 would otherwise be undefined behaviour on
+        * platforms where char is signed.
+        */
+       if ((part = strstr(tmp, "-part")) && part != tmp) {
+               d = part + 5;
+       } else if ((part = strrchr(tmp, 'p')) &&
+           part > tmp + 1 && isdigit((unsigned char)*(part - 1))) {
+               d = part + 1;
+       } else if ((tmp[0] == 'h' || tmp[0] == 's' || tmp[0] == 'v') &&
+           tmp[1] == 'd') {
+               for (d = &tmp[2]; isalpha((unsigned char)*d); part = ++d) { }
+       } else if (strncmp("xvd", tmp, 3) == 0) {
+               for (d = &tmp[3]; isalpha((unsigned char)*d); part = ++d) { }
+       }
+
+       /* Truncate at 'part' only if everything from 'd' onward is digits. */
+       if (part && d && *d != '\0') {
+               for (; isdigit((unsigned char)*d); d++) { }
+               if (*d == '\0')
+                       *part = '\0';
+       }
+
+       return (tmp);
+}
+
+/*
+ * Same as zfs_strip_partition, but allows "/dev/" to be in the pathname
+ *
+ * path:       /dev/sda1
+ * returns:    /dev/sda
+ *
+ * A path that contains no '/' is handled as a bare device name.  Returns
+ * NULL when 'path' is NULL or memory cannot be allocated.
+ *
+ * Returned string must be freed.
+ */
+char *
+zfs_strip_partition_path(char *path)
+{
+       char *newpath;
+       char *slash;
+       char *sd_offset;
+       char *new_sd;
+
+       if (path == NULL)
+               return (NULL);
+
+       if ((newpath = strdup(path)) == NULL)
+               return (NULL);
+
+       /*
+        * Point to "sda1" part of "/dev/sda1".  strrchr() returns NULL when
+        * there is no '/' at all; the whole string is then the device name.
+        */
+       slash = strrchr(newpath, '/');
+       sd_offset = (slash != NULL) ? slash + 1 : newpath;
+
+       /* Get our new name "sda" */
+       new_sd = zfs_strip_partition(sd_offset);
+       if (!new_sd) {
+               free(newpath);
+               return (NULL);
+       }
+
+       /*
+        * Paste the "sda" where "sda1" was.  Stripping only ever shortens
+        * the name, so it always fits in the space it was taken from.
+        */
+       (void) strlcpy(sd_offset, new_sd, strlen(sd_offset) + 1);
+
+       /* Free temporary "sda" */
+       free(new_sd);
+
+       return (newpath);
+}
+
+#define        PATH_BUF_LEN    64
  
  /*
   * Given a vdev, return the name to display in iostat.  If the vdev has a path,
@@ -3003,22 +3554,42 @@ set_path(zpool_handle_t *zhp, nvlist_t *nv, const char *path)
   */
  char *
  zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
-    boolean_t verbose)
+    int name_flags)
  {
-       char *path, *devid;
+       char *path, *type, *env;
         uint64_t value;
-       char buf[64];
-       vdev_stat_t *vs;
-       uint_t vsc;
-
-       if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_NOT_PRESENT,
-           &value) == 0) {
-               verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_GUID,
-                   &value) == 0);
-               (void) snprintf(buf, sizeof (buf), "%llu",
-                   (u_longlong_t)value);
+       char buf[PATH_BUF_LEN];
+       char tmpbuf[PATH_BUF_LEN];
+
+       env = getenv("ZPOOL_VDEV_NAME_PATH");
+       if (env && (strtoul(env, NULL, 0) > 0 ||
+           !strncasecmp(env, "YES", 3) || !strncasecmp(env, "ON", 2)))
+               name_flags |= VDEV_NAME_PATH;
+
+       env = getenv("ZPOOL_VDEV_NAME_GUID");
+       if (env && (strtoul(env, NULL, 0) > 0 ||
+           !strncasecmp(env, "YES", 3) || !strncasecmp(env, "ON", 2)))
+               name_flags |= VDEV_NAME_GUID;
+
+       env = getenv("ZPOOL_VDEV_NAME_FOLLOW_LINKS");
+       if (env && (strtoul(env, NULL, 0) > 0 ||
+           !strncasecmp(env, "YES", 3) || !strncasecmp(env, "ON", 2)))
+               name_flags |= VDEV_NAME_FOLLOW_LINKS;
+
+       if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_NOT_PRESENT, &value) == 0 ||
+           name_flags & VDEV_NAME_GUID) {
+               (void) nvlist_lookup_uint64(nv, ZPOOL_CONFIG_GUID, &value);
+               (void) snprintf(buf, sizeof (buf), "%llu", (u_longlong_t)value);
                 path = buf;
         } else if (nvlist_lookup_string(nv, ZPOOL_CONFIG_PATH, &path) == 0) {
+#if defined(__sun__) || defined(__sun)
+               /*
+                * Live VDEV path updates to a kernel VDEV during a
+                * zpool_vdev_name lookup are not supported on Linux.
+                */
+               char *devid;
+               vdev_stat_t *vs;
+               uint_t vsc;
  
                 /*
                  * If the device is dead (faulted, offline, etc) then don't
@@ -3057,30 +3628,33 @@ zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
                         if (newdevid)
                                 devid_str_free(newdevid);
                 }
+#endif /* sun */
+
+               if (name_flags & VDEV_NAME_FOLLOW_LINKS) {
+                       char *rp = realpath(path, NULL);
+                       if (rp) {
+                               strlcpy(buf, rp, sizeof (buf));
+                               path = buf;
+                               free(rp);
+                       }
+               }
  
-               if (strncmp(path, "/dev/dsk/", 9) == 0)
-                       path += 9;
-
-               if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_WHOLE_DISK,
-                   &value) == 0 && value) {
-                       int pathlen = strlen(path);
-                       char *tmp = zfs_strdup(hdl, path);
+               /*
+                * For a block device only use the name.
+                */
+               verify(nvlist_lookup_string(nv, ZPOOL_CONFIG_TYPE, &type) == 0);
+               if ((strcmp(type, VDEV_TYPE_DISK) == 0) &&
+                   !(name_flags & VDEV_NAME_PATH)) {
+                       path = strrchr(path, '/');
+                       path++;
+               }
  
-                       /*
-                        * If it starts with c#, and ends with "s0", chop
-                        * the "s0" off, or if it ends with "s0/old", remove
-                        * the "s0" from the middle.
-                        */
-                       if (CTD_CHECK(tmp)) {
-                               if (strcmp(&tmp[pathlen - 2], "s0") == 0) {
-                                       tmp[pathlen - 2] = '\0';
-                               } else if (pathlen > 6 &&
-                                   strcmp(&tmp[pathlen - 6], "s0/old") == 0) {
-                                       (void) strcpy(&tmp[pathlen - 6],
-                                           "/old");
-                               }
-                       }
-                       return (tmp);
+               /*
+                * Remove the partition from the path if this is a whole disk.
+                */
+               if (nvlist_lookup_uint64(nv, ZPOOL_CONFIG_WHOLE_DISK, &value)
+                   == 0 && value && !(name_flags & VDEV_NAME_PATH)) {
+                       return (zfs_strip_partition(path));
                 }
         } else {
                 verify(nvlist_lookup_string(nv, ZPOOL_CONFIG_TYPE, &path) == 0);
@@ -3100,14 +3674,13 @@ zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
                  * We identify each top-level vdev by using a <type-id>
                  * naming convention.
                  */
-               if (verbose) {
+               if (name_flags & VDEV_NAME_TYPE_ID) {
                         uint64_t id;
-
                         verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_ID,
                             &id) == 0);
-                       (void) snprintf(buf, sizeof (buf), "%s-%llu", path,
-                           (u_longlong_t)id);
-                       path = buf;
+                       (void) snprintf(tmpbuf, sizeof (tmpbuf), "%s-%llu",
+                           path, (u_longlong_t)id);
+                       path = tmpbuf;
                 }
         }
  
@@ -3115,9 +3688,9 @@ zpool_vdev_name(libzfs_handle_t *hdl, zpool_handle_t *zhp, nvlist_t *nv,
  }
  
  static int
-zbookmark_compare(const void *a, const void *b)
+zbookmark_mem_compare(const void *a, const void *b)
  {
-       return (memcmp(a, b, sizeof (zbookmark_t)));
+       /*
+        * qsort() comparator: orders two bookmarks by a raw byte-wise
+        * comparison of sizeof (zbookmark_phys_t) bytes.  The result has
+        * memcmp() semantics (negative, zero or positive).
+        */
+       return (memcmp(a, b, sizeof (zbookmark_phys_t)));
  }
  
  /*
@@ -3127,9 +3700,10 @@ zbookmark_compare(const void *a, const void *b)
  int
  zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
+       libzfs_handle_t *hdl = zhp->zpool_hdl;
         uint64_t count;
-       zbookmark_t *zb = NULL;
+       zbookmark_phys_t *zb = NULL;
         int i;
  
         /*
@@ -3141,9 +3715,8 @@ zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
             &count) == 0);
         if (count == 0)
                 return (0);
-       if ((zc.zc_nvlist_dst = (uintptr_t)zfs_alloc(zhp->zpool_hdl,
-           count * sizeof (zbookmark_t))) == (uintptr_t)NULL)
-               return (-1);
+       zc.zc_nvlist_dst = (uintptr_t)zfs_alloc(zhp->zpool_hdl,
+           count * sizeof (zbookmark_phys_t));
         zc.zc_nvlist_dst_size = count;
         (void) strcpy(zc.zc_name, zhp->zpool_name);
         for (;;) {
@@ -3151,13 +3724,16 @@ zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
                     &zc) != 0) {
                         free((void *)(uintptr_t)zc.zc_nvlist_dst);
                         if (errno == ENOMEM) {
+                               void *dst;
+
                                 count = zc.zc_nvlist_dst_size;
-                               if ((zc.zc_nvlist_dst = (uintptr_t)
-                                   zfs_alloc(zhp->zpool_hdl, count *
-                                   sizeof (zbookmark_t))) == (uintptr_t)NULL)
-                                       return (-1);
+                               dst = zfs_alloc(zhp->zpool_hdl, count *
+                                   sizeof (zbookmark_phys_t));
+                               zc.zc_nvlist_dst = (uintptr_t)dst;
                         } else {
-                               return (-1);
+                               return (zpool_standard_error_fmt(hdl, errno,
+                                   dgettext(TEXT_DOMAIN, "errors: List of "
+                                   "errors unavailable")));
                         }
                 } else {
                         break;
@@ -3171,11 +3747,11 @@ zpool_get_errlog(zpool_handle_t *zhp, nvlist_t **nverrlistp)
          * _not_ copied as part of the process.  So we point the start of our
          * array appropriate and decrement the total number of elements.
          */
-       zb = ((zbookmark_t *)(uintptr_t)zc.zc_nvlist_dst) +
+       zb = ((zbookmark_phys_t *)(uintptr_t)zc.zc_nvlist_dst) +
             zc.zc_nvlist_dst_size;
         count -= zc.zc_nvlist_dst_size;
  
-       qsort(zb, count, sizeof (zbookmark_t), zbookmark_compare);
+       qsort(zb, count, sizeof (zbookmark_phys_t), zbookmark_mem_compare);
  
         verify(nvlist_alloc(nverrlistp, 0, KM_SLEEP) == 0);
  
@@ -3223,7 +3799,7 @@ nomem:
  int
  zpool_upgrade(zpool_handle_t *zhp, uint64_t new_version)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) strcpy(zc.zc_name, zhp->zpool_name);
@@ -3237,40 +3813,32 @@ zpool_upgrade(zpool_handle_t *zhp, uint64_t new_version)
  }
  
  void
-zpool_set_history_str(const char *subcommand, int argc, char **argv,
-    char *history_str)
+zfs_save_arguments(int argc, char **argv, char *string, int len)
  {
         int i;
  
-       (void) strlcpy(history_str, subcommand, HIS_MAX_RECORD_LEN);
+       /*
+        * Flatten the command line into 'string' (capacity 'len' bytes):
+        * the basename of argv[0] followed by every remaining argument,
+        * each preceded by a single space.
+        */
+       (void) strlcpy(string, basename(argv[0]), len);
         for (i = 1; i < argc; i++) {
-               if (strlen(history_str) + 1 + strlen(argv[i]) >
-                   HIS_MAX_RECORD_LEN)
-                       break;
-               (void) strlcat(history_str, " ", HIS_MAX_RECORD_LEN);
-               (void) strlcat(history_str, argv[i], HIS_MAX_RECORD_LEN);
+               /*
+                * The strlcat() return values are ignored, so a command
+                * line that does not fit in 'len' bytes is silently
+                * truncated.
+                */
+               (void) strlcat(string, " ", len);
+               (void) strlcat(string, argv[i], len);
         }
  }
  
-/*
- * Stage command history for logging.
- */
  int
-zpool_stage_history(libzfs_handle_t *hdl, const char *history_str)
+zpool_log_history(libzfs_handle_t *hdl, const char *message)
  {
-       if (history_str == NULL)
-               return (EINVAL);
-
-       if (strlen(history_str) > HIS_MAX_RECORD_LEN)
-               return (EINVAL);
-
-       if (hdl->libzfs_log_str != NULL)
-               free(hdl->libzfs_log_str);
-
-       if ((hdl->libzfs_log_str = strdup(history_str)) == NULL)
-               return (no_memory(hdl));
-
-       return (0);
+       zfs_cmd_t zc = {"\0"};
+       nvlist_t *args;
+       int err;
+
+       args = fnvlist_alloc();
+       fnvlist_add_string(args, "message", message);
+       err = zcmd_write_src_nvlist(hdl, &zc, args);
+       if (err == 0)
+               err = ioctl(hdl->libzfs_fd, ZFS_IOC_LOG_HISTORY, &zc);
+       nvlist_free(args);
+       zcmd_free_nvlists(&zc);
+       return (err);
  }
  
  /*
@@ -3285,7 +3853,7 @@ zpool_stage_history(libzfs_handle_t *hdl, const char *history_str)
  static int
  get_history(zpool_handle_t *zhp, char *buf, uint64_t *off, uint64_t *len)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         libzfs_handle_t *hdl = zhp->zpool_hdl;
  
         (void) strlcpy(zc.zc_name, zhp->zpool_name, sizeof (zc.zc_name));
@@ -3334,6 +3902,7 @@ zpool_history_unpack(char *buf, uint64_t bytes_read, uint64_t *leftover,
         uint64_t reclen;
         nvlist_t *nv;
         int i;
+       void *tmp;
  
         while (bytes_read > sizeof (reclen)) {
  
@@ -3353,8 +3922,14 @@ zpool_history_unpack(char *buf, uint64_t bytes_read, uint64_t *leftover,
                 /* add record to nvlist array */
                 (*numrecords)++;
                 if (ISP2(*numrecords + 1)) {
-                       *records = realloc(*records,
+                       tmp = realloc(*records,
                             *numrecords * 2 * sizeof (nvlist_t *));
+                       if (tmp == NULL) {
+                               nvlist_free(nv);
+                               (*numrecords)--;
+                               return (ENOMEM);
+                       }
+                       *records = tmp;
                 }
                 (*records)[*numrecords - 1] = nv;
         }
@@ -3363,22 +3938,24 @@ zpool_history_unpack(char *buf, uint64_t bytes_read, uint64_t *leftover,
         return (0);
  }
  
-#define        HIS_BUF_LEN     (128*1024)
-
  /*
   * Retrieve the command history of a pool.
   */
  int
  zpool_get_history(zpool_handle_t *zhp, nvlist_t **nvhisp)
  {
-       char buf[HIS_BUF_LEN];
+       char *buf;
+       int buflen = 128 * 1024;
         uint64_t off = 0;
         nvlist_t **records = NULL;
         uint_t numrecords = 0;
         int err, i;
  
+       buf = malloc(buflen);
+       if (buf == NULL)
+               return (ENOMEM);
         do {
-               uint64_t bytes_read = sizeof (buf);
+               uint64_t bytes_read = buflen;
                 uint64_t leftover;
  
                 if ((err = get_history(zhp, buf, &off, &bytes_read)) != 0)
@@ -3392,10 +3969,23 @@ zpool_get_history(zpool_handle_t *zhp, nvlist_t **nvhisp)
                     &leftover, &records, &numrecords)) != 0)
                         break;
                 off -= leftover;
+               if (leftover == bytes_read) {
+                       /*
+                        * no progress made, because buffer is not big enough
+                        * to hold this record; resize and retry.
+                        */
+                       buflen *= 2;
+                       free(buf);
+                       buf = malloc(buflen);
+                       if (buf == NULL)
+                               return (ENOMEM);
+               }
  
                 /* CONSTCOND */
         } while (1);
  
+       free(buf);
+
         if (!err) {
                 verify(nvlist_alloc(nvhisp, NV_UNIQUE_NAME, 0) == 0);
                 verify(nvlist_add_nvlist_array(*nvhisp, ZPOOL_HIST_RECORD,
@@ -3408,18 +3998,144 @@ zpool_get_history(zpool_handle_t *zhp, nvlist_t **nvhisp)
         return (err);
  }
  
+/*
+ * Retrieve the next event given the passed 'zevent_fd' file descriptor.
+ * If there is a new event available 'nvp' will contain a newly allocated
+ * nvlist and 'dropped' will be set to the number of missed events since
+ * the last call to this function.  When 'nvp' is set to NULL it indicates
+ * no new events are available.  In either case the function returns 0 and
+ * it is up to the caller to free 'nvp'.  In the case of a fatal error the
+ * function will return a non-zero value.  When the function is called in
+ * blocking mode (the default, unless the ZEVENT_NONBLOCK flag is passed),
+ * it will not return until a new event is available.
+ */
+int
+zpool_events_next(libzfs_handle_t *hdl, nvlist_t **nvp,
+    int *dropped, unsigned flags, int zevent_fd)
+{
+       zfs_cmd_t zc = {"\0"};
+       int nonblock = (flags & ZEVENT_NONBLOCK) != 0;
+       int rc = 0;
+
+       /* Defaults reported when no event is handed back. */
+       *nvp = NULL;
+       *dropped = 0;
+
+       zc.zc_cleanup_fd = zevent_fd;
+       if (nonblock)
+               zc.zc_guid = ZEVENT_NONBLOCK;
+
+       if (zcmd_alloc_dst_nvlist(hdl, &zc, ZEVENT_SIZE) != 0)
+               return (-1);
+
+       /*
+        * Keep reissuing the ioctl while it fails with ENOMEM and the
+        * destination buffer can still be expanded; any other failure
+        * (or a failed expansion) ends the loop through 'out'.
+        */
+       while (zfs_ioctl(hdl, ZFS_IOC_EVENTS_NEXT, &zc) != 0) {
+               if (errno == ENOMEM) {
+                       if (zcmd_expand_dst_nvlist(hdl, &zc) == 0)
+                               continue;
+                       rc = zfs_error_fmt(hdl, EZFS_NOMEM,
+                           dgettext(TEXT_DOMAIN, "cannot get event"));
+               } else if (errno == ESHUTDOWN) {
+                       rc = zfs_error_fmt(hdl, EZFS_POOLUNAVAIL,
+                           dgettext(TEXT_DOMAIN, "zfs shutdown"));
+               } else if (errno != ENOENT || !nonblock) {
+                       /*
+                        * ENOENT is only tolerated (rc stays 0, *nvp stays
+                        * NULL) when the caller asked for non-blocking mode.
+                        */
+                       rc = zpool_standard_error_fmt(hdl, errno,
+                           dgettext(TEXT_DOMAIN, "cannot get event"));
+               }
+               goto out;
+       }
+
+       /* Unpack the event; the dropped count is only set on success. */
+       rc = zcmd_read_dst_nvlist(hdl, &zc, nvp);
+       if (rc == 0)
+               *dropped = (int)zc.zc_cookie;
+
+out:
+       zcmd_free_nvlists(&zc);
+
+       return (rc);
+}
+
+/*
+ * Clear all events.
+ */
+int
+zpool_events_clear(libzfs_handle_t *hdl, int *count)
+{
+       zfs_cmd_t zc = {"\0"};
+       char errmsg[1024];
+
+       /* Prepare the (translated) failure text before issuing the ioctl. */
+       (void) snprintf(errmsg, sizeof (errmsg), dgettext(TEXT_DOMAIN,
+           "cannot clear events"));
+
+       if (zfs_ioctl(hdl, ZFS_IOC_EVENTS_CLEAR, &zc) == 0) {
+               /* 'count' is optional; zc_cookie is the # of events cleared */
+               if (count != NULL)
+                       *count = (int)zc.zc_cookie;
+
+               return (0);
+       }
+
+       return (zpool_standard_error_fmt(hdl, errno, errmsg));
+}
+
+/*
+ * Seek to a specific EID, ZEVENT_SEEK_START, or ZEVENT_SEEK_END for
+ * the passed zevent_fd file handle.  On success zero is returned,
+ * otherwise -1 is returned and hdl->libzfs_error is set to the errno.
+ */
+int
+zpool_events_seek(libzfs_handle_t *hdl, uint64_t eid, int zevent_fd)
+{
+       zfs_cmd_t zc = {"\0"};
+
+       /* The target EID travels in zc_guid, the event fd in zc_cleanup_fd. */
+       zc.zc_cleanup_fd = zevent_fd;
+       zc.zc_guid = eid;
+
+       if (zfs_ioctl(hdl, ZFS_IOC_EVENTS_SEEK, &zc) == 0)
+               return (0);
+
+       /* Map the two specially handled errnos; defer the rest. */
+       if (errno == ENOENT) {
+               return (zfs_error_fmt(hdl, EZFS_NOENT,
+                   dgettext(TEXT_DOMAIN, "cannot get event")));
+       }
+
+       if (errno == ENOMEM) {
+               return (zfs_error_fmt(hdl, EZFS_NOMEM,
+                   dgettext(TEXT_DOMAIN, "cannot get event")));
+       }
+
+       return (zpool_standard_error_fmt(hdl, errno,
+           dgettext(TEXT_DOMAIN, "cannot get event")));
+}
+
  void
  zpool_obj_to_path(zpool_handle_t *zhp, uint64_t dsobj, uint64_t obj,
      char *pathname, size_t len)
  {
-       zfs_cmd_t zc = { 0 };
+       zfs_cmd_t zc = {"\0"};
         boolean_t mounted = B_FALSE;
         char *mntpnt = NULL;
-       char dsname[MAXNAMELEN];
+       char dsname[ZFS_MAX_DATASET_NAME_LEN];
  
         if (dsobj == 0) {
                 /* special case for the MOS */
-               (void) snprintf(pathname, len, "<metadata>:<0x%llx>", obj);
+               (void) snprintf(pathname, len, "<metadata>:<0x%llx>",
+                   (longlong_t)obj);
                 return;
         }
  
@@ -3430,7 +4146,7 @@ zpool_obj_to_path(zpool_handle_t *zhp, uint64_t dsobj, uint64_t obj,
             ZFS_IOC_DSOBJ_TO_DSNAME, &zc) != 0) {
                 /* just write out a path of two object numbers */
                 (void) snprintf(pathname, len, "<0x%llx>:<0x%llx>",
-                   dsobj, obj);
+                   (longlong_t)dsobj, (longlong_t)obj);
                 return;
         }
         (void) strlcpy(dsname, zc.zc_value, sizeof (dsname));
@@ -3451,7 +4167,8 @@ zpool_obj_to_path(zpool_handle_t *zhp, uint64_t dsobj, uint64_t obj,
                             dsname, zc.zc_value);
                 }
         } else {
-               (void) snprintf(pathname, len, "%s:<0x%llx>", dsname, obj);
+               (void) snprintf(pathname, len, "%s:<0x%llx>", dsname,
+                   (longlong_t)obj);
         }
         free(mntpnt);
  }
@@ -3473,9 +4190,9 @@ read_efi_label(nvlist_t *config, diskaddr_t *sb)
         if (nvlist_lookup_string(config, ZPOOL_CONFIG_PATH, &path) != 0)
                 return (err);
  
-       (void) snprintf(diskname, sizeof (diskname), "%s%s", RDISK_ROOT,
+       (void) snprintf(diskname, sizeof (diskname), "%s%s", DISK_ROOT,
             strrchr(path, '/'));
-       if ((fd = open(diskname, O_RDONLY|O_NDELAY)) >= 0) {
+       if ((fd = open(diskname, O_RDONLY|O_DIRECT)) >= 0) {
                 struct dk_gpt *vtoc;
  
                 if ((err = efi_alloc_and_read(fd, &vtoc)) >= 0) {
@@ -3521,6 +4238,57 @@ find_start_block(nvlist_t *config)
         return (MAXOFFSET_T);
  }
  
+static int
+zpool_label_disk_check(char *path)
+{
+       struct dk_gpt *gpt;
+       int dev_fd, rc;
+
+       dev_fd = open(path, O_RDONLY|O_DIRECT);
+       if (dev_fd < 0)
+               return (errno);
+
+       /*
+        * Read the EFI label back.  A read failure is returned as-is; a
+        * label that reads fine but is flagged EFI_GPT_PRIMARY_CORRUPT is
+        * reported as EIDRM.  The label is only freed when it was read.
+        */
+       rc = efi_alloc_and_read(dev_fd, &gpt);
+       if (rc == 0) {
+               if (gpt->efi_flags & EFI_GPT_PRIMARY_CORRUPT)
+                       rc = EIDRM;
+
+               efi_free(gpt);
+       }
+
+       (void) close(dev_fd);
+       return (rc);
+}
+
+/*
+ * Generate a unique partition name for the ZFS member.  Partitions must
+ * have unique names to ensure udev will be able to create symlinks under
+ * /dev/disk/by-partlabel/ for all pool members.  The partition names are
+ * of the form zfs-<unique-id>, where <unique-id> is 16 hexadecimal digits.
+ */
+static void
+zpool_label_name(char *label_name, int label_size)
+{
+       uint64_t unique = 0;
+       int urandom_fd = open("/dev/urandom", O_RDONLY);
+
+       /* Preferred source: 8 bytes from /dev/urandom. */
+       if (urandom_fd >= 0) {
+               ssize_t got = read(urandom_fd, &unique, sizeof (unique));
+
+               /* A short or failed read leaves nothing usable. */
+               if (got != sizeof (unique))
+                       unique = 0;
+
+               close(urandom_fd);
+       }
+
+       /* Fallback when urandom was unavailable or yielded zero. */
+       if (unique == 0)
+               unique = (((uint64_t)rand()) << 32) | (uint64_t)rand();
+
+       /* Result: "zfs-" followed by 16 zero-padded hex digits. */
+       snprintf(label_name, label_size, "zfs-%016llx", (u_longlong_t)unique);
+}
+
  /*
   * Label an individual disk.  The name provided is the short name,
   * stripped of any leading /dev path.
@@ -3530,7 +4298,7 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
  {
         char path[MAXPATHLEN];
         struct dk_gpt *vtoc;
-       int fd;
+       int rval, fd;
         size_t resv = EFI_MIN_RESV_SIZE;
         uint64_t slice_size;
         diskaddr_t start_block;
@@ -3543,13 +4311,6 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
         if (zhp) {
                 nvlist_t *nvroot;
  
-               if (pool_is_bootable(zhp)) {
-                       zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                           "EFI labeled devices are not supported on root "
-                           "pools."));
-                       return (zfs_error(hdl, EZFS_POOL_NOTSUP, errbuf));
-               }
-
                 verify(nvlist_lookup_nvlist(zhp->zpool_config,
                     ZPOOL_CONFIG_VDEV_TREE, &nvroot) == 0);
  
@@ -3563,16 +4324,15 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
                 start_block = NEW_START_BLOCK;
         }
  
-       (void) snprintf(path, sizeof (path), "%s/%s%s", RDISK_ROOT, name,
-           BACKUP_SLICE);
+       (void) snprintf(path, sizeof (path), "%s/%s", DISK_ROOT, name);
  
-       if ((fd = open(path, O_RDWR | O_NDELAY)) < 0) {
+       if ((fd = open(path, O_RDWR|O_DIRECT|O_EXCL)) < 0) {
                 /*
                  * This shouldn't happen.  We've long since verified that this
                  * is a valid device.
                  */
-               zfs_error_aux(hdl,
-                   dgettext(TEXT_DOMAIN, "unable to open device"));
+               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "cannot "
+                   "label '%s': unable to open device: %d"), path, errno);
                 return (zfs_error(hdl, EZFS_OPENFAILED, errbuf));
         }
  
@@ -3585,8 +4345,8 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
                         (void) no_memory(hdl);
  
                 (void) close(fd);
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "unable to read disk capacity"), name);
+               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "cannot "
+                   "label '%s': unable to read disk capacity"), path);
  
                 return (zfs_error(hdl, EZFS_NOCAP, errbuf));
         }
@@ -3596,6 +4356,7 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
         if (start_block == MAXOFFSET_T)
                 start_block = NEW_START_BLOCK;
         slice_size -= start_block;
+       slice_size = P2ALIGN(slice_size, PARTITION_END_ALIGNMENT);
  
         vtoc->efi_parts[0].p_start = start_block;
         vtoc->efi_parts[0].p_size = slice_size;
@@ -3609,139 +4370,337 @@ zpool_label_disk(libzfs_handle_t *hdl, zpool_handle_t *zhp, char *name)
          * can get, in the absence of V_OTHER.
          */
         vtoc->efi_parts[0].p_tag = V_USR;
-       (void) strcpy(vtoc->efi_parts[0].p_name, "zfs");
+       zpool_label_name(vtoc->efi_parts[0].p_name, EFI_PART_NAME_LEN);
  
         vtoc->efi_parts[8].p_start = slice_size + start_block;
         vtoc->efi_parts[8].p_size = resv;
         vtoc->efi_parts[8].p_tag = V_RESERVED;
  
-       if (efi_write(fd, vtoc) != 0) {
-               /*
-                * Some block drivers (like pcata) may not support EFI
-                * GPT labels.  Print out a helpful error message dir-
-                * ecting the user to manually label the disk and give
-                * a specific slice.
-                */
+       rval = efi_write(fd, vtoc);
+
+       /* Flush the buffers to disk and invalidate the page cache. */
+       (void) fsync(fd);
+       (void) ioctl(fd, BLKFLSBUF);
+
+       if (rval == 0)
+               rval = efi_rescan(fd);
+
+       /*
+        * Some block drivers (like pcata) may not support EFI GPT labels.
+        * Print out a helpful error message directing the user to manually
+        * label the disk and give a specific slice.
+        */
+       if (rval != 0) {
                 (void) close(fd);
                 efi_free(vtoc);
  
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "try using fdisk(1M) and then provide a specific slice"));
+               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "try using "
+                   "parted(8) and then provide a specific slice: %d"), rval);
                 return (zfs_error(hdl, EZFS_LABELFAILED, errbuf));
         }
  
         (void) close(fd);
         efi_free(vtoc);
+
+       (void) snprintf(path, sizeof (path), "%s/%s", DISK_ROOT, name);
+       (void) zfs_append_partition(path, MAXPATHLEN);
+
+       /* Wait for udev to signal us that the device has settled. */
+       rval = zpool_label_disk_wait(path, DISK_LABEL_WAIT);
+       if (rval) {
+               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "failed to "
+                   "detect device partitions on '%s': %d"), path, rval);
+               return (zfs_error(hdl, EZFS_LABELFAILED, errbuf));
+       }
+
+       /* We can't be too paranoid.  Read the label back and verify it. */
+       (void) snprintf(path, sizeof (path), "%s/%s", DISK_ROOT, name);
+       rval = zpool_label_disk_check(path);
+       if (rval) {
+               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "freshly written "
+                   "EFI label on '%s' is damaged.  Ensure\nthis device "
+                   "is not in in use, and is functioning properly: %d"),
+                   path, rval);
+               return (zfs_error(hdl, EZFS_LABELFAILED, errbuf));
+       }
+
         return (0);
  }
  
-static boolean_t
-supported_dump_vdev_type(libzfs_handle_t *hdl, nvlist_t *config, char *errbuf)
+/*
+ * Allocate and return the underlying device name for a device mapper device.
+ * If a device mapper device maps to multiple devices, return the first device.
+ *
+ * For example, dm_name = "/dev/dm-0" could return "/dev/sda". Symlinks to a
+ * DM device (like /dev/disk/by-vdev/A0) are also allowed.
+ *
+ * Returns device name, or NULL on error or no match.  If dm_name is not a DM
+ * device then return NULL.
+ *
+ * NOTE: The returned name string must be *freed*.
+ */
+char *
+dm_get_underlying_path(char *dm_name)
  {
-       char *type;
-       nvlist_t **child;
-       uint_t children, c;
-
-       verify(nvlist_lookup_string(config, ZPOOL_CONFIG_TYPE, &type) == 0);
-       if (strcmp(type, VDEV_TYPE_RAIDZ) == 0 ||
-           strcmp(type, VDEV_TYPE_FILE) == 0 ||
-           strcmp(type, VDEV_TYPE_LOG) == 0 ||
-           strcmp(type, VDEV_TYPE_HOLE) == 0 ||
-           strcmp(type, VDEV_TYPE_MISSING) == 0) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "vdev type '%s' is not supported"), type);
-               (void) zfs_error(hdl, EZFS_VDEVNOTSUP, errbuf);
-               return (B_FALSE);
-       }
-       if (nvlist_lookup_nvlist_array(config, ZPOOL_CONFIG_CHILDREN,
-           &child, &children) == 0) {
-               for (c = 0; c < children; c++) {
-                       if (!supported_dump_vdev_type(hdl, child[c], errbuf))
-                               return (B_FALSE);
+       DIR *dp = NULL;
+       struct dirent *ep;
+       char *realp;
+       char *slaves_dir = NULL;
+       char *path = NULL;
+       char *dev_str;
+
+       if (dm_name == NULL)
+               return (NULL);
+
+       /* dm name may be a symlink (like /dev/disk/by-vdev/A0) */
+       realp = realpath(dm_name, NULL);
+       if (realp == NULL)
+               return (NULL);
+
+       /*
+        * If they preface 'dev' with a path (like "/dev") then strip it off.
+        * We just want the 'dm-N' part.  Should there be no '/' at all, use
+        * the resolved name as-is rather than handing NULL to asprintf().
+        */
+       dev_str = strrchr(realp, '/');
+       dev_str = (dev_str != NULL) ? dev_str + 1 : realp;
+
+       /*
+        * The sysfs directory name gets its own pointer: on failure
+        * asprintf() leaves its output undefined, so it must never share a
+        * variable that points into 'realp' and is later passed to free().
+        */
+       if (asprintf(&slaves_dir, "/sys/block/%s/slaves/", dev_str) == -1) {
+               slaves_dir = NULL;
+               goto end;
+       }
+
+       /* Not a DM device (or no sysfs entry): nothing to report. */
+       dp = opendir(slaves_dir);
+       if (dp == NULL)
+               goto end;
+
+       /* Return the first non-directory entry in /sys/block/dm-N/slaves/ */
+       while ((ep = readdir(dp))) {
+               if (ep->d_type != DT_DIR) {     /* skip "." and ".." dirs */
+                       /* Never return an undefined pointer on failure. */
+                       if (asprintf(&path, "/dev/%s", ep->d_name) == -1)
+                               path = NULL;
+                       break;
                 }
         }
-       return (B_TRUE);
+
+end:
+       if (dp != NULL)
+               closedir(dp);
+       free(slaves_dir);
+       free(realp);
+       return (path);
  }
  
  /*
- * check if this zvol is allowable for use as a dump device; zero if
- * it is, > 0 if it isn't, < 0 if it isn't a zvol
+ * Return 1 if device is a device mapper or multipath device.
+ * Return 0 if not.
   */
  int
-zvol_check_dump_config(char *arg)
-{
-       zpool_handle_t *zhp = NULL;
-       nvlist_t *config, *nvroot;
-       char *p, *volname;
-       nvlist_t **top;
-       uint_t toplevels;
-       libzfs_handle_t *hdl;
-       char errbuf[1024];
-       char poolname[ZPOOL_MAXNAMELEN];
-       int pathlen = strlen(ZVOL_FULL_DEV_DIR);
-       int ret = 1;
+zfs_dev_is_dm(char *dev_name)
+{
  
-       if (strncmp(arg, ZVOL_FULL_DEV_DIR, pathlen)) {
-               return (-1);
-       }
+       char *tmp;
+       tmp = dm_get_underlying_path(dev_name);
+       if (tmp == NULL)
+               return (0);
  
-       (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN,
-           "dump is not supported on device '%s'"), arg);
+       free(tmp);
+       return (1);
+}
  
-       if ((hdl = libzfs_init()) == NULL)
-               return (1);
-       libzfs_print_on_error(hdl, B_TRUE);
+/*
+ * By "whole disk" we mean an entire physical disk (something we can
+ * label, toggle the write cache on, etc.) as opposed to the full
+ * capacity of a pseudo-device such as lofi or did.  We act as if we
+ * are labeling the disk, which should be a pretty good test of whether
+ * it's a viable device or not.  Returns B_TRUE if it is and B_FALSE if
+ * it isn't.
+ */
+int
+zfs_dev_is_whole_disk(char *dev_name)
+{
+       struct dk_gpt *gpt;
+       int whole = 0;
+       int dev_fd = open(dev_name, O_RDONLY | O_DIRECT);
  
-       volname = arg + pathlen;
+       /* A device that cannot be opened is not treated as a whole disk. */
+       if (dev_fd < 0)
+               return (0);
  
-       /* check the configuration of the pool */
-       if ((p = strchr(volname, '/')) == NULL) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "malformed dataset name"));
-               (void) zfs_error(hdl, EZFS_INVALIDNAME, errbuf);
-               return (1);
-       } else if (p - volname >= ZFS_MAXNAMELEN) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "dataset name is too long"));
-               (void) zfs_error(hdl, EZFS_NAMETOOLONG, errbuf);
-               return (1);
-       } else {
-               (void) strncpy(poolname, volname, p - volname);
-               poolname[p - volname] = '\0';
+       /*
+        * Being able to initialize an in-memory EFI label for the device
+        * is the test; the label itself is discarded immediately.
+        */
+       if (efi_alloc_and_init(dev_fd, EFI_NUMPAR, &gpt) == 0) {
+               efi_free(gpt);
+               whole = 1;
         }
  
-       if ((zhp = zpool_open(hdl, poolname)) == NULL) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "could not open pool '%s'"), poolname);
-               (void) zfs_error(hdl, EZFS_OPENFAILED, errbuf);
-               goto out;
+       (void) close(dev_fd);
+
+       return (whole);
+}
+
+/*
+ * Lookup the underlying device for a device name
+ *
+ * Often you'll have a symlink to a device, a partition device,
+ * or a multipath device, and want to look up the underlying device.
+ * This function returns the underlying device name.  If the device
+ * name is already the underlying device, then just return the same
+ * name.  If the device is a DM device with multiple underlying devices
+ * then return the first one.
+ *
+ * For example:
+ *
+ * 1. /dev/disk/by-id/ata-QEMU_HARDDISK_QM00001 -> ../../sda
+ * dev_name:   /dev/disk/by-id/ata-QEMU_HARDDISK_QM00001
+ * returns:    /dev/sda
+ *
+ * 2. /dev/mapper/mpatha (made up of /dev/sda and /dev/sdb)
+ * dev_name:   /dev/mapper/mpatha
+ * returns:    /dev/sda (first device)
+ *
+ * 3. /dev/sda (already the underlying device)
+ * dev_name:   /dev/sda
+ * returns:    /dev/sda
+ *
+ * 4. /dev/dm-3 (mapped to /dev/sda)
+ * dev_name:   /dev/dm-3
+ * returns:    /dev/sda
+ *
+ * 5. /dev/disk/by-id/scsi-0QEMU_drive-scsi0-0-0-0-part9 -> ../../sdb9
+ * dev_name:   /dev/disk/by-id/scsi-0QEMU_drive-scsi0-0-0-0-part9
+ * returns:    /dev/sdb
+ *
+ * 6. /dev/disk/by-uuid/5df030cf-3cd9-46e4-8e99-3ccb462a4e9a -> ../../sda2
+ * dev_name:   /dev/disk/by-uuid/5df030cf-3cd9-46e4-8e99-3ccb462a4e9a
+ * returns:    /dev/sda
+ *
+ * Returns underlying device name, or NULL on error or no match.
+ *
+ * NOTE: The returned name string must be *freed*.
+ */
+char *
+zfs_get_underlying_path(char *dev_name)
+{
+       char *name = NULL;      /* result; stays NULL if nothing resolves */
+       char *tmp;      /* intermediate path, released before returning */
+
+       if (dev_name == NULL)
+               return (NULL);
+
+       tmp = dm_get_underlying_path(dev_name);
+
+       /*
+        * A NULL result is treated as "dev_name is not a DM device", so
+        * fall back to resolving symlinks; realpath() with a NULL buffer
+        * returns a newly allocated string.
+        */
+       if (tmp == NULL)
+               tmp = realpath(dev_name, NULL);
+
+       if (tmp != NULL) {
+               name = zfs_strip_partition_path(tmp);
+               free(tmp);      /* 'tmp' is not referenced past this point */
         }
-       config = zpool_get_config(zhp, NULL);
-       if (nvlist_lookup_nvlist(config, ZPOOL_CONFIG_VDEV_TREE,
-           &nvroot) != 0) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "could not obtain vdev configuration for  '%s'"), poolname);
-               (void) zfs_error(hdl, EZFS_INVALCONFIG, errbuf);
-               goto out;
+
+       return (name);
+}
+
+/*
+ * Given a dev name like "sda", return the full enclosure sysfs path to
+ * the disk.  You can also pass in the name with "/dev" prepended
+ * to it (like /dev/sda).
+ *
+ * For example, disk "sda" in enclosure slot 1:
+ *     dev:            "sda"
+ *     returns:        "/sys/class/enclosure/1:0:3:0/Slot 1"
+ *
+ * 'dev' must be a non-devicemapper device.
+ *
+ * Returns NULL if dev_name is NULL, if /sys/block/<dev>/device cannot be
+ * opened, if no usable enclosure_device link is found in it, or if a
+ * string allocation fails.
+ *
+ * Returned string must be freed.
+ */
+char *
+zfs_get_enclosure_sysfs_path(char *dev_name)
+{
+       DIR *dp = NULL;
+       struct dirent *ep;
+       char buf[MAXPATHLEN];
+       char *tmp1 = NULL;      /* "/sys/block/<dev>/device" */
+       char *tmp2 = NULL;      /* full path of the enclosure_device link */
+       char *tmp3 = NULL;      /* points into 'buf'; never freed */
+       char *path = NULL;
+       ssize_t size;
+
+       if (dev_name == NULL)
+               return (NULL);
+
+       /* If they preface 'dev' with a path (like "/dev") then strip it off */
+       tmp1 = strrchr(dev_name, '/');
+       if (tmp1 != NULL)
+               dev_name = tmp1 + 1;    /* +1 since we want the chr after '/' */
+
+       if (asprintf(&tmp1, "/sys/block/%s/device", dev_name) == -1) {
+               /* If asprintf() fails, 'tmp1' is undefined */
+               tmp1 = NULL;
+               goto end;
         }
  
-       verify(nvlist_lookup_nvlist_array(nvroot, ZPOOL_CONFIG_CHILDREN,
-           &top, &toplevels) == 0);
-       if (toplevels != 1) {
-               zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
-                   "'%s' has multiple top level vdevs"), poolname);
-               (void) zfs_error(hdl, EZFS_DEVOVERFLOW, errbuf);
-               goto out;
+       dp = opendir(tmp1);
+       if (dp == NULL) {
+               /* 'tmp1' is still a live allocation; it is freed at 'end' */
+               goto end;
         }
  
-       if (!supported_dump_vdev_type(hdl, top[0], errbuf)) {
-               goto out;
+       /*
+        * Look through all sysfs entries in /sys/block/<dev>/device for
+        * the enclosure symlink.
+        */
+       while ((ep = readdir(dp))) {
+               /* Ignore everything that's not our enclosure_device link */
+               if (strstr(ep->d_name, "enclosure_device") == NULL)
+                       continue;
+
+               if (asprintf(&tmp2, "%s/%s", tmp1, ep->d_name) == -1) {
+                       /* If asprintf() fails, 'tmp2' is undefined */
+                       tmp2 = NULL;
+                       break;
+               }
+
+               /* readlink() returns ssize_t: -1 on error, else byte count */
+               size = readlink(tmp2, buf, sizeof (buf));
+
+               /* Did readlink fail or crop the link name? */
+               if (size < 0 || (size_t)size >= sizeof (buf))
+                       break;
+
+               /*
+                * We got a valid link.  readlink() doesn't terminate strings
+                * so we have to do it.
+                */
+               buf[size] = '\0';
+
+               /*
+                * Our link will look like:
+                *
+                * "../../../../port-11:1:2/..STUFF../enclosure/1:0:3:0/SLOT 1"
+                *
+                * We want to grab the "enclosure/1:0:3:0/SLOT 1" part
+                */
+               tmp3 = strstr(buf, "enclosure");
+               if (tmp3 == NULL)
+                       break;
+
+               if (asprintf(&path, "/sys/class/%s", tmp3) == -1) {
+                       /* If asprintf() fails, 'path' is undefined */
+                       path = NULL;
+               }
+
+               /*
+                * The first enclosure_device link decides the result.
+                * Looping again would overwrite (and leak) 'tmp2' and 'path'.
+                */
+               break;
         }
-       ret = 0;
  
-out:
-       if (zhp)
-               zpool_close(zhp);
-       libzfs_fini(hdl);
-       return (ret);
+end:
+       free(tmp2);
+       free(tmp1);
+
+       if (dp != NULL)
+               closedir(dp);
+
+       return (path);
  }