Index: stable/11/cddl/contrib/opensolaris/lib/libzfs/common/libzfs.h
===================================================================
--- stable/11/cddl/contrib/opensolaris/lib/libzfs/common/libzfs.h	(revision 326297)
+++ stable/11/cddl/contrib/opensolaris/lib/libzfs/common/libzfs.h	(revision 326298)
@@ -1,818 +1,819 @@
 /*
  * CDDL HEADER START
  *
  * The contents of this file are subject to the terms of the
  * Common Development and Distribution License (the "License").
  * You may not use this file except in compliance with the License.
  *
  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
  * or http://www.opensolaris.org/os/licensing.
  * See the License for the specific language governing permissions
  * and limitations under the License.
  *
  * When distributing Covered Code, include this CDDL HEADER in each
  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  * If applicable, add the following below this CDDL HEADER, with the
  * fields enclosed by brackets "[]" replaced with your own identifying
  * information: Portions Copyright [yyyy] [name of copyright owner]
  *
  * CDDL HEADER END
  */
 
 /*
  * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
  * Copyright (c) 2011 Pawel Jakub Dawidek. All rights reserved.
  * Copyright (c) 2011, 2015 by Delphix. All rights reserved.
  * Copyright (c) 2012, Joyent, Inc. All rights reserved.
  * Copyright (c) 2012 Martin Matuska <mm@FreeBSD.org>. All rights reserved.
  * Copyright (c) 2013 Steven Hartland. All rights reserved.
  * Copyright (c) 2014 Integros [integros.com]
  * Copyright 2016 Nexenta Systems, Inc.
  * Copyright (c) 2017 Datto Inc.
  */
 
 #ifndef	_LIBZFS_H
 #define	_LIBZFS_H
 
 #include <assert.h>
 #include <libnvpair.h>
 #include <sys/mnttab.h>
 #include <sys/param.h>
 #include <sys/types.h>
 #include <sys/varargs.h>
 #include <sys/fs/zfs.h>
 #include <sys/avl.h>
 #include <sys/zfs_ioctl.h>
 #include <libzfs_core.h>
 
 #ifdef	__cplusplus
 extern "C" {
 #endif
 
 /*
  * Miscellaneous ZFS constants
  */
 #define	ZFS_MAXPROPLEN		MAXPATHLEN
 #define	ZPOOL_MAXPROPLEN	MAXPATHLEN
 
 /*
  * libzfs errors
  */
 typedef enum zfs_error {	/* error codes count up from 2000 */
 	EZFS_SUCCESS = 0,	/* no error -- success */
 	EZFS_NOMEM = 2000,	/* out of memory */
 	EZFS_BADPROP,		/* invalid property value */
 	EZFS_PROPREADONLY,	/* cannot set readonly property */
 	EZFS_PROPTYPE,		/* property does not apply to dataset type */
 	EZFS_PROPNONINHERIT,	/* property is not inheritable */
 	EZFS_PROPSPACE,		/* bad quota or reservation */
 	EZFS_BADTYPE,		/* dataset is not of appropriate type */
 	EZFS_BUSY,		/* pool or dataset is busy */
 	EZFS_EXISTS,		/* pool or dataset already exists */
 	EZFS_NOENT,		/* no such pool or dataset */
 	EZFS_BADSTREAM,		/* bad backup stream */
 	EZFS_DSREADONLY,	/* dataset is readonly */
 	EZFS_VOLTOOBIG,		/* volume is too large for 32-bit system */
 	EZFS_INVALIDNAME,	/* invalid dataset name */
 	EZFS_BADRESTORE,	/* unable to restore to destination */
 	EZFS_BADBACKUP,		/* backup failed */
 	EZFS_BADTARGET,		/* bad attach/detach/replace target */
 	EZFS_NODEVICE,		/* no such device in pool */
 	EZFS_BADDEV,		/* invalid device to add */
 	EZFS_NOREPLICAS,	/* no valid replicas */
 	EZFS_RESILVERING,	/* currently resilvering */
 	EZFS_BADVERSION,	/* unsupported version */
 	EZFS_POOLUNAVAIL,	/* pool is currently unavailable */
 	EZFS_DEVOVERFLOW,	/* too many devices in one vdev */
 	EZFS_BADPATH,		/* must be an absolute path */
 	EZFS_CROSSTARGET,	/* rename or clone across pool or dataset */
 	EZFS_ZONED,		/* used improperly in local zone */
 	EZFS_MOUNTFAILED,	/* failed to mount dataset */
 	EZFS_UMOUNTFAILED,	/* failed to unmount dataset */
 	EZFS_UNSHARENFSFAILED,	/* unshare(1M) failed */
 	EZFS_SHARENFSFAILED,	/* share(1M) failed */
 	EZFS_PERM,		/* permission denied */
 	EZFS_NOSPC,		/* out of space */
 	EZFS_FAULT,		/* bad address */
 	EZFS_IO,		/* I/O error */
 	EZFS_INTR,		/* signal received */
 	EZFS_ISSPARE,		/* device is a hot spare */
 	EZFS_INVALCONFIG,	/* invalid vdev configuration */
 	EZFS_RECURSIVE,		/* recursive dependency */
 	EZFS_NOHISTORY,		/* no history object */
 	EZFS_POOLPROPS,		/* couldn't retrieve pool props */
 	EZFS_POOL_NOTSUP,	/* ops not supported for this type of pool */
 	EZFS_POOL_INVALARG,	/* invalid argument for this pool operation */
 	EZFS_NAMETOOLONG,	/* dataset name is too long */
 	EZFS_OPENFAILED,	/* open of device failed */
 	EZFS_NOCAP,		/* couldn't get capacity */
 	EZFS_LABELFAILED,	/* write of label failed */
 	EZFS_BADWHO,		/* invalid permission who */
 	EZFS_BADPERM,		/* invalid permission */
 	EZFS_BADPERMSET,	/* invalid permission set name */
 	EZFS_NODELEGATION,	/* delegated administration is disabled */
 	EZFS_UNSHARESMBFAILED,	/* failed to unshare over smb */
 	EZFS_SHARESMBFAILED,	/* failed to share over smb */
 	EZFS_BADCACHE,		/* bad cache file */
 	EZFS_ISL2CACHE,		/* device is for the level 2 ARC */
 	EZFS_VDEVNOTSUP,	/* unsupported vdev type */
 	EZFS_NOTSUP,		/* ops not supported on this dataset */
 	EZFS_ACTIVE_SPARE,	/* pool has active shared spare devices */
 	EZFS_UNPLAYED_LOGS,	/* log device has unplayed logs */
 	EZFS_REFTAG_RELE,	/* snapshot release: tag not found */
 	EZFS_REFTAG_HOLD,	/* snapshot hold: tag already exists */
 	EZFS_TAGTOOLONG,	/* snapshot hold/rele: tag too long */
 	EZFS_PIPEFAILED,	/* pipe create failed */
 	EZFS_THREADCREATEFAILED, /* thread create failed */
 	EZFS_POSTSPLIT_ONLINE,	/* onlining a disk after splitting it */
 	EZFS_SCRUBBING,		/* currently scrubbing */
 	EZFS_NO_SCRUB,		/* no active scrub */
 	EZFS_DIFF,		/* general failure of zfs diff */
 	EZFS_DIFFDATA,		/* bad zfs diff data */
 	EZFS_POOLREADONLY,	/* pool is in read-only mode */
 	EZFS_SCRUB_PAUSED,	/* scrub currently paused */
 	EZFS_UNKNOWN		/* NOTE(review): presumably the catch-all -- confirm */
 } zfs_error_t;
 
 /*
  * The following data structures are all part
  * of the zfs_allow_t data structure, which is
  * used for printing 'allow' permissions.
  * It is a linked list of zfs_allow_t's, which
  * then contain AVL trees for user/group/sets/...
  * and each one of the entries in those trees has
  * AVL trees for the permissions it belongs to and
  * whether they are local, descendent or local+descendent
  * permissions.  The AVL trees are used primarily for
  * sorting purposes, but also so that we can quickly find
  * a given user and/or permission.
  */
 typedef struct zfs_perm_node {	/* one entry of a permission AVL tree */
 	avl_node_t z_node;		/* AVL tree linkage */
 	char z_pname[MAXPATHLEN];	/* presumably the permission name -- confirm */
 } zfs_perm_node_t;
 
 typedef struct zfs_allow_node {	/* one keyed entry plus its three perm trees */
 	avl_node_t z_node;		/* AVL tree linkage */
 	char z_key[MAXPATHLEN];		/* name, such as joe */
 	avl_tree_t z_localdescend;	/* local+descendent perms */
 	avl_tree_t z_local;		/* local permissions */
 	avl_tree_t z_descend;		/* descendent permissions */
 } zfs_allow_node_t;
 
 typedef struct zfs_allow {	/* one element of the 'allow' printing list */
 	struct zfs_allow *z_next;	/* next element of the linked list */
 	char z_setpoint[MAXPATHLEN];	/* NOTE(review): presumably where perms are set */
 	avl_tree_t z_sets;		/* tree of permission sets */
 	avl_tree_t z_crperms;		/* NOTE(review): presumably create-time perms */
 	avl_tree_t z_user;		/* tree of user entries */
 	avl_tree_t z_group;		/* tree of group entries */
 	avl_tree_t z_everyone;		/* NOTE(review): presumably "everyone" entries */
 } zfs_allow_t;
 
 /*
  * Basic handle types
  */
 typedef struct zfs_handle zfs_handle_t;		/* dataset handle; see zfs_open() */
 typedef struct zpool_handle zpool_handle_t;	/* pool handle; see zpool_open() */
 typedef struct libzfs_handle libzfs_handle_t;	/* library handle; see libzfs_init() */
 
 /*
  * Library initialization
  */
 extern libzfs_handle_t *libzfs_init(void);
 extern void libzfs_fini(libzfs_handle_t *);
 
 extern libzfs_handle_t *zpool_get_handle(zpool_handle_t *);
 extern libzfs_handle_t *zfs_get_handle(zfs_handle_t *);
 
 extern void libzfs_print_on_error(libzfs_handle_t *, boolean_t);
 
 extern void zfs_save_arguments(int argc, char **, char *, int);
 extern int zpool_log_history(libzfs_handle_t *, const char *);
 
 extern int libzfs_errno(libzfs_handle_t *);
 extern const char *libzfs_error_action(libzfs_handle_t *);
 extern const char *libzfs_error_description(libzfs_handle_t *);
 extern int zfs_standard_error(libzfs_handle_t *, int, const char *);
 extern void libzfs_mnttab_init(libzfs_handle_t *);
 extern void libzfs_mnttab_fini(libzfs_handle_t *);
 extern void libzfs_mnttab_cache(libzfs_handle_t *, boolean_t);
 extern int libzfs_mnttab_find(libzfs_handle_t *, const char *,
     struct mnttab *);
 extern void libzfs_mnttab_add(libzfs_handle_t *, const char *,
     const char *, const char *);
 extern void libzfs_mnttab_remove(libzfs_handle_t *, const char *);
 
 /*
  * Basic handle functions
  */
 extern zpool_handle_t *zpool_open(libzfs_handle_t *, const char *);
 extern zpool_handle_t *zpool_open_canfail(libzfs_handle_t *, const char *);
 extern void zpool_close(zpool_handle_t *);
 extern const char *zpool_get_name(zpool_handle_t *);
 extern int zpool_get_state(zpool_handle_t *);
 extern const char *zpool_state_to_name(vdev_state_t, vdev_aux_t);
 extern const char *zpool_pool_state_to_name(pool_state_t);
 extern void zpool_free_handles(libzfs_handle_t *);
 extern int zpool_nextboot(libzfs_handle_t *, uint64_t, uint64_t, const char *);
 
 /*
  * Iterate over all active pools in the system.
  */
 typedef int (*zpool_iter_f)(zpool_handle_t *, void *);
 extern int zpool_iter(libzfs_handle_t *, zpool_iter_f, void *);
 extern boolean_t zpool_skip_pool(const char *);
 
 /*
  * Functions to create and destroy pools
  */
 extern int zpool_create(libzfs_handle_t *, const char *, nvlist_t *,
     nvlist_t *, nvlist_t *);
 extern int zpool_destroy(zpool_handle_t *, const char *);
 extern int zpool_add(zpool_handle_t *, nvlist_t *);
 
 typedef struct splitflags {	/* options passed by value to zpool_vdev_split() */
 	/* do not split, but return the config that would be split off */
 	unsigned int dryrun : 1;	/* unsigned: a set flag reads as 1, not -1 */
 
 	/* after splitting, import the pool */
 	unsigned int import : 1;
 } splitflags_t;
 
 /*
  * Functions to manipulate pool and vdev state
  */
 extern int zpool_scan(zpool_handle_t *, pool_scan_func_t, pool_scrub_cmd_t);
 extern int zpool_clear(zpool_handle_t *, const char *, nvlist_t *);
 extern int zpool_reguid(zpool_handle_t *);
 extern int zpool_reopen(zpool_handle_t *);
 
 extern int zpool_vdev_online(zpool_handle_t *, const char *, int,
     vdev_state_t *);
 extern int zpool_vdev_offline(zpool_handle_t *, const char *, boolean_t);
 extern int zpool_vdev_attach(zpool_handle_t *, const char *,
     const char *, nvlist_t *, int);
 extern int zpool_vdev_detach(zpool_handle_t *, const char *);
 extern int zpool_vdev_remove(zpool_handle_t *, const char *);
 extern int zpool_vdev_split(zpool_handle_t *, char *, nvlist_t **, nvlist_t *,
     splitflags_t);
 
 extern int zpool_vdev_fault(zpool_handle_t *, uint64_t, vdev_aux_t);
 extern int zpool_vdev_degrade(zpool_handle_t *, uint64_t, vdev_aux_t);
 extern int zpool_vdev_clear(zpool_handle_t *, uint64_t);
 
 extern nvlist_t *zpool_find_vdev(zpool_handle_t *, const char *, boolean_t *,
     boolean_t *, boolean_t *);
 extern nvlist_t *zpool_find_vdev_by_physpath(zpool_handle_t *, const char *,
     boolean_t *, boolean_t *, boolean_t *);
 extern int zpool_label_disk(libzfs_handle_t *, zpool_handle_t *, const char *);
 
 /*
  * Functions to manage pool properties
  */
 extern int zpool_set_prop(zpool_handle_t *, const char *, const char *);
 extern int zpool_get_prop(zpool_handle_t *, zpool_prop_t, char *,
     size_t proplen, zprop_source_t *, boolean_t);
 extern uint64_t zpool_get_prop_int(zpool_handle_t *, zpool_prop_t,
     zprop_source_t *);
 
 extern const char *zpool_prop_to_name(zpool_prop_t);
 extern const char *zpool_prop_values(zpool_prop_t);
 
 /*
  * Pool health statistics.
  */
 typedef enum {	/* returned by zpool_get_status() and zpool_import_status() */
 	/*
 	 * The following correspond to faults as defined in the (fault.fs.zfs.*)
 	 * event namespace.  Each is associated with a corresponding message ID.
 	 */
 	ZPOOL_STATUS_CORRUPT_CACHE,	/* corrupt /kernel/drv/zpool.cache */
 	ZPOOL_STATUS_MISSING_DEV_R,	/* missing device with replicas */
 	ZPOOL_STATUS_MISSING_DEV_NR,	/* missing device with no replicas */
 	ZPOOL_STATUS_CORRUPT_LABEL_R,	/* bad device label with replicas */
 	ZPOOL_STATUS_CORRUPT_LABEL_NR,	/* bad device label with no replicas */
 	ZPOOL_STATUS_BAD_GUID_SUM,	/* sum of device guids didn't match */
 	ZPOOL_STATUS_CORRUPT_POOL,	/* pool metadata is corrupted */
 	ZPOOL_STATUS_CORRUPT_DATA,	/* data errors in user (meta)data */
 	ZPOOL_STATUS_FAILING_DEV,	/* device experiencing errors */
 	ZPOOL_STATUS_VERSION_NEWER,	/* newer on-disk version */
 	ZPOOL_STATUS_HOSTID_MISMATCH,	/* last accessed by another system */
 	ZPOOL_STATUS_IO_FAILURE_WAIT,	/* failed I/O, failmode 'wait' */
 	ZPOOL_STATUS_IO_FAILURE_CONTINUE, /* failed I/O, failmode 'continue' */
 	ZPOOL_STATUS_BAD_LOG,		/* cannot read log chain(s) */
 
 	/*
 	 * If the pool has unsupported features but can still be opened in
 	 * read-only mode, its status is ZPOOL_STATUS_UNSUP_FEAT_WRITE. If the
 	 * pool has unsupported features but cannot be opened at all, its
 	 * status is ZPOOL_STATUS_UNSUP_FEAT_READ.
 	 */
 	ZPOOL_STATUS_UNSUP_FEAT_READ,	/* unsupported features for read */
 	ZPOOL_STATUS_UNSUP_FEAT_WRITE,	/* unsupported features for write */
 
 	/*
 	 * These faults have no corresponding message ID.  At the time we are
 	 * checking the status, the original reason for the FMA fault (I/O or
 	 * checksum errors) has been lost.
 	 */
 	ZPOOL_STATUS_FAULTED_DEV_R,	/* faulted device with replicas */
 	ZPOOL_STATUS_FAULTED_DEV_NR,	/* faulted device with no replicas */
 
 	/*
 	 * The following are not faults per se, but still an error possibly
 	 * requiring administrative attention.  There is no corresponding
 	 * message ID.
 	 */
 	ZPOOL_STATUS_VERSION_OLDER,	/* older legacy on-disk version */
 	ZPOOL_STATUS_FEAT_DISABLED,	/* supported features are disabled */
 	ZPOOL_STATUS_RESILVERING,	/* device being resilvered */
 	ZPOOL_STATUS_OFFLINE_DEV,	/* device offline */
 	ZPOOL_STATUS_REMOVED_DEV,	/* removed device */
 	ZPOOL_STATUS_NON_NATIVE_ASHIFT,	/* (e.g. 512e dev with ashift of 9) */
 
 	/*
 	 * Finally, the following indicates a healthy pool.
 	 */
 	ZPOOL_STATUS_OK
 } zpool_status_t;
 
 extern zpool_status_t zpool_get_status(zpool_handle_t *, char **);
 extern zpool_status_t zpool_import_status(nvlist_t *, char **);
 extern void zpool_dump_ddt(const ddt_stat_t *dds, const ddt_histogram_t *ddh);
 
 /*
  * Statistics and configuration functions.
  */
 extern nvlist_t *zpool_get_config(zpool_handle_t *, nvlist_t **);
 extern nvlist_t *zpool_get_features(zpool_handle_t *);
 extern int zpool_refresh_stats(zpool_handle_t *, boolean_t *);
 extern int zpool_get_errlog(zpool_handle_t *, nvlist_t **);
 
 /*
  * Import and export functions
  */
 extern int zpool_export(zpool_handle_t *, boolean_t, const char *);
 extern int zpool_export_force(zpool_handle_t *, const char *);
 extern int zpool_import(libzfs_handle_t *, nvlist_t *, const char *,
     char *altroot);
 extern int zpool_import_props(libzfs_handle_t *, nvlist_t *, const char *,
     nvlist_t *, int);
 extern void zpool_print_unsup_feat(nvlist_t *config);
 
 /*
  * Search for pools to import
  */
 
 typedef struct importargs {
 	char **path;		/* a list of paths to search		*/
 	int paths;		/* number of paths to search		*/
 	char *poolname;		/* name of a pool to find		*/
 	uint64_t guid;		/* guid of a pool to find		*/
 	char *cachefile;	/* cachefile to use for import		*/
 	int can_be_active : 1;	/* can the pool be active?		*/
 	int unique : 1;		/* does 'poolname' already exist?	*/
 	int exists : 1;		/* set on return if pool already exists	*/
 } importargs_t;
 
 extern nvlist_t *zpool_search_import(libzfs_handle_t *, importargs_t *);
 
 /* legacy pool search routines */
 extern nvlist_t *zpool_find_import(libzfs_handle_t *, int, char **);
 extern nvlist_t *zpool_find_import_cached(libzfs_handle_t *, const char *,
     char *, uint64_t);
 
 /*
  * Miscellaneous pool functions
  */
 struct zfs_cmd;
 
 extern const char *zfs_history_event_names[];
 
 extern char *zpool_vdev_name(libzfs_handle_t *, zpool_handle_t *, nvlist_t *,
     boolean_t verbose);
 extern int zpool_upgrade(zpool_handle_t *, uint64_t);
 extern int zpool_get_history(zpool_handle_t *, nvlist_t **);
 extern int zpool_history_unpack(char *, uint64_t, uint64_t *,
     nvlist_t ***, uint_t *);
 extern void zpool_obj_to_path(zpool_handle_t *, uint64_t, uint64_t, char *,
     size_t len);
 extern int zfs_ioctl(libzfs_handle_t *, int request, struct zfs_cmd *);
 extern int zpool_get_physpath(zpool_handle_t *, char *, size_t);
 extern void zpool_explain_recover(libzfs_handle_t *, const char *, int,
     nvlist_t *);
 
 /*
  * Basic handle manipulations.  These functions do not create or destroy the
  * underlying datasets, only the references to them.
  */
 extern zfs_handle_t *zfs_open(libzfs_handle_t *, const char *, int);
 extern zfs_handle_t *zfs_handle_dup(zfs_handle_t *);
 extern void zfs_close(zfs_handle_t *);
 extern zfs_type_t zfs_get_type(const zfs_handle_t *);
 extern const char *zfs_get_name(const zfs_handle_t *);
 extern zpool_handle_t *zfs_get_pool_handle(const zfs_handle_t *);
 extern const char *zfs_get_pool_name(const zfs_handle_t *);
 
 /*
  * Property management functions.  Some functions are shared with the kernel,
  * and are found in sys/fs/zfs.h.
  */
 
 /*
  * zfs dataset property management
  */
 extern const char *zfs_prop_default_string(zfs_prop_t);
 extern uint64_t zfs_prop_default_numeric(zfs_prop_t);
 extern const char *zfs_prop_column_name(zfs_prop_t);
 extern boolean_t zfs_prop_align_right(zfs_prop_t);
 
 extern nvlist_t *zfs_valid_proplist(libzfs_handle_t *, zfs_type_t,
     nvlist_t *, uint64_t, zfs_handle_t *, zpool_handle_t *, const char *);
 
 extern const char *zfs_prop_to_name(zfs_prop_t);
 extern int zfs_prop_set(zfs_handle_t *, const char *, const char *);
 extern int zfs_prop_set_list(zfs_handle_t *, nvlist_t *);
 extern int zfs_prop_get(zfs_handle_t *, zfs_prop_t, char *, size_t,
     zprop_source_t *, char *, size_t, boolean_t);
 extern int zfs_prop_get_recvd(zfs_handle_t *, const char *, char *, size_t,
     boolean_t);
 extern int zfs_prop_get_numeric(zfs_handle_t *, zfs_prop_t, uint64_t *,
     zprop_source_t *, char *, size_t);
 extern int zfs_prop_get_userquota_int(zfs_handle_t *zhp, const char *propname,
     uint64_t *propvalue);
 extern int zfs_prop_get_userquota(zfs_handle_t *zhp, const char *propname,
     char *propbuf, int proplen, boolean_t literal);
 extern int zfs_prop_get_written_int(zfs_handle_t *zhp, const char *propname,
     uint64_t *propvalue);
 extern int zfs_prop_get_written(zfs_handle_t *zhp, const char *propname,
     char *propbuf, int proplen, boolean_t literal);
 extern int zfs_prop_get_feature(zfs_handle_t *zhp, const char *propname,
     char *buf, size_t len);
 extern uint64_t zfs_prop_get_int(zfs_handle_t *, zfs_prop_t);
 extern int zfs_prop_inherit(zfs_handle_t *, const char *, boolean_t);
 extern const char *zfs_prop_values(zfs_prop_t);
 extern int zfs_prop_is_string(zfs_prop_t prop);
 extern nvlist_t *zfs_get_user_props(zfs_handle_t *);
 extern nvlist_t *zfs_get_recvd_props(zfs_handle_t *);
 extern nvlist_t *zfs_get_clones_nvl(zfs_handle_t *);
 
 
 typedef struct zprop_list {	/* node of a singly linked property list */
 	int		pl_prop;	/* NOTE(review): presumably a property id */
 	char		*pl_user_prop;	/* NOTE(review): presumably a user prop name */
 	struct zprop_list *pl_next;	/* next node in the list */
 	boolean_t	pl_all;
 	size_t		pl_width;	/* NOTE(review): presumably a column width */
 	size_t		pl_recvd_width;
 	boolean_t	pl_fixed;
 } zprop_list_t;
 
 extern int zfs_expand_proplist(zfs_handle_t *, zprop_list_t **, boolean_t,
     boolean_t);
 extern void zfs_prune_proplist(zfs_handle_t *, uint8_t *);
 
 #define	ZFS_MOUNTPOINT_NONE	"none"
 #define	ZFS_MOUNTPOINT_LEGACY	"legacy"
 
 #define	ZFS_FEATURE_DISABLED	"disabled"
 #define	ZFS_FEATURE_ENABLED	"enabled"
 #define	ZFS_FEATURE_ACTIVE	"active"
 
 #define	ZFS_UNSUPPORTED_INACTIVE	"inactive"
 #define	ZFS_UNSUPPORTED_READONLY	"readonly"
 
 /*
  * zpool property management
  */
 extern int zpool_expand_proplist(zpool_handle_t *, zprop_list_t **);
 extern int zpool_prop_get_feature(zpool_handle_t *, const char *, char *,
     size_t);
 extern const char *zpool_prop_default_string(zpool_prop_t);
 extern uint64_t zpool_prop_default_numeric(zpool_prop_t);
 extern const char *zpool_prop_column_name(zpool_prop_t);
 extern boolean_t zpool_prop_align_right(zpool_prop_t);
 
 /*
  * Functions shared by zfs and zpool property management.
  */
 extern int zprop_iter(zprop_func func, void *cb, boolean_t show_all,
     boolean_t ordered, zfs_type_t type);
 extern int zprop_get_list(libzfs_handle_t *, char *, zprop_list_t **,
     zfs_type_t);
 extern void zprop_free_list(zprop_list_t *);
 
 #define	ZFS_GET_NCOLS	5
 
 typedef enum {		/* element type of zprop_get_cbdata.cb_columns[] */
 	GET_COL_NONE,	/* value 0; six enumerators, i.e. ZFS_GET_NCOLS + 1 */
 	GET_COL_NAME,
 	GET_COL_PROPERTY,
 	GET_COL_VALUE,
 	GET_COL_RECVD,
 	GET_COL_SOURCE
 } zfs_get_column_t;
 
 /*
  * Functions for printing zfs or zpool properties
  */
 typedef struct zprop_get_cbdata {	/* passed to zprop_print_one_property() */
 	int cb_sources;
 	zfs_get_column_t cb_columns[ZFS_GET_NCOLS];	/* presumably print order */
 	int cb_colwidths[ZFS_GET_NCOLS + 1];	/* sized to the column enum count */
 	boolean_t cb_scripted;
 	boolean_t cb_literal;
 	boolean_t cb_first;
 	zprop_list_t *cb_proplist;
 	zfs_type_t cb_type;
 } zprop_get_cbdata_t;
 
 void zprop_print_one_property(const char *, zprop_get_cbdata_t *,
     const char *, const char *, zprop_source_t, const char *,
     const char *);
 
 /*
  * Iterator functions.
  */
 typedef int (*zfs_iter_f)(zfs_handle_t *, void *);
 extern int zfs_iter_root(libzfs_handle_t *, zfs_iter_f, void *);
 extern int zfs_iter_children(zfs_handle_t *, zfs_iter_f, void *);
 extern int zfs_iter_dependents(zfs_handle_t *, boolean_t, zfs_iter_f, void *);
 extern int zfs_iter_filesystems(zfs_handle_t *, zfs_iter_f, void *);
 extern int zfs_iter_snapshots(zfs_handle_t *, boolean_t, zfs_iter_f, void *);
 extern int zfs_iter_snapshots_sorted(zfs_handle_t *, zfs_iter_f, void *);
 extern int zfs_iter_snapspec(zfs_handle_t *, const char *, zfs_iter_f, void *);
 extern int zfs_iter_bookmarks(zfs_handle_t *, zfs_iter_f, void *);
 
 typedef struct get_all_cb {	/* argument type of libzfs_add_handle() */
 	zfs_handle_t	**cb_handles;	/* array of handle pointers */
 	size_t		cb_alloc;	/* NOTE(review): presumably slots allocated */
 	size_t		cb_used;	/* NOTE(review): presumably slots in use */
 	boolean_t	cb_verbose;
 	int		(*cb_getone)(zfs_handle_t *, void *); /* same shape as zfs_iter_f */
 } get_all_cb_t;
 
 void libzfs_add_handle(get_all_cb_t *, zfs_handle_t *);
 int libzfs_dataset_cmp(const void *, const void *);
 
 /*
  * Functions to create and destroy datasets.
  */
 extern int zfs_create(libzfs_handle_t *, const char *, zfs_type_t,
     nvlist_t *);
 extern int zfs_create_ancestors(libzfs_handle_t *, const char *);
 extern int zfs_destroy(zfs_handle_t *, boolean_t);
 extern int zfs_destroy_snaps(zfs_handle_t *, char *, boolean_t);
 extern int zfs_destroy_snaps_nvl(libzfs_handle_t *, nvlist_t *, boolean_t);
 extern int zfs_clone(zfs_handle_t *, const char *, nvlist_t *);
 extern int zfs_snapshot(libzfs_handle_t *, const char *, boolean_t, nvlist_t *);
 extern int zfs_snapshot_nvl(libzfs_handle_t *hdl, nvlist_t *snaps,
     nvlist_t *props);
 extern int zfs_rollback(zfs_handle_t *, zfs_handle_t *, boolean_t);
 
 typedef struct renameflags {	/* options passed by value to zfs_rename() */
 	/* recursive rename */
 	unsigned int recurse : 1;	/* unsigned: a set flag reads as 1, not -1 */
 
 	/* don't unmount file systems */
 	unsigned int nounmount : 1;
 
 	/* force unmount file systems */
 	unsigned int forceunmount : 1;
 } renameflags_t;
 
 extern int zfs_rename(zfs_handle_t *, const char *, const char *,
     renameflags_t flags);
 
 typedef struct sendflags {	/* options for zfs_send() and zfs_send_resume() */
 	/* print informational messages (ie, -v was specified) */
 	boolean_t verbose;
 
 	/* recursive send  (ie, -R) */
 	boolean_t replicate;
 
 	/* for incrementals, do all intermediate snapshots */
 	boolean_t doall;
 
 	/* if dataset is a clone, do incremental from its origin */
 	boolean_t fromorigin;
 
 	/* do deduplication */
 	boolean_t dedup;
 
 	/* send properties (ie, -p) */
 	boolean_t props;
 
 	/* do not send (no-op, ie. -n) */
 	boolean_t dryrun;
 
 	/* parsable verbose output (ie. -P) */
 	boolean_t parsable;
 
 	/* show progress (ie. -v) */
 	boolean_t progress;
 
 	/* large blocks (>128K) are permitted */
 	boolean_t largeblock;
 
 	/* WRITE_EMBEDDED records of type DATA are permitted */
 	boolean_t embed_data;
 
 	/* compressed WRITE records are permitted */
 	boolean_t compress;
 } sendflags_t;
 
 typedef boolean_t (snapfilter_cb_t)(zfs_handle_t *, void *);
 
 extern int zfs_send(zfs_handle_t *, const char *, const char *,
     sendflags_t *, int, snapfilter_cb_t, void *, nvlist_t **);
 extern int zfs_send_one(zfs_handle_t *, const char *, int, enum lzc_send_flags);
 extern int zfs_send_resume(libzfs_handle_t *, sendflags_t *, int outfd,
     const char *);
 extern nvlist_t *zfs_send_resume_token_to_nvlist(libzfs_handle_t *hdl,
     const char *token);
 
 extern int zfs_promote(zfs_handle_t *);
 extern int zfs_hold(zfs_handle_t *, const char *, const char *,
     boolean_t, int);
 extern int zfs_hold_nvl(zfs_handle_t *, int, nvlist_t *);
 extern int zfs_release(zfs_handle_t *, const char *, const char *, boolean_t);
 extern int zfs_get_holds(zfs_handle_t *, nvlist_t **);
 extern uint64_t zvol_volsize_to_reservation(uint64_t, nvlist_t *);
 
 typedef int (*zfs_userspace_cb_t)(void *arg, const char *domain,
     uid_t rid, uint64_t space);
 
 extern int zfs_userspace(zfs_handle_t *, zfs_userquota_prop_t,
     zfs_userspace_cb_t, void *);
 
 extern int zfs_get_fsacl(zfs_handle_t *, nvlist_t **);
 extern int zfs_set_fsacl(zfs_handle_t *, boolean_t, nvlist_t *);
 
 typedef struct recvflags {	/* options passed by pointer to zfs_receive() */
 	/* print informational messages (ie, -v was specified) */
 	boolean_t verbose;
 
 	/* the destination is a prefix, not the exact fs (ie, -d) */
 	boolean_t isprefix;
 
 	/*
 	 * Only the tail of the sent snapshot path is appended to the
 	 * destination to determine the received snapshot name (ie, -e).
 	 */
 	boolean_t istail;
 
 	/* do not actually do the recv, just check if it would work (ie, -n) */
 	boolean_t dryrun;
 
 	/* rollback/destroy filesystems as necessary (eg, -F) */
 	boolean_t force;
 
 	/* set "canmount=off" on all modified filesystems */
 	boolean_t canmountoff;
 
 	/*
 	 * Mark the file systems as "resumable" and do not destroy them if the
 	 * receive is interrupted
 	 */
 	boolean_t resumable;
 
 	/* byteswap flag is used internally; callers need not specify */
 	boolean_t byteswap;
 
 	/* do not mount file systems as they are extracted (private) */
 	boolean_t nomount;
 } recvflags_t;
 
 extern int zfs_receive(libzfs_handle_t *, const char *, nvlist_t *,
     recvflags_t *, int, avl_tree_t *);
 
 typedef enum diff_flags {	/* distinct single bits, so values can be OR-ed */
 	ZFS_DIFF_PARSEABLE = 0x1,
 	ZFS_DIFF_TIMESTAMP = 0x2,
 	ZFS_DIFF_CLASSIFY = 0x4	/* NOTE(review): presumably for zfs_show_diffs() */
 } diff_flags_t;
 
 extern int zfs_show_diffs(zfs_handle_t *, int, const char *, const char *,
     int);
 
 /*
  * Miscellaneous functions.
  */
 extern const char *zfs_type_to_name(zfs_type_t);
 extern void zfs_refresh_properties(zfs_handle_t *);
 extern int zfs_name_valid(const char *, zfs_type_t);
 extern zfs_handle_t *zfs_path_to_zhandle(libzfs_handle_t *, char *, zfs_type_t);
 extern boolean_t zfs_dataset_exists(libzfs_handle_t *, const char *,
     zfs_type_t);
 extern int zfs_spa_version(zfs_handle_t *, int *);
 extern boolean_t zfs_bookmark_exists(const char *path);
 
 /*
  * Mount support functions.
  */
 extern boolean_t is_mounted(libzfs_handle_t *, const char *special, char **);
 extern boolean_t zfs_is_mounted(zfs_handle_t *, char **);
 extern int zfs_mount(zfs_handle_t *, const char *, int);
 extern int zfs_unmount(zfs_handle_t *, const char *, int);
 extern int zfs_unmountall(zfs_handle_t *, int);
 
 /*
  * Share support functions.
  */
 extern boolean_t zfs_is_shared(zfs_handle_t *);
 extern int zfs_share(zfs_handle_t *);
 extern int zfs_unshare(zfs_handle_t *);
 
 /*
  * Protocol-specific share support functions.
  */
 extern boolean_t zfs_is_shared_nfs(zfs_handle_t *, char **);
 extern boolean_t zfs_is_shared_smb(zfs_handle_t *, char **);
 extern int zfs_share_nfs(zfs_handle_t *);
 extern int zfs_share_smb(zfs_handle_t *);
 extern int zfs_shareall(zfs_handle_t *);
 extern int zfs_unshare_nfs(zfs_handle_t *, const char *);
 extern int zfs_unshare_smb(zfs_handle_t *, const char *);
 extern int zfs_unshareall_nfs(zfs_handle_t *);
 extern int zfs_unshareall_smb(zfs_handle_t *);
 extern int zfs_unshareall_bypath(zfs_handle_t *, const char *);
 extern int zfs_unshareall(zfs_handle_t *);
 extern int zfs_deleg_share_nfs(libzfs_handle_t *, char *, char *, char *,
     void *, void *, int, zfs_share_op_t);
 
 /*
  * FreeBSD-specific jail support function.
  */
 extern int zfs_jail(zfs_handle_t *, int, int);
 
 /*
  * When dealing with nvlists, verify() is extremely useful
  */
 #if !defined(verify)
 #if defined(NDEBUG)
 #define	verify(EX)	((void)(EX))	/* EX is still evaluated, result dropped */
 #else	/* !NDEBUG */
 #define	verify(EX)	assert(EX)
 #endif	/* NDEBUG */
 #endif	/* !defined(verify) */
 
 /*
  * Utility function to convert a number to a human-readable form.
  */
 extern void zfs_nicenum(uint64_t, char *, size_t);
 extern int zfs_nicestrtonum(libzfs_handle_t *, const char *, uint64_t *);
 
 /*
  * Given a device or file, determine if it is part of a pool.
  */
 extern int zpool_in_use(libzfs_handle_t *, int, pool_state_t *, char **,
     boolean_t *);
 
 /*
  * Label manipulation.
  */
 extern int zpool_read_label(int, nvlist_t **);
+extern int zpool_read_all_labels(int, nvlist_t **);
 extern int zpool_clear_label(int);
 
 /* is this zvol valid for use as a dump device? */
 extern int zvol_check_dump_config(char *);
 
 /*
  * Management interfaces for SMB ACL files
  */
 
 int zfs_smb_acl_add(libzfs_handle_t *, char *, char *, char *);
 int zfs_smb_acl_remove(libzfs_handle_t *, char *, char *, char *);
 int zfs_smb_acl_purge(libzfs_handle_t *, char *, char *);
 int zfs_smb_acl_rename(libzfs_handle_t *, char *, char *, char *, char *);
 
 /*
  * Enable and disable datasets within a pool by mounting/unmounting and
  * sharing/unsharing them.
  */
 extern int zpool_enable_datasets(zpool_handle_t *, const char *, int);
 extern int zpool_disable_datasets(zpool_handle_t *, boolean_t);
 
 /*
  * Mappings between vdev and FRU.
  */
 extern void libzfs_fru_refresh(libzfs_handle_t *);
 extern const char *libzfs_fru_lookup(libzfs_handle_t *, const char *);
 extern const char *libzfs_fru_devpath(libzfs_handle_t *, const char *);
 extern boolean_t libzfs_fru_compare(libzfs_handle_t *, const char *,
     const char *);
 extern boolean_t libzfs_fru_notself(libzfs_handle_t *, const char *);
 extern int zpool_fru_set(zpool_handle_t *, uint64_t, const char *);
 
 #ifndef illumos
 extern int zmount(const char *, const char *, int, char *, char *, int, char *,
     int);
 #endif
 
 #ifdef	__cplusplus
 }
 #endif
 
 #endif	/* _LIBZFS_H */
Index: stable/11/cddl/contrib/opensolaris/lib/libzfs/common/libzfs_import.c
===================================================================
--- stable/11/cddl/contrib/opensolaris/lib/libzfs/common/libzfs_import.c	(revision 326297)
+++ stable/11/cddl/contrib/opensolaris/lib/libzfs/common/libzfs_import.c	(revision 326298)
@@ -1,1750 +1,1835 @@
 /*
  * CDDL HEADER START
  *
  * The contents of this file are subject to the terms of the
  * Common Development and Distribution License (the "License").
  * You may not use this file except in compliance with the License.
  *
  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
  * or http://www.opensolaris.org/os/licensing.
  * See the License for the specific language governing permissions
  * and limitations under the License.
  *
  * When distributing Covered Code, include this CDDL HEADER in each
  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  * If applicable, add the following below this CDDL HEADER, with the
  * fields enclosed by brackets "[]" replaced with your own identifying
  * information: Portions Copyright [yyyy] [name of copyright owner]
  *
  * CDDL HEADER END
  */
 
 /*
  * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
  * Copyright (c) 2012, 2016 by Delphix. All rights reserved.
  * Copyright 2015 RackTop Systems.
  * Copyright 2016 Nexenta Systems, Inc.
  */
 
 /*
  * Pool import support functions.
  *
  * To import a pool, we rely on reading the configuration information from the
  * ZFS label of each device.  If we successfully read the label, then we
  * organize the configuration information in the following hierarchy:
  *
  * 	pool guid -> toplevel vdev guid -> label txg
  *
  * Duplicate entries matching this same tuple will be discarded.  Once we have
  * examined every device, we pick the best label txg config for each toplevel
  * vdev.  We then arrange these toplevel vdevs into a complete pool config, and
  * update any paths that have changed.  Finally, we attempt to import the pool
  * using our derived config, and record the results.
  */
 
+#include <aio.h>
 #include <ctype.h>
 #include <devid.h>
 #include <dirent.h>
 #include <errno.h>
 #include <libintl.h>
 #include <stddef.h>
 #include <stdlib.h>
 #include <string.h>
 #include <sys/stat.h>
 #include <unistd.h>
 #include <fcntl.h>
 #include <thread_pool.h>
 #include <libgeom.h>
 
 #include <sys/vdev_impl.h>
 
 #include "libzfs.h"
 #include "libzfs_impl.h"
 
 /*
  * Intermediate structures used to gather configuration information.
  */
 typedef struct config_entry {
 	uint64_t		ce_txg;
 	nvlist_t		*ce_config;
 	struct config_entry	*ce_next;
 } config_entry_t;
 
 typedef struct vdev_entry {
 	uint64_t		ve_guid;
 	config_entry_t		*ve_configs;
 	struct vdev_entry	*ve_next;
 } vdev_entry_t;
 
 typedef struct pool_entry {
 	uint64_t		pe_guid;
 	vdev_entry_t		*pe_vdevs;
 	struct pool_entry	*pe_next;
 } pool_entry_t;
 
 typedef struct name_entry {
 	char			*ne_name;
 	uint64_t		ne_guid;
 	struct name_entry	*ne_next;
 } name_entry_t;
 
 typedef struct pool_list {
 	pool_entry_t		*pools;
 	name_entry_t		*names;
 } pool_list_t;
 
 static char *
 get_devid(const char *path)
 {
 #ifdef have_devid
 	int fd;
 	ddi_devid_t devid;
 	char *minor, *ret;
 
 	if ((fd = open(path, O_RDONLY)) < 0)
 		return (NULL);
 
 	minor = NULL;
 	ret = NULL;
 	if (devid_get(fd, &devid) == 0) {
 		if (devid_get_minor_name(fd, &minor) == 0)
 			ret = devid_str_encode(devid, minor);
 		if (minor != NULL)
 			devid_str_free(minor);
 		devid_free(devid);
 	}
 	(void) close(fd);
 
 	return (ret);
 #else
 	return (NULL);
 #endif
 }
 
 
 /*
  * Go through and fix up any path and/or devid information for the given vdev
  * configuration.
  */
 static int
 fix_paths(nvlist_t *nv, name_entry_t *names)
 {
 	nvlist_t **child;
 	uint_t c, children;
 	uint64_t guid;
 	name_entry_t *ne, *best;
 	char *path, *devid;
 	int matched;
 
 	if (nvlist_lookup_nvlist_array(nv, ZPOOL_CONFIG_CHILDREN,
 	    &child, &children) == 0) {
 		for (c = 0; c < children; c++)
 			if (fix_paths(child[c], names) != 0)
 				return (-1);
 		return (0);
 	}
 
 	/*
 	 * This is a leaf (file or disk) vdev.  In either case, go through
 	 * the name list and see if we find a matching guid.  If so, replace
 	 * the path and see if we can calculate a new devid.
 	 *
 	 * There may be multiple names associated with a particular guid, in
 	 * which case we have overlapping slices or multiple paths to the same
 	 * disk.  If this is the case, then we want to pick the path that is
 	 * the most similar to the original, where "most similar" is the number
 	 * of matching characters starting from the end of the path.  This will
 	 * preserve slice numbers even if the disks have been reorganized, and
 	 * will also catch preferred disk names if multiple paths exist.
 	 */
 	verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_GUID, &guid) == 0);
 	if (nvlist_lookup_string(nv, ZPOOL_CONFIG_PATH, &path) != 0)
 		path = NULL;
 
 	matched = 0;
 	best = NULL;
 	for (ne = names; ne != NULL; ne = ne->ne_next) {
 		if (ne->ne_guid == guid) {
 			const char *src, *dst;
 			int count;
 
 			if (path == NULL) {
 				best = ne;
 				break;
 			}
 
 			src = ne->ne_name + strlen(ne->ne_name) - 1;
 			dst = path + strlen(path) - 1;
 			for (count = 0; src >= ne->ne_name && dst >= path;
 			    src--, dst--, count++)
 				if (*src != *dst)
 					break;
 
 			/*
 			 * At this point, 'count' is the number of characters
 			 * matched from the end.
 			 */
 			if (count > matched || best == NULL) {
 				best = ne;
 				matched = count;
 			}
 		}
 	}
 
 	if (best == NULL)
 		return (0);
 
 	if (nvlist_add_string(nv, ZPOOL_CONFIG_PATH, best->ne_name) != 0)
 		return (-1);
 
 	if ((devid = get_devid(best->ne_name)) == NULL) {
 		(void) nvlist_remove_all(nv, ZPOOL_CONFIG_DEVID);
 	} else {
 		if (nvlist_add_string(nv, ZPOOL_CONFIG_DEVID, devid) != 0) {
 			devid_str_free(devid);
 			return (-1);
 		}
 		devid_str_free(devid);
 	}
 
 	return (0);
 }
 
 /*
  * Add the given configuration to the list of known devices.
  */
 static int
 add_config(libzfs_handle_t *hdl, pool_list_t *pl, const char *path,
     nvlist_t *config)
 {
 	uint64_t pool_guid, vdev_guid, top_guid, txg, state;
 	pool_entry_t *pe;
 	vdev_entry_t *ve;
 	config_entry_t *ce;
 	name_entry_t *ne;
 
 	/*
 	 * If this is a hot spare not currently in use or level 2 cache
 	 * device, add it to the list of names to translate, but don't do
 	 * anything else.
 	 */
 	if (nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_STATE,
 	    &state) == 0 &&
 	    (state == POOL_STATE_SPARE || state == POOL_STATE_L2CACHE) &&
 	    nvlist_lookup_uint64(config, ZPOOL_CONFIG_GUID, &vdev_guid) == 0) {
 		if ((ne = zfs_alloc(hdl, sizeof (name_entry_t))) == NULL)
 			return (-1);
 
 		if ((ne->ne_name = zfs_strdup(hdl, path)) == NULL) {
 			free(ne);
 			return (-1);
 		}
 		ne->ne_guid = vdev_guid;
 		ne->ne_next = pl->names;
 		pl->names = ne;
 		return (0);
 	}
 
 	/*
 	 * If we have a valid config but cannot read any of these fields, then
 	 * it means we have a half-initialized label.  In vdev_label_init()
 	 * we write a label with txg == 0 so that we can identify the device
 	 * in case the user refers to the same disk later on.  If we fail to
 	 * create the pool, we'll be left with a label in this state
 	 * which should not be considered part of a valid pool.
 	 */
 	if (nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID,
 	    &pool_guid) != 0 ||
 	    nvlist_lookup_uint64(config, ZPOOL_CONFIG_GUID,
 	    &vdev_guid) != 0 ||
 	    nvlist_lookup_uint64(config, ZPOOL_CONFIG_TOP_GUID,
 	    &top_guid) != 0 ||
 	    nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_TXG,
 	    &txg) != 0 || txg == 0) {
 		nvlist_free(config);
 		return (0);
 	}
 
 	/*
 	 * First, see if we know about this pool.  If not, then add it to the
 	 * list of known pools.
 	 */
 	for (pe = pl->pools; pe != NULL; pe = pe->pe_next) {
 		if (pe->pe_guid == pool_guid)
 			break;
 	}
 
 	if (pe == NULL) {
 		if ((pe = zfs_alloc(hdl, sizeof (pool_entry_t))) == NULL) {
 			nvlist_free(config);
 			return (-1);
 		}
 		pe->pe_guid = pool_guid;
 		pe->pe_next = pl->pools;
 		pl->pools = pe;
 	}
 
 	/*
 	 * Second, see if we know about this toplevel vdev.  Add it if its
 	 * missing.
 	 */
 	for (ve = pe->pe_vdevs; ve != NULL; ve = ve->ve_next) {
 		if (ve->ve_guid == top_guid)
 			break;
 	}
 
 	if (ve == NULL) {
 		if ((ve = zfs_alloc(hdl, sizeof (vdev_entry_t))) == NULL) {
 			nvlist_free(config);
 			return (-1);
 		}
 		ve->ve_guid = top_guid;
 		ve->ve_next = pe->pe_vdevs;
 		pe->pe_vdevs = ve;
 	}
 
 	/*
 	 * Third, see if we have a config with a matching transaction group.  If
 	 * so, then we do nothing.  Otherwise, add it to the list of known
 	 * configs.
 	 */
 	for (ce = ve->ve_configs; ce != NULL; ce = ce->ce_next) {
 		if (ce->ce_txg == txg)
 			break;
 	}
 
 	if (ce == NULL) {
 		if ((ce = zfs_alloc(hdl, sizeof (config_entry_t))) == NULL) {
 			nvlist_free(config);
 			return (-1);
 		}
 		ce->ce_txg = txg;
 		ce->ce_config = config;
 		ce->ce_next = ve->ve_configs;
 		ve->ve_configs = ce;
 	} else {
 		nvlist_free(config);
 	}
 
 	/*
 	 * At this point we've successfully added our config to the list of
 	 * known configs.  The last thing to do is add the vdev guid -> path
 	 * mappings so that we can fix up the configuration as necessary before
 	 * doing the import.
 	 */
 	if ((ne = zfs_alloc(hdl, sizeof (name_entry_t))) == NULL)
 		return (-1);
 
 	if ((ne->ne_name = zfs_strdup(hdl, path)) == NULL) {
 		free(ne);
 		return (-1);
 	}
 
 	ne->ne_guid = vdev_guid;
 	ne->ne_next = pl->names;
 	pl->names = ne;
 
 	return (0);
 }
 
 /*
  * Returns true if the named pool matches the given GUID.
  */
 static int
 pool_active(libzfs_handle_t *hdl, const char *name, uint64_t guid,
     boolean_t *isactive)
 {
 	zpool_handle_t *zhp;
 	uint64_t theguid;
 
 	if (zpool_open_silent(hdl, name, &zhp) != 0)
 		return (-1);
 
 	if (zhp == NULL) {
 		*isactive = B_FALSE;
 		return (0);
 	}
 
 	verify(nvlist_lookup_uint64(zhp->zpool_config, ZPOOL_CONFIG_POOL_GUID,
 	    &theguid) == 0);
 
 	zpool_close(zhp);
 
 	*isactive = (theguid == guid);
 	return (0);
 }
 
 static nvlist_t *
 refresh_config(libzfs_handle_t *hdl, nvlist_t *config)
 {
 	nvlist_t *nvl;
 	zfs_cmd_t zc = { 0 };
 	int err, dstbuf_size;
 
 	if (zcmd_write_conf_nvlist(hdl, &zc, config) != 0)
 		return (NULL);
 
 	dstbuf_size = MAX(CONFIG_BUF_MINSIZE, zc.zc_nvlist_conf_size * 4);
 
 	if (zcmd_alloc_dst_nvlist(hdl, &zc, dstbuf_size) != 0) {
 		zcmd_free_nvlists(&zc);
 		return (NULL);
 	}
 
 	while ((err = ioctl(hdl->libzfs_fd, ZFS_IOC_POOL_TRYIMPORT,
 	    &zc)) != 0 && errno == ENOMEM) {
 		if (zcmd_expand_dst_nvlist(hdl, &zc) != 0) {
 			zcmd_free_nvlists(&zc);
 			return (NULL);
 		}
 	}
 
 	if (err) {
 		zcmd_free_nvlists(&zc);
 		return (NULL);
 	}
 
 	if (zcmd_read_dst_nvlist(hdl, &zc, &nvl) != 0) {
 		zcmd_free_nvlists(&zc);
 		return (NULL);
 	}
 
 	zcmd_free_nvlists(&zc);
 	return (nvl);
 }
 
 /*
  * Determine if the vdev id is a hole in the namespace.
  */
 boolean_t
 vdev_is_hole(uint64_t *hole_array, uint_t holes, uint_t id)
 {
 	for (int c = 0; c < holes; c++) {
 
 		/* Top-level is a hole */
 		if (hole_array[c] == id)
 			return (B_TRUE);
 	}
 	return (B_FALSE);
 }
 
 /*
  * Convert our list of pools into the definitive set of configurations.  We
  * start by picking the best config for each toplevel vdev.  Once that's done,
  * we assemble the toplevel vdevs into a full config for the pool.  We make a
  * pass to fix up any incorrect paths, and then add it to the main list to
  * return to the user.
  */
 static nvlist_t *
 get_configs(libzfs_handle_t *hdl, pool_list_t *pl, boolean_t active_ok)
 {
 	pool_entry_t *pe;
 	vdev_entry_t *ve;
 	config_entry_t *ce;
 	nvlist_t *ret = NULL, *config = NULL, *tmp = NULL, *nvtop, *nvroot;
 	nvlist_t **spares, **l2cache;
 	uint_t i, nspares, nl2cache;
 	boolean_t config_seen;
 	uint64_t best_txg;
 	char *name, *hostname = NULL;
 	uint64_t guid;
 	uint_t children = 0;
 	nvlist_t **child = NULL;
 	uint_t holes;
 	uint64_t *hole_array, max_id;
 	uint_t c;
 	boolean_t isactive;
 	uint64_t hostid;
 	nvlist_t *nvl;
 	boolean_t found_one = B_FALSE;
 	boolean_t valid_top_config = B_FALSE;
 
 	if (nvlist_alloc(&ret, 0, 0) != 0)
 		goto nomem;
 
 	for (pe = pl->pools; pe != NULL; pe = pe->pe_next) {
 		uint64_t id, max_txg = 0;
 
 		if (nvlist_alloc(&config, NV_UNIQUE_NAME, 0) != 0)
 			goto nomem;
 		config_seen = B_FALSE;
 
 		/*
 		 * Iterate over all toplevel vdevs.  Grab the pool configuration
 		 * from the first one we find, and then go through the rest and
 		 * add them as necessary to the 'vdevs' member of the config.
 		 */
 		for (ve = pe->pe_vdevs; ve != NULL; ve = ve->ve_next) {
 
 			/*
 			 * Determine the best configuration for this vdev by
 			 * selecting the config with the latest transaction
 			 * group.
 			 */
 			best_txg = 0;
 			for (ce = ve->ve_configs; ce != NULL;
 			    ce = ce->ce_next) {
 
 				if (ce->ce_txg > best_txg) {
 					tmp = ce->ce_config;
 					best_txg = ce->ce_txg;
 				}
 			}
 
 			/*
 			 * We rely on the fact that the max txg for the
 			 * pool will contain the most up-to-date information
 			 * about the valid top-levels in the vdev namespace.
 			 */
 			if (best_txg > max_txg) {
 				(void) nvlist_remove(config,
 				    ZPOOL_CONFIG_VDEV_CHILDREN,
 				    DATA_TYPE_UINT64);
 				(void) nvlist_remove(config,
 				    ZPOOL_CONFIG_HOLE_ARRAY,
 				    DATA_TYPE_UINT64_ARRAY);
 
 				max_txg = best_txg;
 				hole_array = NULL;
 				holes = 0;
 				max_id = 0;
 				valid_top_config = B_FALSE;
 
 				if (nvlist_lookup_uint64(tmp,
 				    ZPOOL_CONFIG_VDEV_CHILDREN, &max_id) == 0) {
 					verify(nvlist_add_uint64(config,
 					    ZPOOL_CONFIG_VDEV_CHILDREN,
 					    max_id) == 0);
 					valid_top_config = B_TRUE;
 				}
 
 				if (nvlist_lookup_uint64_array(tmp,
 				    ZPOOL_CONFIG_HOLE_ARRAY, &hole_array,
 				    &holes) == 0) {
 					verify(nvlist_add_uint64_array(config,
 					    ZPOOL_CONFIG_HOLE_ARRAY,
 					    hole_array, holes) == 0);
 				}
 			}
 
 			if (!config_seen) {
 				/*
 				 * Copy the relevant pieces of data to the pool
 				 * configuration:
 				 *
 				 *	version
 				 *	pool guid
 				 *	name
 				 *	comment (if available)
 				 *	pool state
 				 *	hostid (if available)
 				 *	hostname (if available)
 				 */
 				uint64_t state, version;
 				char *comment = NULL;
 
 				version = fnvlist_lookup_uint64(tmp,
 				    ZPOOL_CONFIG_VERSION);
 				fnvlist_add_uint64(config,
 				    ZPOOL_CONFIG_VERSION, version);
 				guid = fnvlist_lookup_uint64(tmp,
 				    ZPOOL_CONFIG_POOL_GUID);
 				fnvlist_add_uint64(config,
 				    ZPOOL_CONFIG_POOL_GUID, guid);
 				name = fnvlist_lookup_string(tmp,
 				    ZPOOL_CONFIG_POOL_NAME);
 				fnvlist_add_string(config,
 				    ZPOOL_CONFIG_POOL_NAME, name);
 
 				if (nvlist_lookup_string(tmp,
 				    ZPOOL_CONFIG_COMMENT, &comment) == 0)
 					fnvlist_add_string(config,
 					    ZPOOL_CONFIG_COMMENT, comment);
 
 				state = fnvlist_lookup_uint64(tmp,
 				    ZPOOL_CONFIG_POOL_STATE);
 				fnvlist_add_uint64(config,
 				    ZPOOL_CONFIG_POOL_STATE, state);
 
 				hostid = 0;
 				if (nvlist_lookup_uint64(tmp,
 				    ZPOOL_CONFIG_HOSTID, &hostid) == 0) {
 					fnvlist_add_uint64(config,
 					    ZPOOL_CONFIG_HOSTID, hostid);
 					hostname = fnvlist_lookup_string(tmp,
 					    ZPOOL_CONFIG_HOSTNAME);
 					fnvlist_add_string(config,
 					    ZPOOL_CONFIG_HOSTNAME, hostname);
 				}
 
 				config_seen = B_TRUE;
 			}
 
 			/*
 			 * Add this top-level vdev to the child array.
 			 */
 			verify(nvlist_lookup_nvlist(tmp,
 			    ZPOOL_CONFIG_VDEV_TREE, &nvtop) == 0);
 			verify(nvlist_lookup_uint64(nvtop, ZPOOL_CONFIG_ID,
 			    &id) == 0);
 
 			if (id >= children) {
 				nvlist_t **newchild;
 
 				newchild = zfs_alloc(hdl, (id + 1) *
 				    sizeof (nvlist_t *));
 				if (newchild == NULL)
 					goto nomem;
 
 				for (c = 0; c < children; c++)
 					newchild[c] = child[c];
 
 				free(child);
 				child = newchild;
 				children = id + 1;
 			}
 			if (nvlist_dup(nvtop, &child[id], 0) != 0)
 				goto nomem;
 
 		}
 
 		/*
 		 * If we have information about all the top-levels then
 		 * clean up the nvlist which we've constructed. This
 		 * means removing any extraneous devices that are
 		 * beyond the valid range or adding devices to the end
 		 * of our array which appear to be missing.
 		 */
 		if (valid_top_config) {
 			if (max_id < children) {
 				for (c = max_id; c < children; c++)
 					nvlist_free(child[c]);
 				children = max_id;
 			} else if (max_id > children) {
 				nvlist_t **newchild;
 
 				newchild = zfs_alloc(hdl, (max_id) *
 				    sizeof (nvlist_t *));
 				if (newchild == NULL)
 					goto nomem;
 
 				for (c = 0; c < children; c++)
 					newchild[c] = child[c];
 
 				free(child);
 				child = newchild;
 				children = max_id;
 			}
 		}
 
 		verify(nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID,
 		    &guid) == 0);
 
 		/*
 		 * The vdev namespace may contain holes as a result of
 		 * device removal. We must add them back into the vdev
 		 * tree before we process any missing devices.
 		 */
 		if (holes > 0) {
 			ASSERT(valid_top_config);
 
 			for (c = 0; c < children; c++) {
 				nvlist_t *holey;
 
 				if (child[c] != NULL ||
 				    !vdev_is_hole(hole_array, holes, c))
 					continue;
 
 				if (nvlist_alloc(&holey, NV_UNIQUE_NAME,
 				    0) != 0)
 					goto nomem;
 
 				/*
 				 * Holes in the namespace are treated as
 				 * "hole" top-level vdevs and have a
 				 * special flag set on them.
 				 */
 				if (nvlist_add_string(holey,
 				    ZPOOL_CONFIG_TYPE,
 				    VDEV_TYPE_HOLE) != 0 ||
 				    nvlist_add_uint64(holey,
 				    ZPOOL_CONFIG_ID, c) != 0 ||
 				    nvlist_add_uint64(holey,
 				    ZPOOL_CONFIG_GUID, 0ULL) != 0) {
 					nvlist_free(holey);
 					goto nomem;
 				}
 				child[c] = holey;
 			}
 		}
 
 		/*
 		 * Look for any missing top-level vdevs.  If this is the case,
 		 * create a faked up 'missing' vdev as a placeholder.  We cannot
 		 * simply compress the child array, because the kernel performs
 		 * certain checks to make sure the vdev IDs match their location
 		 * in the configuration.
 		 */
 		for (c = 0; c < children; c++) {
 			if (child[c] == NULL) {
 				nvlist_t *missing;
 				if (nvlist_alloc(&missing, NV_UNIQUE_NAME,
 				    0) != 0)
 					goto nomem;
 				if (nvlist_add_string(missing,
 				    ZPOOL_CONFIG_TYPE,
 				    VDEV_TYPE_MISSING) != 0 ||
 				    nvlist_add_uint64(missing,
 				    ZPOOL_CONFIG_ID, c) != 0 ||
 				    nvlist_add_uint64(missing,
 				    ZPOOL_CONFIG_GUID, 0ULL) != 0) {
 					nvlist_free(missing);
 					goto nomem;
 				}
 				child[c] = missing;
 			}
 		}
 
 		/*
 		 * Put all of this pool's top-level vdevs into a root vdev.
 		 */
 		if (nvlist_alloc(&nvroot, NV_UNIQUE_NAME, 0) != 0)
 			goto nomem;
 		if (nvlist_add_string(nvroot, ZPOOL_CONFIG_TYPE,
 		    VDEV_TYPE_ROOT) != 0 ||
 		    nvlist_add_uint64(nvroot, ZPOOL_CONFIG_ID, 0ULL) != 0 ||
 		    nvlist_add_uint64(nvroot, ZPOOL_CONFIG_GUID, guid) != 0 ||
 		    nvlist_add_nvlist_array(nvroot, ZPOOL_CONFIG_CHILDREN,
 		    child, children) != 0) {
 			nvlist_free(nvroot);
 			goto nomem;
 		}
 
 		for (c = 0; c < children; c++)
 			nvlist_free(child[c]);
 		free(child);
 		children = 0;
 		child = NULL;
 
 		/*
 		 * Go through and fix up any paths and/or devids based on our
 		 * known list of vdev GUID -> path mappings.
 		 */
 		if (fix_paths(nvroot, pl->names) != 0) {
 			nvlist_free(nvroot);
 			goto nomem;
 		}
 
 		/*
 		 * Add the root vdev to this pool's configuration.
 		 */
 		if (nvlist_add_nvlist(config, ZPOOL_CONFIG_VDEV_TREE,
 		    nvroot) != 0) {
 			nvlist_free(nvroot);
 			goto nomem;
 		}
 		nvlist_free(nvroot);
 
 		/*
 		 * zdb uses this path to report on active pools that were
 		 * imported or created using -R.
 		 */
 		if (active_ok)
 			goto add_pool;
 
 		/*
 		 * Determine if this pool is currently active, in which case we
 		 * can't actually import it.
 		 */
 		verify(nvlist_lookup_string(config, ZPOOL_CONFIG_POOL_NAME,
 		    &name) == 0);
 		verify(nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID,
 		    &guid) == 0);
 
 		if (pool_active(hdl, name, guid, &isactive) != 0)
 			goto error;
 
 		if (isactive) {
 			nvlist_free(config);
 			config = NULL;
 			continue;
 		}
 
 		if ((nvl = refresh_config(hdl, config)) == NULL) {
 			nvlist_free(config);
 			config = NULL;
 			continue;
 		}
 
 		nvlist_free(config);
 		config = nvl;
 
 		/*
 		 * Go through and update the paths for spares, now that we have
 		 * them.
 		 */
 		verify(nvlist_lookup_nvlist(config, ZPOOL_CONFIG_VDEV_TREE,
 		    &nvroot) == 0);
 		if (nvlist_lookup_nvlist_array(nvroot, ZPOOL_CONFIG_SPARES,
 		    &spares, &nspares) == 0) {
 			for (i = 0; i < nspares; i++) {
 				if (fix_paths(spares[i], pl->names) != 0)
 					goto nomem;
 			}
 		}
 
 		/*
 		 * Update the paths for l2cache devices.
 		 */
 		if (nvlist_lookup_nvlist_array(nvroot, ZPOOL_CONFIG_L2CACHE,
 		    &l2cache, &nl2cache) == 0) {
 			for (i = 0; i < nl2cache; i++) {
 				if (fix_paths(l2cache[i], pl->names) != 0)
 					goto nomem;
 			}
 		}
 
 		/*
 		 * Restore the original information read from the actual label.
 		 */
 		(void) nvlist_remove(config, ZPOOL_CONFIG_HOSTID,
 		    DATA_TYPE_UINT64);
 		(void) nvlist_remove(config, ZPOOL_CONFIG_HOSTNAME,
 		    DATA_TYPE_STRING);
 		if (hostid != 0) {
 			verify(nvlist_add_uint64(config, ZPOOL_CONFIG_HOSTID,
 			    hostid) == 0);
 			verify(nvlist_add_string(config, ZPOOL_CONFIG_HOSTNAME,
 			    hostname) == 0);
 		}
 
 add_pool:
 		/*
 		 * Add this pool to the list of configs.
 		 */
 		verify(nvlist_lookup_string(config, ZPOOL_CONFIG_POOL_NAME,
 		    &name) == 0);
 		if (nvlist_add_nvlist(ret, name, config) != 0)
 			goto nomem;
 
 		found_one = B_TRUE;
 		nvlist_free(config);
 		config = NULL;
 	}
 
 	if (!found_one) {
 		nvlist_free(ret);
 		ret = NULL;
 	}
 
 	return (ret);
 
 nomem:
 	(void) no_memory(hdl);
 error:
 	nvlist_free(config);
 	nvlist_free(ret);
 	for (c = 0; c < children; c++)
 		nvlist_free(child[c]);
 	free(child);
 
 	return (NULL);
 }
 
 /*
  * Return the offset of the given label.
  */
 static uint64_t
 label_offset(uint64_t size, int l)
 {
 	ASSERT(P2PHASE_TYPED(size, sizeof (vdev_label_t), uint64_t) == 0);
 	return (l * sizeof (vdev_label_t) + (l < VDEV_LABELS / 2 ?
 	    0 : size - VDEV_LABELS * sizeof (vdev_label_t)));
 }
 
 /*
  * Given a file descriptor, read the label information and return an nvlist
  * describing the configuration, if there is one.
  * Return 0 on success, or -1 on failure
  */
 int
 zpool_read_label(int fd, nvlist_t **config)
 {
 	struct stat64 statbuf;
 	int l;
 	vdev_label_t *label;
 	uint64_t state, txg, size;
 
 	*config = NULL;
 
 	if (fstat64(fd, &statbuf) == -1)
 		return (-1);
 	size = P2ALIGN_TYPED(statbuf.st_size, sizeof (vdev_label_t), uint64_t);
 
 	if ((label = malloc(sizeof (vdev_label_t))) == NULL)
 		return (-1);
 
 	for (l = 0; l < VDEV_LABELS; l++) {
 		if (pread64(fd, label, sizeof (vdev_label_t),
 		    label_offset(size, l)) != sizeof (vdev_label_t))
 			continue;
 
 		if (nvlist_unpack(label->vl_vdev_phys.vp_nvlist,
 		    sizeof (label->vl_vdev_phys.vp_nvlist), config, 0) != 0)
 			continue;
 
 		if (nvlist_lookup_uint64(*config, ZPOOL_CONFIG_POOL_STATE,
 		    &state) != 0 || state > POOL_STATE_L2CACHE) {
 			nvlist_free(*config);
 			continue;
 		}
 
 		if (state != POOL_STATE_SPARE && state != POOL_STATE_L2CACHE &&
 		    (nvlist_lookup_uint64(*config, ZPOOL_CONFIG_POOL_TXG,
 		    &txg) != 0 || txg == 0)) {
 			nvlist_free(*config);
 			continue;
 		}
 
 		free(label);
 		return (0);
 	}
 
 	free(label);
 	*config = NULL;
 	return (-1);
+}
+
+/*
+ * Given a file descriptor, read all VDEV_LABELS labels with a single
+ * lio_listio() batch and validate each of them.  Returns the number of valid
+ * labels found; 0 is also returned if the fstat, allocation or batch fails.
+ * When at least one label is valid, the last valid one is returned via
+ * config and any earlier ones are freed.  The caller must free *config.
+ */
+int
+zpool_read_all_labels(int fd, nvlist_t **config)
+{
+	struct stat64 statbuf;
+	struct aiocb aiocbs[VDEV_LABELS], *aiocbps[VDEV_LABELS];
+	vdev_phys_t *labels;
+	uint64_t state, txg, size;
+	int l, nlabels = 0;
+
+	*config = NULL;
+
+	if (fstat64(fd, &statbuf) == -1)
+		return (0);
+	size = P2ALIGN_TYPED(statbuf.st_size, sizeof (vdev_label_t), uint64_t);
+
+	if ((labels = calloc(VDEV_LABELS, sizeof (vdev_phys_t))) == NULL)
+		return (0);
+
+	/* Read just the vdev_phys_t, VDEV_SKIP_SIZE into each label. */
+	memset(aiocbs, 0, sizeof(aiocbs));
+	for (l = 0; l < VDEV_LABELS; l++) {
+		aiocbs[l].aio_fildes = fd;
+		aiocbs[l].aio_offset = label_offset(size, l) + VDEV_SKIP_SIZE;
+		aiocbs[l].aio_buf = &labels[l];
+		aiocbs[l].aio_nbytes = sizeof(vdev_phys_t);
+		aiocbs[l].aio_lio_opcode = LIO_READ;
+		aiocbps[l] = &aiocbs[l];
+	}
+
+	if (lio_listio(LIO_WAIT, aiocbps, VDEV_LABELS, NULL) != 0) {
+		if (errno == EAGAIN || errno == EINTR || errno == EIO) {
+			/* Some requests may have been queued; reap them. */
+			for (l = 0; l < VDEV_LABELS; l++) {
+				errno = 0;
+				int r = aio_error(&aiocbs[l]);
+				if (r != EINVAL)
+					(void)aio_return(&aiocbs[l]);
+			}
+		}
+		free(labels);
+		return (0);
+	}
+
+	/* Unpack and sanity-check each label that was read in full. */
+	for (l = 0; l < VDEV_LABELS; l++) {
+		nvlist_t *temp = NULL;
+
+		if (aio_return(&aiocbs[l]) != sizeof(vdev_phys_t))
+			continue;
+
+		if (nvlist_unpack(labels[l].vp_nvlist,
+		    sizeof (labels[l].vp_nvlist), &temp, 0) != 0)
+			continue;
+
+		if (nvlist_lookup_uint64(temp, ZPOOL_CONFIG_POOL_STATE,
+		    &state) != 0 || state > POOL_STATE_L2CACHE) {
+			nvlist_free(temp);
+			continue;
+		}
+
+		if (state != POOL_STATE_SPARE && state != POOL_STATE_L2CACHE &&
+		    (nvlist_lookup_uint64(temp, ZPOOL_CONFIG_POOL_TXG,
+		    &txg) != 0 || txg == 0)) {
+			nvlist_free(temp);
+			continue;
+		}
+
+		/* Return one label only; free the one being replaced. */
+		nvlist_free(*config);
+		*config = temp;
+		nlabels++;
+	}
+
+	free(labels);
+	return (nlabels);
 }
 
 typedef struct rdsk_node {
 	char *rn_name;
 	int rn_dfd;
 	libzfs_handle_t *rn_hdl;
 	nvlist_t *rn_config;
 	avl_tree_t *rn_avl;
 	avl_node_t rn_node;
 	boolean_t rn_nozpool;
 } rdsk_node_t;
 
 static int
 slice_cache_compare(const void *arg1, const void *arg2)
 {
 	const char  *nm1 = ((rdsk_node_t *)arg1)->rn_name;
 	const char  *nm2 = ((rdsk_node_t *)arg2)->rn_name;
 	char *nm1slice, *nm2slice;
 	int rv;
 
 	/*
 	 * slices zero and two are the most likely to provide results,
 	 * so put those first
 	 */
 	nm1slice = strstr(nm1, "s0");
 	nm2slice = strstr(nm2, "s0");
 	if (nm1slice && !nm2slice) {
 		return (-1);
 	}
 	if (!nm1slice && nm2slice) {
 		return (1);
 	}
 	nm1slice = strstr(nm1, "s2");
 	nm2slice = strstr(nm2, "s2");
 	if (nm1slice && !nm2slice) {
 		return (-1);
 	}
 	if (!nm1slice && nm2slice) {
 		return (1);
 	}
 
 	rv = strcmp(nm1, nm2);
 	if (rv == 0)
 		return (0);
 	return (rv > 0 ? 1 : -1);
 }
 
 #ifdef illumos
 static void
 check_one_slice(avl_tree_t *r, char *diskname, uint_t partno,
     diskaddr_t size, uint_t blksz)
 {
 	rdsk_node_t tmpnode;
 	rdsk_node_t *node;
 	char sname[MAXNAMELEN];
 
 	tmpnode.rn_name = &sname[0];
 	(void) snprintf(tmpnode.rn_name, MAXNAMELEN, "%s%u",
 	    diskname, partno);
 	/*
 	 * protect against division by zero for disk labels that
 	 * contain a bogus sector size
 	 */
 	if (blksz == 0)
 		blksz = DEV_BSIZE;
 	/* too small to contain a zpool? */
 	if ((size < (SPA_MINDEVSIZE / blksz)) &&
 	    (node = avl_find(r, &tmpnode, NULL)))
 		node->rn_nozpool = B_TRUE;
 }
 #endif	/* illumos */
 
 static void
 nozpool_all_slices(avl_tree_t *r, const char *sname)
 {
 #ifdef illumos
 	char diskname[MAXNAMELEN];
 	char *ptr;
 	int i;
 
 	(void) strncpy(diskname, sname, MAXNAMELEN);
 	if (((ptr = strrchr(diskname, 's')) == NULL) &&
 	    ((ptr = strrchr(diskname, 'p')) == NULL))
 		return;
 	ptr[0] = 's';
 	ptr[1] = '\0';
 	for (i = 0; i < NDKMAP; i++)
 		check_one_slice(r, diskname, i, 0, 1);
 	ptr[0] = 'p';
 	for (i = 0; i <= FD_NUMPART; i++)
 		check_one_slice(r, diskname, i, 0, 1);
 #endif	/* illumos */
 }
 
 #ifdef illumos
 static void
 check_slices(avl_tree_t *r, int fd, const char *sname)
 {
 	struct extvtoc vtoc;
 	struct dk_gpt *gpt;
 	char diskname[MAXNAMELEN];
 	char *ptr;
 	int i;
 
 	(void) strncpy(diskname, sname, MAXNAMELEN);
 	if ((ptr = strrchr(diskname, 's')) == NULL || !isdigit(ptr[1]))
 		return;
 	ptr[1] = '\0';
 
 	if (read_extvtoc(fd, &vtoc) >= 0) {
 		for (i = 0; i < NDKMAP; i++)
 			check_one_slice(r, diskname, i,
 			    vtoc.v_part[i].p_size, vtoc.v_sectorsz);
 	} else if (efi_alloc_and_read(fd, &gpt) >= 0) {
 		/*
 		 * on x86 we'll still have leftover links that point
 		 * to slices s[9-15], so use NDKMAP instead
 		 */
 		for (i = 0; i < NDKMAP; i++)
 			check_one_slice(r, diskname, i,
 			    gpt->efi_parts[i].p_size, gpt->efi_lbasize);
 		/* nodes p[1-4] are never used with EFI labels */
 		ptr[0] = 'p';
 		for (i = 1; i <= FD_NUMPART; i++)
 			check_one_slice(r, diskname, i, 0, 1);
 		efi_free(gpt);
 	}
 }
 #endif	/* illumos */
 
 static void
 zpool_open_func(void *arg)
 {
 	rdsk_node_t *rn = arg;
 	struct stat64 statbuf;
 	nvlist_t *config;
 	int fd;
 
 	if (rn->rn_nozpool)
 		return;
 	if ((fd = openat64(rn->rn_dfd, rn->rn_name, O_RDONLY)) < 0) {
 		/* symlink to a device that's no longer there */
 		if (errno == ENOENT)
 			nozpool_all_slices(rn->rn_avl, rn->rn_name);
 		return;
 	}
 	/*
 	 * Ignore failed stats.  We only want regular
 	 * files, character devs and block devs.
 	 */
 	if (fstat64(fd, &statbuf) != 0 ||
 	    (!S_ISREG(statbuf.st_mode) &&
 	    !S_ISCHR(statbuf.st_mode) &&
 	    !S_ISBLK(statbuf.st_mode))) {
 		(void) close(fd);
 		return;
 	}
 	/* this file is too small to hold a zpool */
 #ifdef illumos
 	if (S_ISREG(statbuf.st_mode) &&
 	    statbuf.st_size < SPA_MINDEVSIZE) {
 		(void) close(fd);
 		return;
 	} else if (!S_ISREG(statbuf.st_mode)) {
 		/*
 		 * Try to read the disk label first so we don't have to
 		 * open a bunch of minor nodes that can't have a zpool.
 		 */
 		check_slices(rn->rn_avl, fd, rn->rn_name);
 	}
 #else	/* !illumos */
 	if (statbuf.st_size < SPA_MINDEVSIZE) {
 		(void) close(fd);
 		return;
 	}
 #endif	/* illumos */
 
 	if ((zpool_read_label(fd, &config)) != 0 && errno == ENOMEM) {
 		(void) close(fd);
 		(void) no_memory(rn->rn_hdl);
 		return;
 	}
 	(void) close(fd);
 
 	rn->rn_config = config;
 }
 
 /*
  * Given a file descriptor, clear (zero) the label information.
  */
 int
 zpool_clear_label(int fd)
 {
 	struct stat64 statbuf;
 	int l;
 	vdev_label_t *label;
 	uint64_t size;
 
 	if (fstat64(fd, &statbuf) == -1)
 		return (0);
 	size = P2ALIGN_TYPED(statbuf.st_size, sizeof (vdev_label_t), uint64_t);
 
 	if ((label = calloc(sizeof (vdev_label_t), 1)) == NULL)
 		return (-1);
 
 	for (l = 0; l < VDEV_LABELS; l++) {
 		if (pwrite64(fd, label, sizeof (vdev_label_t),
 		    label_offset(size, l)) != sizeof (vdev_label_t)) {
 			free(label);
 			return (-1);
 		}
 	}
 
 	free(label);
 	return (0);
 }
 
 /*
  * Given a list of directories to search, find all pools stored on disk.  This
  * includes partial pools which are not available to import.  If no search
  * paths are given (iarg->paths is 0), then the default directory (/dev) is
  * searched.  poolname or guid (but not both) are provided by the caller when
  * trying to import a specific pool.
  *
  * Returns whatever get_configs() produces for the collected labels.  NULL is
  * returned when a directory cannot be resolved or opened, when the GEOM tree
  * cannot be read, or when add_config() fails; in all cases the intermediate
  * pool/vdev/config/name lists are released before returning.
  */
 static nvlist_t *
 zpool_find_import_impl(libzfs_handle_t *hdl, importargs_t *iarg)
 {
 	int i, dirs = iarg->paths;
 	struct dirent64 *dp;
 	char path[MAXPATHLEN];
 	char *end, **dir = iarg->path;
 	size_t pathleft;
 	nvlist_t *ret = NULL;
 	static char *default_dir = "/dev";
 	pool_list_t pools = { 0 };
 	pool_entry_t *pe, *penext;
 	vdev_entry_t *ve, *venext;
 	config_entry_t *ce, *cenext;
 	name_entry_t *ne, *nenext;
 	avl_tree_t slice_cache;
 	rdsk_node_t *slice;
 	void *cookie;
 
 	if (dirs == 0) {
 		dirs = 1;
 		dir = &default_dir;
 	}
 
 	/*
 	 * Go through and read the label configuration information from every
 	 * possible device, organizing the information according to pool GUID
 	 * and toplevel GUID.
 	 */
 	for (i = 0; i < dirs; i++) {
 		tpool_t *t;
 		char rdsk[MAXPATHLEN];
 		int dfd;
 		int saved_errno;
 		boolean_t config_failed = B_FALSE;
 		DIR *dirp;
 
 		/* use realpath to normalize the path */
 		if (realpath(dir[i], path) == 0) {
 			(void) zfs_error_fmt(hdl, EZFS_BADPATH,
 			    dgettext(TEXT_DOMAIN, "cannot open '%s'"), dir[i]);
 			goto error;
 		}
 		end = &path[strlen(path)];
 		*end++ = '/';
 		*end = 0;
 		pathleft = &path[sizeof (path)] - end;
 
 #ifdef illumos
 		/*
 		 * Using raw devices instead of block devices when we're
 		 * reading the labels skips a bunch of slow operations during
 		 * close(2) processing, so we replace /dev/dsk with /dev/rdsk.
 		 */
 		if (strcmp(path, ZFS_DISK_ROOTD) == 0)
 			(void) strlcpy(rdsk, ZFS_RDISK_ROOTD, sizeof (rdsk));
 		else
 #endif
 			(void) strlcpy(rdsk, path, sizeof (rdsk));
 
 		if ((dfd = open64(rdsk, O_RDONLY)) < 0 ||
 		    (dirp = fdopendir(dfd)) == NULL) {
 			/* close() may overwrite errno; report the real cause */
 			saved_errno = errno;
 			if (dfd >= 0)
 				(void) close(dfd);
 			zfs_error_aux(hdl, "%s", strerror(saved_errno));
 			(void) zfs_error_fmt(hdl, EZFS_BADPATH,
 			    dgettext(TEXT_DOMAIN, "cannot open '%s'"),
 			    rdsk);
 			goto error;
 		}
 
 		avl_create(&slice_cache, slice_cache_compare,
 		    sizeof (rdsk_node_t), offsetof(rdsk_node_t, rn_node));
 
 		/*
 		 * For the top-level /dev directory the candidate list comes
 		 * from the GEOM provider names rather than from readdir().
 		 */
 		if (strcmp(rdsk, "/dev/") == 0) {
 			struct gmesh mesh;
 			struct gclass *mp;
 			struct ggeom *gp;
 			struct gprovider *pp;
 
 			errno = geom_gettree(&mesh);
 			if (errno != 0) {
 				zfs_error_aux(hdl, "%s", strerror(errno));
 				(void) zfs_error_fmt(hdl, EZFS_BADPATH,
 				    dgettext(TEXT_DOMAIN, "cannot get GEOM tree"));
 				/*
 				 * Nothing has been cached yet; release the
 				 * (empty) tree and the directory stream, which
 				 * also closes dfd, before bailing out.
 				 */
 				avl_destroy(&slice_cache);
 				(void) closedir(dirp);
 				goto error;
 			}
 
 			LIST_FOREACH(mp, &mesh.lg_class, lg_class) {
 				LIST_FOREACH(gp, &mp->lg_geom, lg_geom) {
 					LIST_FOREACH(pp, &gp->lg_provider, lg_provider) {
 						slice = zfs_alloc(hdl, sizeof (rdsk_node_t));
 						slice->rn_name = zfs_strdup(hdl, pp->lg_name);
 						slice->rn_avl = &slice_cache;
 						slice->rn_dfd = dfd;
 						slice->rn_hdl = hdl;
 						slice->rn_nozpool = B_FALSE;
 						avl_add(&slice_cache, slice);
 					}
 				}
 			}
 
 			geom_deletetree(&mesh);
 			goto skipdir;
 		}
 
 		/*
 		 * This is not MT-safe, but we have no MT consumers of libzfs
 		 */
 		while ((dp = readdir64(dirp)) != NULL) {
 			const char *name = dp->d_name;
 			if (name[0] == '.' &&
 			    (name[1] == 0 || (name[1] == '.' && name[2] == 0)))
 				continue;
 
 			slice = zfs_alloc(hdl, sizeof (rdsk_node_t));
 			slice->rn_name = zfs_strdup(hdl, name);
 			slice->rn_avl = &slice_cache;
 			slice->rn_dfd = dfd;
 			slice->rn_hdl = hdl;
 			slice->rn_nozpool = B_FALSE;
 			avl_add(&slice_cache, slice);
 		}
 skipdir:
 		/*
 		 * create a thread pool to do all of this in parallel;
 		 * rn_nozpool is not protected, so this is racy in that
 		 * multiple tasks could decide that the same slice can
 		 * not hold a zpool, which is benign.  Also choose
 		 * double the number of processors; we hold a lot of
 		 * locks in the kernel, so going beyond this doesn't
 		 * buy us much.
 		 */
 		t = tpool_create(1, 2 * sysconf(_SC_NPROCESSORS_ONLN),
 		    0, NULL);
 		for (slice = avl_first(&slice_cache); slice;
 		    (slice = avl_walk(&slice_cache, slice,
 		    AVL_AFTER)))
 			(void) tpool_dispatch(t, zpool_open_func, slice);
 		tpool_wait(t);
 		tpool_destroy(t);
 
 		cookie = NULL;
 		while ((slice = avl_destroy_nodes(&slice_cache,
 		    &cookie)) != NULL) {
 			if (slice->rn_config != NULL && !config_failed) {
 				nvlist_t *config = slice->rn_config;
 				boolean_t matched = B_TRUE;
 
 				if (iarg->poolname != NULL) {
 					char *pname;
 
 					matched = nvlist_lookup_string(config,
 					    ZPOOL_CONFIG_POOL_NAME,
 					    &pname) == 0 &&
 					    strcmp(iarg->poolname, pname) == 0;
 				} else if (iarg->guid != 0) {
 					uint64_t this_guid;
 
 					matched = nvlist_lookup_uint64(config,
 					    ZPOOL_CONFIG_POOL_GUID,
 					    &this_guid) == 0 &&
 					    iarg->guid == this_guid;
 				}
 				if (!matched) {
 					nvlist_free(config);
 				} else {
 					/*
 					 * use the non-raw path for the config
 					 */
 					(void) strlcpy(end, slice->rn_name,
 					    pathleft);
 					if (add_config(hdl, &pools, path,
 					    config) != 0)
 						config_failed = B_TRUE;
 				}
 			} else if (slice->rn_config != NULL) {
 				/*
 				 * An earlier add_config() failed, so this
 				 * label was never handed off; free it here
 				 * rather than leaking it.
 				 */
 				nvlist_free(slice->rn_config);
 			}
 			free(slice->rn_name);
 			free(slice);
 		}
 		avl_destroy(&slice_cache);
 
 		(void) closedir(dirp);
 
 		if (config_failed)
 			goto error;
 	}
 
 	ret = get_configs(hdl, &pools, iarg->can_be_active);
 
 error:
 	/* Shared teardown: runs on success as well as on every failure. */
 	for (pe = pools.pools; pe != NULL; pe = penext) {
 		penext = pe->pe_next;
 		for (ve = pe->pe_vdevs; ve != NULL; ve = venext) {
 			venext = ve->ve_next;
 			for (ce = ve->ve_configs; ce != NULL; ce = cenext) {
 				cenext = ce->ce_next;
 				nvlist_free(ce->ce_config);
 				free(ce);
 			}
 			free(ve);
 		}
 		free(pe);
 	}
 
 	for (ne = pools.names; ne != NULL; ne = nenext) {
 		nenext = ne->ne_next;
 		free(ne->ne_name);
 		free(ne);
 	}
 
 	return (ret);
 }
 
 /*
  * Search the 'argc' directories listed in 'argv' for importable pools.
  * No pool name, guid or cache file filter is applied; every other
  * importargs_t field is left zeroed.
  */
 nvlist_t *
 zpool_find_import(libzfs_handle_t *hdl, int argc, char **argv)
 {
 	importargs_t args = { 0 };
 	nvlist_t *found;
 
 	args.path = argv;
 	args.paths = argc;
 	found = zpool_find_import_impl(hdl, &args);
 
 	return (found);
 }
 
 /*
  * Given a cache file, return the contents as a list of importable pools.
  * poolname or guid (but not both) are provided by the caller when trying
  * to import a specific pool.
  *
  * The whole file is read into memory and unpacked as an nvlist.  Each
  * entry whose name/guid passes the filter and which pool_active() does
  * not report as active is passed through refresh_config() and added to
  * the result under its original pair name.
  *
  * Returns the resulting nvlist (possibly with no entries), or NULL if the
  * file cannot be opened, sized, read or unpacked, or if any allocation,
  * pool_active() or refresh_config() call fails.
  */
 nvlist_t *
 zpool_find_import_cached(libzfs_handle_t *hdl, const char *cachefile,
     char *poolname, uint64_t guid)
 {
 	char *buf;
 	int fd;
 	struct stat64 statbuf;
 	nvlist_t *raw, *src, *dst;
 	nvlist_t *pools;
 	nvpair_t *elem;
 	char *name;
 	uint64_t this_guid;
 	boolean_t active;
 
 	/* At most one of the two filters may be supplied. */
 	verify(poolname == NULL || guid == 0);
 
 	if ((fd = open(cachefile, O_RDONLY)) < 0) {
 		zfs_error_aux(hdl, "%s", strerror(errno));
 		(void) zfs_error(hdl, EZFS_BADCACHE,
 		    dgettext(TEXT_DOMAIN, "failed to open cache file"));
 		return (NULL);
 	}
 
 	if (fstat64(fd, &statbuf) != 0) {
 		/* record errno before close() has a chance to change it */
 		zfs_error_aux(hdl, "%s", strerror(errno));
 		(void) close(fd);
 		(void) zfs_error(hdl, EZFS_BADCACHE,
 		    dgettext(TEXT_DOMAIN, "failed to get size of cache file"));
 		return (NULL);
 	}
 
 	if ((buf = zfs_alloc(hdl, statbuf.st_size)) == NULL) {
 		(void) close(fd);
 		return (NULL);
 	}
 
 	/* A short read is treated the same as a read error. */
 	if (read(fd, buf, statbuf.st_size) != statbuf.st_size) {
 		(void) close(fd);
 		free(buf);
 		(void) zfs_error(hdl, EZFS_BADCACHE,
 		    dgettext(TEXT_DOMAIN,
 		    "failed to read cache file contents"));
 		return (NULL);
 	}
 
 	(void) close(fd);
 
 	if (nvlist_unpack(buf, statbuf.st_size, &raw, 0) != 0) {
 		free(buf);
 		(void) zfs_error(hdl, EZFS_BADCACHE,
 		    dgettext(TEXT_DOMAIN,
 		    "invalid or corrupt cache file contents"));
 		return (NULL);
 	}
 
 	/* The packed buffer is not referenced again after unpacking. */
 	free(buf);
 
 	/*
 	 * Go through and get the current state of the pools and refresh their
 	 * state.
 	 */
 	if (nvlist_alloc(&pools, 0, 0) != 0) {
 		(void) no_memory(hdl);
 		nvlist_free(raw);
 		return (NULL);
 	}
 
 	elem = NULL;
 	while ((elem = nvlist_next_nvpair(raw, elem)) != NULL) {
 		src = fnvpair_value_nvlist(elem);
 
 		/* Apply the optional name filter. */
 		name = fnvlist_lookup_string(src, ZPOOL_CONFIG_POOL_NAME);
 		if (poolname != NULL && strcmp(poolname, name) != 0)
 			continue;
 
 		/* Apply the optional guid filter. */
 		this_guid = fnvlist_lookup_uint64(src, ZPOOL_CONFIG_POOL_GUID);
 		if (guid != 0 && guid != this_guid)
 			continue;
 
 		if (pool_active(hdl, name, this_guid, &active) != 0) {
 			nvlist_free(raw);
 			nvlist_free(pools);
 			return (NULL);
 		}
 
 		/* Pools reported as active are left out of the result. */
 		if (active)
 			continue;
 
 		if ((dst = refresh_config(hdl, src)) == NULL) {
 			nvlist_free(raw);
 			nvlist_free(pools);
 			return (NULL);
 		}
 
 		if (nvlist_add_nvlist(pools, nvpair_name(elem), dst) != 0) {
 			(void) no_memory(hdl);
 			nvlist_free(dst);
 			nvlist_free(raw);
 			nvlist_free(pools);
 			return (NULL);
 		}
 		/* dst is released here even though it was just added. */
 		nvlist_free(dst);
 	}
 
 	nvlist_free(raw);
 	return (pools);
 }
 
 /*
  * zpool_iter() callback: report whether the open pool 'zhp' matches the
  * importargs_t passed in 'data'.  The pool name is compared when
  * poolname is set, otherwise the pool guid is compared.  The handle is
  * always closed.  Returns 1 on a match and 0 otherwise.
  */
 static int
 name_or_guid_exists(zpool_handle_t *zhp, void *data)
 {
 	importargs_t *args = data;
 	int match;
 
 	if (args->poolname == NULL) {
 		uint64_t cur_guid;
 
 		verify(nvlist_lookup_uint64(zhp->zpool_config,
 		    ZPOOL_CONFIG_POOL_GUID, &cur_guid) == 0);
 		match = (cur_guid == args->guid) ? 1 : 0;
 	} else {
 		char *cur_name;
 
 		verify(nvlist_lookup_string(zhp->zpool_config,
 		    ZPOOL_CONFIG_POOL_NAME, &cur_name) == 0);
 		match = (strcmp(cur_name, args->poolname) == 0) ? 1 : 0;
 	}
 
 	zpool_close(zhp);
 	return (match);
 }
 
 /*
  * Locate importable pools as described by 'import'.  When import->unique
  * is set, import->exists is first filled in from a scan of the pools
  * visited by zpool_iter().  The search itself reads the cache file if
  * one is named and scans the device directories otherwise.
  */
 nvlist_t *
 zpool_search_import(libzfs_handle_t *hdl, importargs_t *import)
 {
 	nvlist_t *result;
 
 	verify(import->poolname == NULL || import->guid == 0);
 
 	if (import->unique)
 		import->exists = zpool_iter(hdl, name_or_guid_exists, import);
 
 	if (import->cachefile == NULL) {
 		result = zpool_find_import_impl(hdl, import);
 	} else {
 		result = zpool_find_import_cached(hdl, import->cachefile,
 		    import->poolname, import->guid);
 	}
 
 	return (result);
 }
 
 /*
  * Depth-first search of the vdev tree rooted at 'nv' for a node whose
  * ZPOOL_CONFIG_GUID equals 'guid'.  Returns B_TRUE as soon as one is
  * found and B_FALSE if the whole subtree has been visited without a match.
  */
 boolean_t
 find_guid(nvlist_t *nv, uint64_t guid)
 {
 	uint64_t this_guid;
 	nvlist_t **kids;
 	uint_t nkids, i;
 
 	verify(nvlist_lookup_uint64(nv, ZPOOL_CONFIG_GUID, &this_guid) == 0);
 	if (this_guid == guid)
 		return (B_TRUE);
 
 	/* A node without a children array is a leaf. */
 	if (nvlist_lookup_nvlist_array(nv, ZPOOL_CONFIG_CHILDREN,
 	    &kids, &nkids) != 0)
 		return (B_FALSE);
 
 	for (i = 0; i < nkids; i++) {
 		if (find_guid(kids[i], guid))
 			return (B_TRUE);
 	}
 
 	return (B_FALSE);
 }
 
 /*
  * Search state shared between zpool_in_use() and its find_aux() callback.
  */
 typedef struct aux_cbdata {
 	const char	*cb_type;	/* vdev-tree array name to search */
 	uint64_t	cb_guid;	/* vdev guid being looked for */
 	zpool_handle_t	*cb_zhp;	/* set by find_aux() to the matching pool */
 } aux_cbdata_t;
 
 /*
  * zpool_iter() callback: look through the cb_type array of this pool's
  * vdev tree for an entry whose guid equals cb_guid.  On a match the
  * still-open handle is stored in cb_zhp and 1 is returned, leaving the
  * caller responsible for closing it.  Otherwise the handle is closed
  * here and 0 is returned.
  */
 static int
 find_aux(zpool_handle_t *zhp, void *data)
 {
 	aux_cbdata_t *cb = data;
 	nvlist_t *root;
 	nvlist_t **devs;
 	uint_t ndevs, idx;
 	uint64_t dev_guid;
 
 	verify(nvlist_lookup_nvlist(zhp->zpool_config, ZPOOL_CONFIG_VDEV_TREE,
 	    &root) == 0);
 
 	if (nvlist_lookup_nvlist_array(root, cb->cb_type,
 	    &devs, &ndevs) != 0) {
 		zpool_close(zhp);
 		return (0);
 	}
 
 	for (idx = 0; idx < ndevs; idx++) {
 		verify(nvlist_lookup_uint64(devs[idx],
 		    ZPOOL_CONFIG_GUID, &dev_guid) == 0);
 		if (dev_guid != cb->cb_guid)
 			continue;
 
 		cb->cb_zhp = zhp;
 		return (1);
 	}
 
 	zpool_close(zhp);
 	return (0);
 }
 
 /*
  * Determines if the device open on 'fd' is in use by a pool.  The answer is
  * stored in *inuse.  When it is B_TRUE, *state receives the (possibly
  * adjusted) pool state and *namestr receives a copy of the pool name made
  * with zfs_strdup(), which the caller must free.  *state and *namestr are
  * not written when *inuse ends up B_FALSE.
  *
  * Returns 0 on success (including "no label found") and -1 if the label
  * read fails with ENOMEM, pool_active() fails, or the name cannot be
  * duplicated.
  */
 int
 zpool_in_use(libzfs_handle_t *hdl, int fd, pool_state_t *state, char **namestr,
     boolean_t *inuse)
 {
 	nvlist_t *config;
 	char *name;
 	boolean_t ret;
 	uint64_t guid, vdev_guid;
 	zpool_handle_t *zhp;
 	nvlist_t *pool_config;
 	uint64_t stateval, isspare;
 	aux_cbdata_t cb = { 0 };
 	boolean_t isactive;
 
 	*inuse = B_FALSE;
 
 	if (zpool_read_label(fd, &config) != 0 && errno == ENOMEM) {
 		(void) no_memory(hdl);
 		return (-1);
 	}
 
 	/* No label: report "not in use" via the default *inuse. */
 	if (config == NULL)
 		return (0);
 
 	verify(nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_STATE,
 	    &stateval) == 0);
 	verify(nvlist_lookup_uint64(config, ZPOOL_CONFIG_GUID,
 	    &vdev_guid) == 0);
 
 	/*
 	 * The pool name and guid are only looked up for labels that are not
 	 * in the spare or l2cache state.
 	 */
 	if (stateval != POOL_STATE_SPARE && stateval != POOL_STATE_L2CACHE) {
 		verify(nvlist_lookup_string(config, ZPOOL_CONFIG_POOL_NAME,
 		    &name) == 0);
 		verify(nvlist_lookup_uint64(config, ZPOOL_CONFIG_POOL_GUID,
 		    &guid) == 0);
 	}
 
 	switch (stateval) {
 	case POOL_STATE_EXPORTED:
 		/*
 		 * A pool with an exported state may in fact be imported
 		 * read-only, so check the in-core state to see if it's
 		 * active and imported read-only.  If it is, set
 		 * its state to active.
 		 */
 		if (pool_active(hdl, name, guid, &isactive) == 0 && isactive &&
 		    (zhp = zpool_open_canfail(hdl, name)) != NULL) {
 			if (zpool_get_prop_int(zhp, ZPOOL_PROP_READONLY, NULL))
 				stateval = POOL_STATE_ACTIVE;
 
 			/*
 			 * All we needed the zpool handle for is the
 			 * readonly prop check.
 			 */
 			zpool_close(zhp);
 		}
 
 		ret = B_TRUE;
 		break;
 
 	case POOL_STATE_ACTIVE:
 		/*
 		 * For an active pool, we have to determine if it's really part
 		 * of a currently active pool (in which case the pool will exist
 		 * and the guid will be the same), or whether it's part of an
 		 * active pool that was disconnected without being explicitly
 		 * exported.
 		 */
 		if (pool_active(hdl, name, guid, &isactive) != 0) {
 			nvlist_free(config);
 			return (-1);
 		}
 
 		if (isactive) {
 			/*
 			 * Because the device may have been removed while
 			 * offlined, we only report it as active if the vdev is
 			 * still present in the config.  Otherwise, pretend like
 			 * it's not in use.
 			 */
 			if ((zhp = zpool_open_canfail(hdl, name)) != NULL &&
 			    (pool_config = zpool_get_config(zhp, NULL))
 			    != NULL) {
 				nvlist_t *nvroot;
 
 				verify(nvlist_lookup_nvlist(pool_config,
 				    ZPOOL_CONFIG_VDEV_TREE, &nvroot) == 0);
 				ret = find_guid(nvroot, vdev_guid);
 			} else {
 				ret = B_FALSE;
 			}
 
 			/*
 			 * If this is an active spare within another pool, we
 			 * treat it like an unused hot spare.  This allows the
 			 * user to create a pool with a hot spare that currently
 			 * in use within another pool.  Since we return B_TRUE,
 			 * libdiskmgt will continue to prevent generic consumers
 			 * from using the device.
 			 */
 			if (ret && nvlist_lookup_uint64(config,
 			    ZPOOL_CONFIG_IS_SPARE, &isspare) == 0 && isspare)
 				stateval = POOL_STATE_SPARE;
 
 			/* zhp may be open even when the config lookup failed */
 			if (zhp != NULL)
 				zpool_close(zhp);
 		} else {
 			stateval = POOL_STATE_POTENTIALLY_ACTIVE;
 			ret = B_TRUE;
 		}
 		break;
 
 	case POOL_STATE_SPARE:
 		/*
 		 * For a hot spare, it can be either definitively in use, or
 		 * potentially active.  To determine if it's in use, we iterate
 		 * over all pools in the system and search for one with a spare
 		 * with a matching guid.
 		 *
 		 * Due to the shared nature of spares, we don't actually report
 		 * the potentially active case as in use.  This means the user
 		 * can freely create pools on the hot spares of exported pools,
 		 * but to do otherwise makes the resulting code complicated, and
 		 * we end up having to deal with this case anyway.
 		 */
 		cb.cb_zhp = NULL;
 		cb.cb_guid = vdev_guid;
 		cb.cb_type = ZPOOL_CONFIG_SPARES;
 		if (zpool_iter(hdl, find_aux, &cb) == 1) {
 			/* name points into cb.cb_zhp, which stays open until the end */
 			name = (char *)zpool_get_name(cb.cb_zhp);
 			ret = B_TRUE;
 		} else {
 			ret = B_FALSE;
 		}
 		break;
 
 	case POOL_STATE_L2CACHE:
 
 		/*
 		 * Check if any pool is currently using this l2cache device.
 		 */
 		cb.cb_zhp = NULL;
 		cb.cb_guid = vdev_guid;
 		cb.cb_type = ZPOOL_CONFIG_L2CACHE;
 		if (zpool_iter(hdl, find_aux, &cb) == 1) {
 			name = (char *)zpool_get_name(cb.cb_zhp);
 			ret = B_TRUE;
 		} else {
 			ret = B_FALSE;
 		}
 		break;
 
 	default:
 		ret = B_FALSE;
 	}
 
 
 	if (ret) {
 		/* Copy the name before its backing storage is released below. */
 		if ((*namestr = zfs_strdup(hdl, name)) == NULL) {
 			if (cb.cb_zhp)
 				zpool_close(cb.cb_zhp);
 			nvlist_free(config);
 			return (-1);
 		}
 		*state = (pool_state_t)stateval;
 	}
 
 	/* Close the handle that find_aux() left open for us, if any. */
 	if (cb.cb_zhp)
 		zpool_close(cb.cb_zhp);
 
 	nvlist_free(config);
 	*inuse = ret;
 	return (0);
 }
Index: stable/11/cddl/usr.sbin/zfsd/zfsd_event.cc
===================================================================
--- stable/11/cddl/usr.sbin/zfsd/zfsd_event.cc	(revision 326297)
+++ stable/11/cddl/usr.sbin/zfsd/zfsd_event.cc	(revision 326298)
@@ -1,535 +1,548 @@
 /*-
  * Copyright (c) 2011, 2012, 2013, 2014, 2016 Spectra Logic Corporation
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions, and the following disclaimer,
  *    without modification.
  * 2. Redistributions in binary form must reproduce at minimum a disclaimer
  *    substantially similar to the "NO WARRANTY" disclaimer below
  *    ("Disclaimer") and any redistribution must be conditioned upon
  *    including a substantially similar Disclaimer requirement for further
  *    binary redistribution.
  *
  * NO WARRANTY
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTIBILITY AND FITNESS FOR
  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  * HOLDERS OR CONTRIBUTORS BE LIABLE FOR SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
  * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  * POSSIBILITY OF SUCH DAMAGES.
  *
  * Authors: Justin T. Gibbs     (Spectra Logic Corporation)
  */
 
 /**
  * \file zfsd_event.cc
  */
 #include <sys/cdefs.h>
 #include <sys/time.h>
 #include <sys/fs/zfs.h>
+#include <sys/vdev_impl.h>
 
 #include <syslog.h>
 
 #include <libzfs.h>
 /* 
  * Undefine flush, defined by cpufunc.h on sparc64, because it conflicts with
  * C++ flush methods
  */
 #undef   flush
 
 #include <list>
 #include <map>
 #include <sstream>
 #include <string>
 
 #include <devdctl/guid.h>
 #include <devdctl/event.h>
 #include <devdctl/event_factory.h>
 #include <devdctl/exception.h>
 #include <devdctl/consumer.h>
 
 #include "callout.h"
 #include "vdev_iterator.h"
 #include "zfsd_event.h"
 #include "case_file.h"
 #include "vdev.h"
 #include "zfsd.h"
 #include "zfsd_exception.h"
 #include "zpool_list.h"
 
 __FBSDID("$FreeBSD$");
 /*============================ Namespace Control =============================*/
 using DevdCtl::Event;
 using DevdCtl::Guid;
 using DevdCtl::NVPairMap;
 using std::stringstream;
 
 /*=========================== Class Implementations ==========================*/
 
 /*-------------------------------- DevfsEvent --------------------------------*/
 
 //- DevfsEvent Static Public Methods -------------------------------------------
 /* Factory hook: heap-allocates a DevfsEvent from the parsed event data. */
 Event *
 DevfsEvent::Builder(Event::Type type,
 		    NVPairMap &nvPairs,
 		    const string &eventString)
 {
 	Event *event(new DevfsEvent(type, nvPairs, eventString));
 
 	return (event);
 }
 
 //- DevfsEvent Static Protected Methods ----------------------------------------
 /**
  * \brief Read the ZFS label from an open device.
  *
  * \param devFd     Open file descriptor for the device.
  * \param inUse     Set to true when zpool_in_use() reports the device as
  *                  in use; false otherwise.
  * \param degraded  Set to true when a Vdev built from the label reports a
  *                  state other than VDEV_STATE_HEALTHY.
  *
  * \return  The label nvlist when one was read and a Vdev could be
  *          constructed from it, otherwise NULL.  Process() releases the
  *          returned list with nvlist_free().
  */
 nvlist_t *
 DevfsEvent::ReadLabel(int devFd, bool &inUse, bool &degraded)
 {
 	pool_state_t poolState;
 	char        *poolName;
 	boolean_t    b_inuse;
+	int          nlabels;
 
 	inUse    = false;
 	degraded = false;
 	poolName = NULL;
 	if (zpool_in_use(g_zfsHandle, devFd, &poolState,
 			 &poolName, &b_inuse) == 0) {
-		nvlist_t *devLabel;
+		nvlist_t *devLabel = NULL;
 
 		inUse = b_inuse == B_TRUE;
 		/* Only the in-use flag is needed; the name copy is dropped. */
 		if (poolName != NULL)
 			free(poolName);
 
-		if (zpool_read_label(devFd, &devLabel) != 0
-		 || devLabel == NULL)
+		nlabels = zpool_read_all_labels(devFd, &devLabel);
+		/*
+		 * If we find a disk with fewer than the maximum number of
+		 * labels, it might be the whole disk of a partitioned disk
+		 * where ZFS resides on a partition.  In that case, we should do
+		 * nothing and wait for the partition to appear.  Or, the disk
+		 * might be damaged.  In that case, zfsd should do nothing and
+		 * wait for the sysadmin to decide.
+		 */
+		if (nlabels != VDEV_LABELS || devLabel == NULL) {
+			nvlist_free(devLabel);
 			return (NULL);
+		}
 
 		try {
 			Vdev vdev(devLabel);
 			degraded = vdev.State() != VDEV_STATE_HEALTHY;
 			return (devLabel);
 		} catch (ZfsdException &exp) {
 			/* Prefix the logged error with the device path. */
 			string devName = fdevname(devFd);
 			string devPath = _PATH_DEV + devName;
 			string context("DevfsEvent::ReadLabel: "
 				     + devPath + ": ");
 
 			exp.GetString().insert(0, context);
 			exp.Log();
+			nvlist_free(devLabel);
 		}
 	}
 	return (NULL);
 }
 
 bool
 DevfsEvent::OnlineByLabel(const string &devPath, const string& physPath,
 			      nvlist_t *devConfig)
 {
 	try {
 		/*
 		 * A device with ZFS label information has been
 		 * inserted.  If it matches a device for which we
 		 * have a case, see if we can solve that case.
 		 */
 		syslog(LOG_INFO, "Interrogating VDEV label for %s\n",
 		       devPath.c_str());
 		Vdev vdev(devConfig);
 		CaseFile *caseFile(CaseFile::Find(vdev.PoolGUID(),
 						  vdev.GUID()));
 		if (caseFile != NULL)
 			return (caseFile->ReEvaluate(devPath, physPath, &vdev));
 
 	} catch (ZfsdException &exp) {
 		string context("DevfsEvent::OnlineByLabel: " + devPath + ": ");
 
 		exp.GetString().insert(0, context);
 		exp.Log();
 	}
 	return (false);
 }
 
 //- DevfsEvent Virtual Public Methods ------------------------------------------
 /* Returns a heap-allocated copy of this event made with the copy ctor. */
 Event *
 DevfsEvent::DeepCopy() const
 {
 	Event *clone(new DevfsEvent(*this));
 
 	return (clone);
 }
 
 /*
  * Handle a devfs event.  Only "CREATE" events for disk devices are acted
  * on.  The device is opened, its label is read, and then one of three
  * things happens: an in-use labelled device is offered to a matching case
  * by label; a device marked degraded is ignored; or a whole device with a
  * physical path is offered to a case registered for that path.
  *
  * Every path through this function returns false.
  */
 bool
 DevfsEvent::Process() const
 {
 	/*
 	 * We are only concerned with newly discovered
 	 * devices that can be ZFS vdevs.
 	 */
 	if (Value("type") != "CREATE" || !IsDiskDev())
 		return (false);
 
 	/* Log the event since it is of interest. */
 	Log(LOG_INFO);
 
 	string devPath;
 	if (!DevPath(devPath))
 		return (false);
 
 	int devFd(open(devPath.c_str(), O_RDONLY));
 	if (devFd == -1)
 		return (false);
 
 	bool inUse;
 	bool degraded;
 	nvlist_t *devLabel(ReadLabel(devFd, inUse, degraded));
 
 	string physPath;
 	bool havePhysPath(PhysicalPath(physPath));
 
 	string devName;
 	DevName(devName);
 	/* The descriptor is only needed for the label read above. */
 	close(devFd);
 
 	if (inUse && devLabel != NULL) {
 		OnlineByLabel(devPath, physPath, devLabel);
 	} else if (degraded) {
 		syslog(LOG_INFO, "%s is marked degraded.  Ignoring "
 		       "as a replace by physical path candidate.\n",
 		       devName.c_str());
 	} else if (havePhysPath && IsWholeDev()) {
 		/*
 		 * TODO: attempt to resolve events using every casefile
 		 * that matches this physpath
 		 */
 		CaseFile *caseFile(CaseFile::Find(physPath));
 		if (caseFile != NULL) {
 			syslog(LOG_INFO,
 			       "Found CaseFile(%s:%s:%s) - ReEvaluating\n",
 			       caseFile->PoolGUIDString().c_str(),
 			       caseFile->VdevGUIDString().c_str(),
 			       zpool_state_to_name(caseFile->VdevState(),
 						   VDEV_AUX_NONE));
 			caseFile->ReEvaluate(devPath, physPath, /*vdev*/NULL);
 		}
 	}
 	/* The label returned by ReadLabel() is released here. */
 	if (devLabel != NULL)
 		nvlist_free(devLabel);
 	return (false);
 }
 
 //- DevfsEvent Protected Methods -----------------------------------------------
 /*
  * Construct from parsed event data.  All arguments are forwarded to the
  * DevdCtl::DevfsEvent base class; nothing else is initialized here.
  */
 DevfsEvent::DevfsEvent(Event::Type type, NVPairMap &nvpairs,
 			       const string &eventString)
  : DevdCtl::DevfsEvent(type, nvpairs, eventString)
 {
 }
 
 /* Copy constructor: delegates to the base-class copy; used by DeepCopy(). */
 DevfsEvent::DevfsEvent(const DevfsEvent &src)
  : DevdCtl::DevfsEvent::DevfsEvent(src)
 {
 }
 
 /*-------------------------------- GeomEvent --------------------------------*/
 
 //- GeomEvent Static Public Methods -------------------------------------------
 /* Factory hook: heap-allocates a GeomEvent from the parsed event data. */
 Event *
 GeomEvent::Builder(Event::Type type,
 		   NVPairMap &nvPairs,
 		   const string &eventString)
 {
 	Event *event(new GeomEvent(type, nvPairs, eventString));
 
 	return (event);
 }
 
 //- GeomEvent Virtual Public Methods ------------------------------------------
 /* Returns a heap-allocated copy of this event made with the copy ctor. */
 Event *
 GeomEvent::DeepCopy() const
 {
 	Event *clone(new GeomEvent(*this));
 
 	return (clone);
 }
  
 bool
 GeomEvent::Process() const
 {
 	/*
 	 * We are only concerned with physical path changes, because those can
 	 * be used to satisfy autoreplace operations
 	 */
 	if (Value("type") != "GEOM::physpath" || !IsDiskDev())
 		return (false);
 
 	/* Log the event since it is of interest. */
 	Log(LOG_INFO);
 
 	string devPath;
 	if (!DevPath(devPath))
 		return (false);
 
 	string physPath;
         bool havePhysPath(PhysicalPath(physPath));
 
 	string devName;
 	DevName(devName);
 
 	if (havePhysPath) {
 		/* 
 		 * TODO: attempt to resolve events using every casefile
 		 * that matches this physpath
 		 */
 		CaseFile *caseFile(CaseFile::Find(physPath));
 		if (caseFile != NULL) {
 			syslog(LOG_INFO,
 			       "Found CaseFile(%s:%s:%s) - ReEvaluating\n",
 			       caseFile->PoolGUIDString().c_str(),
 			       caseFile->VdevGUIDString().c_str(),
 			       zpool_state_to_name(caseFile->VdevState(),
 						   VDEV_AUX_NONE));
 			caseFile->ReEvaluate(devPath, physPath, /*vdev*/NULL);
 		}
 	}
 	return (false);
 }
 
 //- GeomEvent Protected Methods -----------------------------------------------
 /*
  * Construct from parsed event data.  All arguments are forwarded to the
  * DevdCtl::GeomEvent base class; nothing else is initialized here.
  */
 GeomEvent::GeomEvent(Event::Type type, NVPairMap &nvpairs,
 			       const string &eventString)
  : DevdCtl::GeomEvent(type, nvpairs, eventString)
 {
 }
 
 /* Copy constructor: delegates to the base-class copy; used by DeepCopy(). */
 GeomEvent::GeomEvent(const GeomEvent &src)
  : DevdCtl::GeomEvent::GeomEvent(src)
 {
 }
 
 
 /*--------------------------------- ZfsEvent ---------------------------------*/
 //- ZfsEvent Static Public Methods ---------------------------------------------
 /* Factory hook: heap-allocates a ZfsEvent from the parsed event data. */
 DevdCtl::Event *
 ZfsEvent::Builder(Event::Type type, NVPairMap &nvpairs,
 		  const string &eventString)
 {
 	DevdCtl::Event *event(new ZfsEvent(type, nvpairs, eventString));
 
 	return (event);
 }
 
 //- ZfsEvent Virtual Public Methods --------------------------------------------
 /* Returns a heap-allocated copy of this event made with the copy ctor. */
 Event *
 ZfsEvent::DeepCopy() const
 {
 	Event *clone(new ZfsEvent(*this));
 
 	return (clone);
 }
 
 /*
  * Handle a ZFS event.
  *
  * Pool-level "misc.fs.zfs.*" events are passed to ProcessPoolEvent().
  * Other events carrying both a pool and a vdev GUID are routed to the
  * matching case file, which is created if it does not exist yet.
  *
  * Returns true when the event was logged as "queued": the pool or vdev
  * is not known, or a newly created case did not consume the event.
  * Returns false in every other case.
  */
 bool
 ZfsEvent::Process() const
 {
 	string logstr("");
 
 	/*
 	 * NOTE(review): this only rejects events lacking BOTH keys, while
 	 * the message reads "class or type" -- confirm which is intended.
 	 */
 	if (!Contains("class") && !Contains("type")) {
 		syslog(LOG_ERR,
 		       "ZfsEvent::Process: Missing class or type data.");
 		return (false);
 	}
 
 	/* On config syncs, replay any queued events first. */
 	if (Value("type").find("misc.fs.zfs.config_sync") == 0) {
 		/*
 		 * Even if saved events are unconsumed the second time
 		 * around, drop them.  Any events that still can't be
 		 * consumed are probably referring to vdevs or pools that
 		 * no longer exist.
 		 */
 		ZfsDaemon::Get().ReplayUnconsumedEvents(/*discard*/true);
 		CaseFile::ReEvaluateByGuid(PoolGUID(), *this);
 	}
 
 	/* find(...) == 0 is a "starts with" test on the event type. */
 	if (Value("type").find("misc.fs.zfs.") == 0) {
 		/* Configuration changes, resilver events, etc. */
 		ProcessPoolEvent();
 		return (false);
 	}
 
 	if (!Contains("pool_guid") || !Contains("vdev_guid")) {
 		/* Only currently interested in Vdev related events. */
 		return (false);
 	}
 
 	/* An existing case for this vdev gets the event directly. */
 	CaseFile *caseFile(CaseFile::Find(PoolGUID(), VdevGUID()));
 	if (caseFile != NULL) {
 		Log(LOG_INFO);
 		syslog(LOG_INFO, "Evaluating existing case file\n");
 		caseFile->ReEvaluate(*this);
 		return (false);
 	}
 
 	/* Skip events that can't be handled. */
 	Guid poolGUID(PoolGUID());
 	/* If there are no replicas for a pool, then it's not manageable. */
 	if (Value("class").find("fs.zfs.vdev.no_replicas") == 0) {
 		stringstream msg;
 		msg << "No replicas available for pool "  << poolGUID;
 		msg << ", ignoring";
 		Log(LOG_INFO);
 		syslog(LOG_INFO, "%s", msg.str().c_str());
 		return (false);
 	}
 
 	/*
 	 * Create a case file for this vdev, and have it
 	 * evaluate the event.
 	 */
 	ZpoolList zpl(ZpoolList::ZpoolByGUID, &poolGUID);
 	if (zpl.empty()) {
 		stringstream msg;
 		int priority = LOG_INFO;
 		msg << "ZfsEvent::Process: Event for unknown pool ";
 		msg << poolGUID << " ";
 		msg << "queued";
 		Log(LOG_INFO);
 		syslog(priority, "%s", msg.str().c_str());
 		return (true);
 	}
 
 	nvlist_t *vdevConfig = VdevIterator(zpl.front()).Find(VdevGUID());
 	if (vdevConfig == NULL) {
 		stringstream msg;
 		int priority = LOG_INFO;
 		msg << "ZfsEvent::Process: Event for unknown vdev ";
 		msg << VdevGUID() << " ";
 		msg << "queued";
 		Log(LOG_INFO);
 		syslog(priority, "%s", msg.str().c_str());
 		return (true);
 	}
 
 	Vdev vdev(zpl.front(), vdevConfig);
 	caseFile = &CaseFile::Create(vdev);
 	if (caseFile->ReEvaluate(*this) == false) {
 		stringstream msg;
 		int priority = LOG_INFO;
 		msg << "ZfsEvent::Process: Unconsumed event for vdev(";
 		msg << zpool_get_name(zpl.front()) << ",";
 		msg << vdev.GUID() << ") ";
 		msg << "queued";
 		Log(LOG_INFO);
 		syslog(priority, "%s", msg.str().c_str());
 		return (true);
 	}
 	return (false);
 }
 
 //- ZfsEvent Protected Methods -------------------------------------------------
 /*
  * Construct from parsed event data.  All arguments are forwarded to the
  * DevdCtl::ZfsEvent base class; nothing else is initialized here.
  */
 ZfsEvent::ZfsEvent(Event::Type type, NVPairMap &nvpairs,
 			   const string &eventString)
  : DevdCtl::ZfsEvent(type, nvpairs, eventString)
 {
 }
 
 /* Copy constructor: delegates to the base-class copy; used by DeepCopy(). */
 ZfsEvent::ZfsEvent(const ZfsEvent &src)
  : DevdCtl::ZfsEvent(src)
 {
 }
 
 /*
  * Sometimes the kernel won't detach a spare when it is no longer needed.  This
  * can happen for example if a drive is removed, then either the pool is
  * exported or the machine is powered off, then the drive is reinserted, then
  * the machine is powered on or the pool is imported.  ZFSD must detach these
  * spares itself.
  */
 void
 ZfsEvent::CleanupSpares() const
 {
 	Guid poolGUID(PoolGUID());
 	ZpoolList zpl(ZpoolList::ZpoolByGUID, &poolGUID);
 	if (!zpl.empty()) {
 		zpool_handle_t* hdl;
 
 		hdl = zpl.front();
 		VdevIterator(hdl).Each(TryDetach, (void*)hdl);
 	}
 }
 
 void
 ZfsEvent::ProcessPoolEvent() const
 {
 	bool degradedDevice(false);
 
 	/* The pool is destroyed.  Discard any open cases */
 	if (Value("type") == "misc.fs.zfs.pool_destroy") {
 		Log(LOG_INFO);
 		CaseFile::ReEvaluateByGuid(PoolGUID(), *this);
 		return;
 	}
 
 	CaseFile *caseFile(CaseFile::Find(PoolGUID(), VdevGUID()));
 	if (caseFile != NULL) {
 		if (caseFile->VdevState() != VDEV_STATE_UNKNOWN
 		 && caseFile->VdevState() < VDEV_STATE_HEALTHY)
 			degradedDevice = true;
 
 		Log(LOG_INFO);
 		caseFile->ReEvaluate(*this);
 	}
 	else if (Value("type") == "misc.fs.zfs.resilver_finish")
 	{
 		/*
 		 * It's possible to get a resilver_finish event with no
 		 * corresponding casefile.  For example, if a damaged pool were
 		 * exported, repaired, then reimported.
 		 */
 		Log(LOG_INFO);
 		CleanupSpares();
 	}
 
 	if (Value("type") == "misc.fs.zfs.vdev_remove"
 	 && degradedDevice == false) {
 
 		/* See if any other cases can make use of this device. */
 		Log(LOG_INFO);
 		ZfsDaemon::RequestSystemRescan();
 	}
 }
 
 /*
  * VdevIterator callback used by CleanupSpares().  cbArg is the pool handle.
  * A spare vdev is detached when its parent has at least one child that is
  * healthy and is not itself a spare.
  */
 bool
 ZfsEvent::TryDetach(Vdev &vdev, void *cbArg)
 {
 	zpool_handle_t *pool(static_cast<zpool_handle_t*>(cbArg));
 
 	/* Always return false, because there may be other spares to detach */
 	if (!vdev.IsSpare())
 		return (false);
 
 	Vdev parent = vdev.Parent();
 	std::list<Vdev> peers;
 	peers = parent.Children();
 
 	/* Look for a healthy non-spare sibling; stop at the first one. */
 	boolean_t healthyPeer = B_FALSE;
 	std::list<Vdev>::iterator peer_it = peers.begin();
 	while (peer_it != peers.end()) {
 		Vdev peer = *peer_it;
 
 		if (!peer.IsSpare() &&
 		     peer.State() == VDEV_STATE_HEALTHY) {
 			healthyPeer = B_TRUE;
 			break;
 		}
 		peer_it++;
 	}
 
 	if (healthyPeer) {
 		syslog(LOG_INFO, "Detaching spare vdev %s from pool %s",
 		       vdev.Path().c_str(), zpool_get_name(pool));
 		zpool_vdev_detach(pool, vdev.Path().c_str());
 	}
 
 	return (false);
 }
Index: stable/11
===================================================================
--- stable/11	(revision 326297)
+++ stable/11	(revision 326298)

Property changes on: stable/11
___________________________________________________________________
Modified: svn:mergeinfo
## -0,0 +0,1 ##
   Merged /head:r322854,323995,324568,324991