diff --git a/include/sys/abd.h b/include/sys/abd.h
index 3a500e2c9ae7..19fe96292d5f 100644
--- a/include/sys/abd.h
+++ b/include/sys/abd.h
@@ -1,233 +1,235 @@
 /*
  * CDDL HEADER START
  *
  * The contents of this file are subject to the terms of the
  * Common Development and Distribution License (the "License").
  * You may not use this file except in compliance with the License.
  *
  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
  * or https://opensource.org/licenses/CDDL-1.0.
  * See the License for the specific language governing permissions
  * and limitations under the License.
  *
  * When distributing Covered Code, include this CDDL HEADER in each
  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  * If applicable, add the following below this CDDL HEADER, with the
  * fields enclosed by brackets "[]" replaced with your own identifying
  * information: Portions Copyright [yyyy] [name of copyright owner]
  *
  * CDDL HEADER END
  */
 /*
  * Copyright (c) 2014 by Chunwei Chen. All rights reserved.
  * Copyright (c) 2016, 2019 by Delphix. All rights reserved.
  */
 
 #ifndef _ABD_H
 #define	_ABD_H
 
 #include <sys/isa_defs.h>
 #include <sys/debug.h>
 #include <sys/zfs_refcount.h>
 #include <sys/uio.h>
 
 #ifdef __cplusplus
 extern "C" {
 #endif
 
 /*
  * Bit flags kept in the abd_flags field of an abd_t.  Every value occupies
  * its own bit, so several flags can be set on the same ABD at once.
  */
 typedef enum abd_flags {
 	ABD_FLAG_LINEAR		= 1 << 0, /* is buffer linear (or scattered)? */
 	ABD_FLAG_OWNER		= 1 << 1, /* does it own its data buffers? */
 	ABD_FLAG_META		= 1 << 2, /* does this represent FS metadata? */
 	ABD_FLAG_MULTI_ZONE  	= 1 << 3, /* pages split over memory zones */
 	ABD_FLAG_MULTI_CHUNK 	= 1 << 4, /* pages split over multiple chunks */
 	ABD_FLAG_LINEAR_PAGE 	= 1 << 5, /* linear but allocated from page */
 	ABD_FLAG_GANG		= 1 << 6, /* multiple ABDs chained together */
 	ABD_FLAG_GANG_FREE	= 1 << 7, /* gang ABD is responsible for mem */
 	ABD_FLAG_ZEROS		= 1 << 8, /* ABD for zero-filled buffer */
 	ABD_FLAG_ALLOCD		= 1 << 9, /* we allocated the abd_t */
 } abd_flags_t;
 
 /*
  * Descriptor for one ABD.  abd_u overlays three layouts (scatter, linear and
  * gang) in the same storage, so only one of them is meaningful at a time.
  * NOTE(review): the active layout appears to be selected by ABD_FLAG_LINEAR
  * and ABD_FLAG_GANG in abd_flags -- confirm against abd.c.
  */
 typedef struct abd {
 	abd_flags_t	abd_flags;	/* abd_flags_t bits */
 	uint_t		abd_size;	/* excludes scattered abd_offset */
 	/* list linkage; presumably used while chained into a gang ABD */
 	list_node_t	abd_gang_link;
 #ifdef ZFS_DEBUG
 	/* parent/child bookkeeping that only exists in ZFS_DEBUG builds */
 	struct abd	*abd_parent;
 	zfs_refcount_t	abd_children;
 #endif
 	kmutex_t	abd_mtx;
 	union {
 		/* data described as a list of chunks/pages */
 		struct abd_scatter {
 			uint_t		abd_offset;
 #if defined(__FreeBSD__) && defined(_KERNEL)
 			void    *abd_chunks[1]; /* actually variable-length */
 #else
 			uint_t		abd_nents;	/* entries in abd_sgl */
 			struct scatterlist *abd_sgl;
 #endif
 		} abd_scatter;
 		/* data described as one contiguous buffer */
 		struct abd_linear {
 			void		*abd_buf;
 			struct scatterlist *abd_sgl; /* for LINEAR_PAGE */
 		} abd_linear;
 		/* data described as a list of other ABDs */
 		struct abd_gang {
 			list_t abd_gang_chain;
 		} abd_gang;
 	} abd_u;
 } abd_t;
 
 typedef int abd_iter_func_t(void *buf, size_t len, void *priv);
 typedef int abd_iter_func2_t(void *bufa, void *bufb, size_t len, void *priv);
 #if defined(__linux__) && defined(_KERNEL)
 typedef int abd_iter_page_func_t(struct page *, size_t, size_t, void *);
 #endif
 
 extern int zfs_abd_scatter_enabled;
 
 /*
  * Allocations and deallocations
  */
 
 __attribute__((malloc))
 abd_t *abd_alloc(size_t, boolean_t);
 __attribute__((malloc))
 abd_t *abd_alloc_linear(size_t, boolean_t);
 __attribute__((malloc))
 abd_t *abd_alloc_gang(void);
 __attribute__((malloc))
 abd_t *abd_alloc_for_io(size_t, boolean_t);
 __attribute__((malloc))
 abd_t *abd_alloc_sametype(abd_t *, size_t);
 boolean_t abd_size_alloc_linear(size_t);
 void abd_gang_add(abd_t *, abd_t *, boolean_t);
 void abd_free(abd_t *);
 abd_t *abd_get_offset(abd_t *, size_t);
 abd_t *abd_get_offset_size(abd_t *, size_t, size_t);
 abd_t *abd_get_offset_struct(abd_t *, abd_t *, size_t, size_t);
 abd_t *abd_get_zeros(size_t);
 abd_t *abd_get_from_buf(void *, size_t);
 void abd_cache_reap_now(void);
 
 /*
  * Conversion to and from a normal buffer
  */
 
 void *abd_to_buf(abd_t *);
 void *abd_borrow_buf(abd_t *, size_t);
 void *abd_borrow_buf_copy(abd_t *, size_t);
 void abd_return_buf(abd_t *, void *, size_t);
 void abd_return_buf_copy(abd_t *, void *, size_t);
 void abd_take_ownership_of_buf(abd_t *, boolean_t);
 void abd_release_ownership_of_buf(abd_t *);
 
 /*
  * ABD operations
  */
 
 int abd_iterate_func(abd_t *, size_t, size_t, abd_iter_func_t *, void *);
 int abd_iterate_func2(abd_t *, abd_t *, size_t, size_t, size_t,
     abd_iter_func2_t *, void *);
 #if defined(__linux__) && defined(_KERNEL)
 int abd_iterate_page_func(abd_t *, size_t, size_t, abd_iter_page_func_t *,
     void *);
 #endif
 void abd_copy_off(abd_t *, abd_t *, size_t, size_t, size_t);
 void abd_copy_from_buf_off(abd_t *, const void *, size_t, size_t);
 void abd_copy_to_buf_off(void *, abd_t *, size_t, size_t);
 int abd_cmp(abd_t *, abd_t *);
 int abd_cmp_buf_off(abd_t *, const void *, size_t, size_t);
 void abd_zero_off(abd_t *, size_t, size_t);
 void abd_verify(abd_t *);
 
 void abd_raidz_gen_iterate(abd_t **cabds, abd_t *dabd, size_t off,
 	size_t csize, size_t dsize, const unsigned parity,
 	void (*func_raidz_gen)(void **, const void *, size_t, size_t));
 void abd_raidz_rec_iterate(abd_t **cabds, abd_t **tabds,
 	size_t tsize, const unsigned parity,
 	void (*func_raidz_rec)(void **t, const size_t tsize, void **c,
 	const unsigned *mul),
 	const unsigned *mul);
 
 /*
  * Wrappers for calls with offsets of 0
  */
 
 /*
  * Convenience form of abd_copy_off() that passes 0 for both offset
  * arguments.
  */
 static inline void
 abd_copy(abd_t *dabd, abd_t *sabd, size_t size)
 {
 	const size_t no_off = 0;
 
 	abd_copy_off(dabd, sabd, no_off, no_off, size);
 }
 
 /*
  * Convenience form of abd_copy_from_buf_off() that passes 0 as the offset
  * argument.
  */
 static inline void
 abd_copy_from_buf(abd_t *abd, const void *buf, size_t size)
 {
 	const size_t no_off = 0;
 
 	abd_copy_from_buf_off(abd, buf, no_off, size);
 }
 
 /*
  * Convenience form of abd_copy_to_buf_off() that passes 0 as the offset
  * argument.
  */
 static inline void
 abd_copy_to_buf(void *buf, abd_t *abd, size_t size)
 {
 	const size_t no_off = 0;
 
 	abd_copy_to_buf_off(buf, abd, no_off, size);
 }
 
 /*
  * Convenience form of abd_cmp_buf_off() that passes 0 as the offset
  * argument.  The result of abd_cmp_buf_off() is returned unchanged.
  */
 static inline int
 abd_cmp_buf(abd_t *abd, const void *buf, size_t size)
 {
 	int result = abd_cmp_buf_off(abd, buf, 0, size);
 
 	return (result);
 }
 
 /*
  * Convenience form of abd_zero_off() that passes 0 as the offset argument.
  */
 static inline void
 abd_zero(abd_t *abd, size_t size)
 {
 	const size_t no_off = 0;
 
 	abd_zero_off(abd, no_off, size);
 }
 
 /*
  * ABD type check functions
  */
 /* Returns B_TRUE when ABD_FLAG_LINEAR is set on the ABD, else B_FALSE. */
 static inline boolean_t
 abd_is_linear(abd_t *abd)
 {
 	if ((abd->abd_flags & ABD_FLAG_LINEAR) != 0)
 		return (B_TRUE);
 
 	return (B_FALSE);
 }
 
 /* Returns B_TRUE when ABD_FLAG_LINEAR_PAGE is set on the ABD, else B_FALSE. */
 static inline boolean_t
 abd_is_linear_page(abd_t *abd)
 {
 	if ((abd->abd_flags & ABD_FLAG_LINEAR_PAGE) != 0)
 		return (B_TRUE);
 
 	return (B_FALSE);
 }
 
 /* Returns B_TRUE when ABD_FLAG_GANG is set on the ABD, else B_FALSE. */
 static inline boolean_t
 abd_is_gang(abd_t *abd)
 {
 	if ((abd->abd_flags & ABD_FLAG_GANG) != 0)
 		return (B_TRUE);
 
 	return (B_FALSE);
 }
 
 /* Returns the abd_size field of the ABD. */
 static inline uint_t
 abd_get_size(abd_t *abd)
 {
 	const uint_t size = abd->abd_size;
 
 	return (size);
 }
 
 /*
  * Module lifecycle
  * Defined in each specific OS's abd_os.c
  */
 
 void abd_init(void);
 void abd_fini(void);
 
 /*
  * Linux ABD bio functions
+ * Note: these are only needed to support vdev_classic. See comment in
+ * vdev_disk.c.
  */
 #if defined(__linux__) && defined(_KERNEL)
 unsigned int abd_bio_map_off(struct bio *, abd_t *, unsigned int, size_t);
 unsigned long abd_nr_pages_off(abd_t *, unsigned int, size_t);
 #endif
 
 #ifdef __cplusplus
 }
 #endif
 
 #endif	/* _ABD_H */
diff --git a/module/os/linux/zfs/abd_os.c b/module/os/linux/zfs/abd_os.c
index dae1280121da..3fe01c0b7d77 100644
--- a/module/os/linux/zfs/abd_os.c
+++ b/module/os/linux/zfs/abd_os.c
@@ -1,1254 +1,1259 @@
 /*
  * CDDL HEADER START
  *
  * The contents of this file are subject to the terms of the
  * Common Development and Distribution License (the "License").
  * You may not use this file except in compliance with the License.
  *
  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
  * or https://opensource.org/licenses/CDDL-1.0.
  * See the License for the specific language governing permissions
  * and limitations under the License.
  *
  * When distributing Covered Code, include this CDDL HEADER in each
  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  * If applicable, add the following below this CDDL HEADER, with the
  * fields enclosed by brackets "[]" replaced with your own identifying
  * information: Portions Copyright [yyyy] [name of copyright owner]
  *
  * CDDL HEADER END
  */
 /*
  * Copyright (c) 2014 by Chunwei Chen. All rights reserved.
  * Copyright (c) 2019 by Delphix. All rights reserved.
  * Copyright (c) 2023, 2024, Klara Inc.
  */
 
 /*
  * See abd.c for a general overview of the arc buffered data (ABD).
  *
  * Linear buffers act exactly like normal buffers and are always mapped into the
  * kernel's virtual memory space, while scattered ABD data chunks are allocated
  * as physical pages and then mapped in only while they are actually being
  * accessed through one of the abd_* library functions. Using scattered ABDs
  * provides several benefits:
  *
  *  (1) They avoid use of kmem_*, preventing performance problems where running
  *      kmem_reap on very large memory systems never finishes and causes
  *      constant TLB shootdowns.
  *
  *  (2) Fragmentation is less of an issue since when we are at the limit of
  *      allocatable space, we won't have to search around for a long free
  *      hole in the VA space for large ARC allocations. Each chunk is mapped in
  *      individually, so even if we are using HIGHMEM (see next point) we
  *      wouldn't need to worry about finding a contiguous address range.
  *
  *  (3) If we are not using HIGHMEM, then all physical memory is always
  *      mapped into the kernel's address space, so we also avoid the map /
  *      unmap costs on each ABD access.
  *
  * If we are not using HIGHMEM, scattered buffers which have only one chunk
  * can be treated as linear buffers, because they are contiguous in the
  * kernel's virtual address space.  See abd_alloc_chunks() for details.
  */
 
 #include <sys/abd_impl.h>
 #include <sys/param.h>
 #include <sys/zio.h>
 #include <sys/arc.h>
 #include <sys/zfs_context.h>
 #include <sys/zfs_znode.h>
 #ifdef _KERNEL
 #include <linux/kmap_compat.h>
 #include <linux/mm_compat.h>
 #include <linux/scatterlist.h>
 #endif
 
 #ifdef _KERNEL
 #if defined(MAX_ORDER)
 #define	ABD_MAX_ORDER	(MAX_ORDER)
 #elif defined(MAX_PAGE_ORDER)
 #define	ABD_MAX_ORDER	(MAX_PAGE_ORDER)
 #endif
 #else
 #define	ABD_MAX_ORDER	(1)
 #endif
 
 /*
  * Layout of the named kstat entries exported for ABD statistics.  The values
  * are filled in by abd_kstats_update() from the matching abd_sums counters.
  * abdstat_scatter_orders holds one entry per allocation order, ABD_MAX_ORDER
  * entries in total.
  */
 typedef struct abd_stats {
 	kstat_named_t abdstat_struct_size;
 	kstat_named_t abdstat_linear_cnt;
 	kstat_named_t abdstat_linear_data_size;
 	kstat_named_t abdstat_scatter_cnt;
 	kstat_named_t abdstat_scatter_data_size;
 	kstat_named_t abdstat_scatter_chunk_waste;
 	kstat_named_t abdstat_scatter_orders[ABD_MAX_ORDER];
 	kstat_named_t abdstat_scatter_page_multi_chunk;
 	kstat_named_t abdstat_scatter_page_multi_zone;
 	kstat_named_t abdstat_scatter_page_alloc_retry;
 	kstat_named_t abdstat_scatter_sg_table_retry;
 } abd_stats_t;
 
 /*
  * Names and data types of the exported kstat entries, in the same order as
  * the members of abd_stats_t.  abd_init() installs this object as the kstat
  * data when kstat_create() succeeds.
  */
 static abd_stats_t abd_stats = {
 	/* Amount of memory occupied by all of the abd_t struct allocations */
 	{ "struct_size",			KSTAT_DATA_UINT64 },
 	/*
 	 * The number of linear ABDs which are currently allocated, excluding
 	 * ABDs which don't own their data (for instance the ones which were
 	 * allocated through abd_get_offset() and abd_get_from_buf()). If an
 	 * ABD takes ownership of its buf then it will become tracked.
 	 */
 	{ "linear_cnt",				KSTAT_DATA_UINT64 },
 	/* Amount of data stored in all linear ABDs tracked by linear_cnt */
 	{ "linear_data_size",			KSTAT_DATA_UINT64 },
 	/*
 	 * The number of scatter ABDs which are currently allocated, excluding
 	 * ABDs which don't own their data (for instance the ones which were
 	 * allocated through abd_get_offset()).
 	 */
 	{ "scatter_cnt",			KSTAT_DATA_UINT64 },
 	/* Amount of data stored in all scatter ABDs tracked by scatter_cnt */
 	{ "scatter_data_size",			KSTAT_DATA_UINT64 },
 	/*
 	 * The amount of space wasted at the end of the last chunk across all
 	 * scatter ABDs tracked by scatter_cnt.
 	 */
 	{ "scatter_chunk_waste",		KSTAT_DATA_UINT64 },
 	/*
 	 * The number of compound allocations of a given order.  These
 	 * allocations are spread over all currently allocated ABDs, and
 	 * act as a measure of memory fragmentation.
 	 *
 	 * Only the first array element is initialized here, with a
 	 * placeholder name.  abd_init() rewrites the name of every element
 	 * to "scatter_order_<i>" and sets its data type.
 	 */
 	{ { "scatter_order_N",			KSTAT_DATA_UINT64 } },
 	/*
 	 * The number of scatter ABDs which contain multiple chunks.
 	 * ABDs are preferentially allocated from the minimum number of
 	 * contiguous multi-page chunks, a single chunk is optimal.
 	 */
 	{ "scatter_page_multi_chunk",		KSTAT_DATA_UINT64 },
 	/*
 	 * The number of scatter ABDs which are split across memory zones.
 	 * ABDs are preferentially allocated using pages from a single zone.
 	 */
 	{ "scatter_page_multi_zone",		KSTAT_DATA_UINT64 },
 	/*
 	 * The total number of retries encountered when attempting to
 	 * allocate the pages to populate the scatter ABD.
 	 */
 	{ "scatter_page_alloc_retry",		KSTAT_DATA_UINT64 },
 	/*
 	 * The total number of retries encountered when attempting to
 	 * allocate the sg table for an ABD.
 	 */
 	{ "scatter_sg_table_retry",		KSTAT_DATA_UINT64 },
 };
 
 /*
  * Live counters behind the kstats, one wmsum_t per abd_stats_t member with
  * the same name.  They are set up in abd_init(), torn down in abd_fini() and
  * read by abd_kstats_update().
  */
 static struct {
 	wmsum_t abdstat_struct_size;
 	wmsum_t abdstat_linear_cnt;
 	wmsum_t abdstat_linear_data_size;
 	wmsum_t abdstat_scatter_cnt;
 	wmsum_t abdstat_scatter_data_size;
 	wmsum_t abdstat_scatter_chunk_waste;
 	wmsum_t abdstat_scatter_orders[ABD_MAX_ORDER];
 	wmsum_t abdstat_scatter_page_multi_chunk;
 	wmsum_t abdstat_scatter_page_multi_zone;
 	wmsum_t abdstat_scatter_page_alloc_retry;
 	wmsum_t abdstat_scatter_sg_table_retry;
 } abd_sums;
 
 /*
  * Iterate over the first n entries of a scatter ABD's scatterlist.  This is
  * for_each_sg() applied to ABD_SCATTER(abd).abd_sgl; sg is the cursor and i
  * the loop counter, both supplied by the caller.
  */
 #define	abd_for_each_sg(abd, sg, n, i)	\
 	for_each_sg(ABD_SCATTER(abd).abd_sgl, sg, n, i)
 
 /*
  * zfs_abd_scatter_min_size is the minimum allocation size to use scatter
  * ABD's.  Smaller allocations will use linear ABD's, which use
  * zio_[data_]buf_alloc().
  *
  * Scatter ABD's use at least one page each, so sub-page allocations waste
  * some space when allocated as scatter (e.g. 2KB scatter allocation wastes
  * half of each page).  Using linear ABD's for small allocations means that
  * they will be put on slabs which contain many allocations.  This can
  * improve memory efficiency, but it also makes it much harder for ARC
  * evictions to actually free pages, because all the buffers on one slab need
  * to be freed in order for the slab (and underlying pages) to be freed.
  * Typically, 512B and 1KB kmem caches have 16 buffers per slab, so it's
  * possible for them to actually waste more memory than scatter (one page per
  * buf = wasting 3/4 or 7/8th; one buf per slab = wasting 15/16th).
  *
  * Spill blocks are typically 512B and are heavily used on systems running
  * selinux with the default dnode size and the `xattr=sa` property set.
  *
  * By default we use linear allocations for 512B and 1KB, and scatter
  * allocations for larger (1.5KB and up).
  */
 static int zfs_abd_scatter_min_size = 512 * 3;
 
 /*
  * We use a scattered SPA_MAXBLOCKSIZE sized ABD whose pages are
  * just a single zero'd page. This allows us to conserve memory by
  * only using a single zero page for the scatterlist.
  */
 abd_t *abd_zero_scatter = NULL;
 
 struct page;
 /*
  * _KERNEL   - Will point to ZERO_PAGE if it is available or it will be
  *             an allocated zero'd PAGESIZE buffer.
  * Userspace - Will be an allocated zero'd PAGESIZE buffer.
  *
  * abd_zero_page is assigned to each of the pages of abd_zero_scatter.
  */
 static struct page *abd_zero_page = NULL;
 
 /*
  * Cache from which abd_t structs are allocated.  Created in abd_init() and
  * destroyed in abd_fini().
  */
 static kmem_cache_t *abd_cache = NULL;
 /*
  * Handle returned by kstat_create() in abd_init().  It may be NULL; both
  * abd_init() and abd_fini() check before using it.
  */
 static kstat_t *abd_ksp;
 
 /*
  * Number of PAGESIZE chunks needed to hold size bytes: size is rounded up to
  * a multiple of PAGESIZE and then divided by PAGESIZE.
  */
 static uint_t
 abd_chunkcnt_for_bytes(size_t size)
 {
 	const uint_t nchunks = P2ROUNDUP(size, PAGESIZE) / PAGESIZE;
 
 	return (nchunks);
 }
 
 /*
  * Allocate an abd_t from abd_cache and account for it in the struct_size
  * statistic.
  *
  * size: ignored; on Linux the size passed in during ABD allocation is not
  *       used.
  */
 abd_t *
 abd_alloc_struct_impl(size_t size)
 {
 	abd_t *abd;
 
 	(void) size;
 
 	abd = kmem_cache_alloc(abd_cache, KM_PUSHPAGE);
 	ASSERT3P(abd, !=, NULL);
 	ABDSTAT_INCR(abdstat_struct_size, sizeof (abd_t));
 
 	return (abd);
 }
 
 /*
  * Return an abd_t to abd_cache and subtract its size from the struct_size
  * statistic.
  */
 void
 abd_free_struct_impl(abd_t *abd)
 {
 	const int struct_bytes = (int)sizeof (abd_t);
 
 	kmem_cache_free(abd_cache, abd);
 	ABDSTAT_INCR(abdstat_struct_size, -struct_bytes);
 }
 
 #ifdef _KERNEL
 static unsigned zfs_abd_scatter_max_order = ABD_MAX_ORDER - 1;
 
 /*
  * Mark zfs data pages so they can be excluded from kernel crash dumps
  */
 #ifdef _LP64
 #define	ABD_FILE_CACHE_PAGE	0x2F5ABDF11ECAC4E
 
 /*
  * Tag a page as ZFS data: get_page() is called on it, its Private flag is
  * set, and ABD_FILE_CACHE_PAGE is stored as the page's private value.
  * abd_unmark_zfs_page() reverses these steps.
  */
 static inline void
 abd_mark_zfs_page(struct page *page)
 {
 	get_page(page);
 	SetPagePrivate(page);
 	set_page_private(page, ABD_FILE_CACHE_PAGE);
 }
 
 /*
  * Remove the tag applied by abd_mark_zfs_page(), in the reverse order: the
  * private value is reset to 0, the Private flag is cleared, and put_page()
  * is called to balance the earlier get_page().
  */
 static inline void
 abd_unmark_zfs_page(struct page *page)
 {
 	set_page_private(page, 0UL);
 	ClearPagePrivate(page);
 	put_page(page);
 }
 #else
 #define	abd_mark_zfs_page(page)
 #define	abd_unmark_zfs_page(page)
 #endif /* _LP64 */
 
 #ifndef CONFIG_HIGHMEM
 
 #ifndef __GFP_RECLAIM
 #define	__GFP_RECLAIM		__GFP_WAIT
 #endif
 
 /*
  * The goal is to minimize fragmentation by preferentially populating ABDs
  * with higher order compound pages from a single zone.  Allocation size is
  * progressively decreased until it can be satisfied without performing
  * reclaim or compaction.  When necessary this function will degenerate to
  * allocating individual pages and allowing reclaim to satisfy allocations.
  *
  * abd:  ABD to populate; its scatter offset is asserted to be 0.
  * size: number of bytes to back with pages (rounded up to whole pages).
  *
  * On return the ABD either references a multi-entry scatterlist or, when a
  * single chunk was enough, has been flagged as a linear-page ABD.  There is
  * no failure return: page and sg table allocations are retried until they
  * succeed.
  */
 void
 abd_alloc_chunks(abd_t *abd, size_t size)
 {
 	struct list_head pages;
 	struct sg_table table;
 	struct scatterlist *sg;
 	struct page *page, *tmp_page = NULL;
 	gfp_t gfp = __GFP_NOWARN | GFP_NOIO;
 	/* flags for order > 0 requests: no retry, reclaim bits masked off */
 	gfp_t gfp_comp = (gfp | __GFP_NORETRY | __GFP_COMP) & ~__GFP_RECLAIM;
 	unsigned int max_order = MIN(zfs_abd_scatter_max_order,
 	    ABD_MAX_ORDER - 1);
 	unsigned int nr_pages = abd_chunkcnt_for_bytes(size);
 	unsigned int chunks = 0, zones = 0;
 	size_t remaining_size;
 	int nid = NUMA_NO_NODE;
 	unsigned int alloc_pages = 0;
 
 	INIT_LIST_HEAD(&pages);
 
 	ASSERT3U(alloc_pages, <, nr_pages);
 
 	/* Collect chunks on the local list until nr_pages pages are held. */
 	while (alloc_pages < nr_pages) {
 		unsigned int chunk_pages;
 		unsigned int order;
 
 		/*
 		 * Pick the largest power-of-two chunk that still fits in the
 		 * pages left to allocate, capped at max_order (assuming
 		 * highbit64() returns the 1-based index of the highest set
 		 * bit).
 		 */
 		order = MIN(highbit64(nr_pages - alloc_pages) - 1, max_order);
 		chunk_pages = (1U << order);
 
 		page = alloc_pages_node(nid, order ? gfp_comp : gfp, order);
 		if (page == NULL) {
 			/*
 			 * A failed single-page request sleeps for one tick
 			 * and is retried.  A failed higher-order request
 			 * lowers the cap so the retry asks for less.
 			 */
 			if (order == 0) {
 				ABDSTAT_BUMP(abdstat_scatter_page_alloc_retry);
 				schedule_timeout_interruptible(1);
 			} else {
 				max_order = MAX(0, order - 1);
 			}
 			continue;
 		}
 
 		list_add_tail(&page->lru, &pages);
 
 		/* Count each change of node between consecutive chunks. */
 		if ((nid != NUMA_NO_NODE) && (page_to_nid(page) != nid))
 			zones++;
 
 		/* Later requests are directed at the node of this chunk. */
 		nid = page_to_nid(page);
 		ABDSTAT_BUMP(abdstat_scatter_orders[order]);
 		chunks++;
 		alloc_pages += chunk_pages;
 	}
 
 	ASSERT3S(alloc_pages, ==, nr_pages);
 
 	/* One scatterlist entry per chunk; retry until the table exists. */
 	while (sg_alloc_table(&table, chunks, gfp)) {
 		ABDSTAT_BUMP(abdstat_scatter_sg_table_retry);
 		schedule_timeout_interruptible(1);
 	}
 
 	/*
 	 * Move every chunk from the local list into the scatterlist.  Each
 	 * entry's length is clipped to the bytes still unaccounted for, so
 	 * the lengths add up to size.
 	 */
 	sg = table.sgl;
 	remaining_size = size;
 	list_for_each_entry_safe(page, tmp_page, &pages, lru) {
 		size_t sg_size = MIN(PAGESIZE << compound_order(page),
 		    remaining_size);
 		sg_set_page(sg, page, sg_size, 0);
 		abd_mark_zfs_page(page);
 		remaining_size -= sg_size;
 
 		sg = sg_next(sg);
 		list_del(&page->lru);
 	}
 
 	/*
 	 * These conditions ensure that a possible transformation to a linear
 	 * ABD would be valid.
 	 */
 	ASSERT(!PageHighMem(sg_page(table.sgl)));
 	ASSERT0(ABD_SCATTER(abd).abd_offset);
 
 	if (table.nents == 1) {
 		/*
 		 * Since there is only one entry, this ABD can be represented
 		 * as a linear buffer.  All single-page (4K) ABD's can be
 		 * represented this way.  Some multi-page ABD's can also be
 		 * represented this way, if we were able to allocate a single
 		 * "chunk" (higher-order "page" which represents a power-of-2
 		 * series of physically-contiguous pages).  This is often the
 		 * case for 2-page (8K) ABD's.
 		 *
 		 * Representing a single-entry scatter ABD as a linear ABD
 		 * has the performance advantage of avoiding the copy (and
 		 * allocation) in abd_borrow_buf_copy / abd_return_buf_copy.
 		 * A performance increase of around 5% has been observed for
 		 * ARC-cached reads (of small blocks which can take advantage
 		 * of this).
 		 *
 		 * Note that this optimization is only possible because the
 		 * pages are always mapped into the kernel's address space.
 		 * This is not the case for highmem pages, so the
 		 * optimization can not be made there.
 		 */
 		abd->abd_flags |= ABD_FLAG_LINEAR;
 		abd->abd_flags |= ABD_FLAG_LINEAR_PAGE;
 		/* keep the sg list so abd_free_linear_page() can free it */
 		abd->abd_u.abd_linear.abd_sgl = table.sgl;
 		ABD_LINEAR_BUF(abd) = page_address(sg_page(table.sgl));
 	} else if (table.nents > 1) {
 		ABDSTAT_BUMP(abdstat_scatter_page_multi_chunk);
 		abd->abd_flags |= ABD_FLAG_MULTI_CHUNK;
 
 		if (zones) {
 			ABDSTAT_BUMP(abdstat_scatter_page_multi_zone);
 			abd->abd_flags |= ABD_FLAG_MULTI_ZONE;
 		}
 
 		ABD_SCATTER(abd).abd_sgl = table.sgl;
 		ABD_SCATTER(abd).abd_nents = table.nents;
 	}
 }
 #else
 
 /*
  * CONFIG_HIGHMEM variant: build a scatter ABD out of N separately allocated
  * pages.  Nothing here asks for contiguous pages, and only a minimal set of
  * kernel interfaces is used, which keeps it as compatible as possible.
  *
  * Both the sg table and every page allocation are retried, sleeping one tick
  * between attempts, until they succeed.
  */
 void
 abd_alloc_chunks(abd_t *abd, size_t size)
 {
 	const gfp_t gfp = __GFP_NOWARN | GFP_NOIO;
 	int nr_pages = abd_chunkcnt_for_bytes(size);
 	struct sg_table table;
 	struct scatterlist *sg = NULL;
 	int i = 0;
 
 	while (sg_alloc_table(&table, nr_pages, gfp) != 0) {
 		ABDSTAT_BUMP(abdstat_scatter_sg_table_retry);
 		schedule_timeout_interruptible(1);
 	}
 
 	ASSERT3U(table.nents, ==, nr_pages);
 	ABD_SCATTER(abd).abd_nents = nr_pages;
 	ABD_SCATTER(abd).abd_sgl = table.sgl;
 
 	/* Fill every scatterlist entry with its own order-0 page. */
 	abd_for_each_sg(abd, sg, nr_pages, i) {
 		struct page *page;
 
 		for (;;) {
 			page = __page_cache_alloc(gfp);
 			if (page != NULL)
 				break;
 			ABDSTAT_BUMP(abdstat_scatter_page_alloc_retry);
 			schedule_timeout_interruptible(1);
 		}
 
 		ABDSTAT_BUMP(abdstat_scatter_orders[0]);
 		sg_set_page(sg, page, PAGESIZE, 0);
 		abd_mark_zfs_page(page);
 	}
 
 	if (nr_pages <= 1)
 		return;
 
 	ABDSTAT_BUMP(abdstat_scatter_page_multi_chunk);
 	abd->abd_flags |= ABD_FLAG_MULTI_CHUNK;
 }
 #endif /* !CONFIG_HIGHMEM */
 
 /*
  * Release the scatterlist referenced by a scatter ABD.  This must be called
  * if any of the sg_table allocation functions are called.
  */
 static void
 abd_free_sg_table(abd_t *abd)
 {
 	struct sg_table table;
 
 	/* sg_free_table() takes an sg_table, so rebuild one from the ABD. */
 	table.orig_nents = ABD_SCATTER(abd).abd_nents;
 	table.nents = table.orig_nents;
 	table.sgl = ABD_SCATTER(abd).abd_sgl;
 
 	sg_free_table(&table);
 }
 
 /*
  * Free every page referenced by a scatter ABD's scatterlist, then the
  * scatterlist itself.  The multi-zone, multi-chunk and per-order statistics
  * that were bumped at allocation time are decremented along the way.
  */
 void
 abd_free_chunks(abd_t *abd)
 {
 	struct scatterlist *sg = NULL;
 	int nr_pages = ABD_SCATTER(abd).abd_nents;
 	int i = 0;
 
 	if ((abd->abd_flags & ABD_FLAG_MULTI_ZONE) != 0)
 		ABDSTAT_BUMPDOWN(abdstat_scatter_page_multi_zone);
 
 	if ((abd->abd_flags & ABD_FLAG_MULTI_CHUNK) != 0)
 		ABDSTAT_BUMPDOWN(abdstat_scatter_page_multi_chunk);
 
 	abd_for_each_sg(abd, sg, nr_pages, i) {
 		struct page *page = sg_page(sg);
 		int order;
 
 		abd_unmark_zfs_page(page);
 		/* The order is read before the pages are handed back. */
 		order = compound_order(page);
 		__free_pages(page, order);
 		ASSERT3U(sg->length, <=, PAGE_SIZE << order);
 		ABDSTAT_BUMPDOWN(abdstat_scatter_orders[order]);
 	}
 
 	abd_free_sg_table(abd);
 }
 
 /*
  * Build abd_zero_scatter: a scatter ABD of SPA_MAXBLOCKSIZE bytes in which
  * every scatterlist entry refers to the single shared page abd_zero_page.
  */
 static void
 abd_alloc_zero_scatter(void)
 {
 	const gfp_t gfp = __GFP_NOWARN | GFP_NOIO;
 	int nr_pages = abd_chunkcnt_for_bytes(SPA_MAXBLOCKSIZE);
 	struct sg_table table;
 	struct scatterlist *sg = NULL;
 	int i = 0;
 
 #if defined(HAVE_ZERO_PAGE_GPL_ONLY)
 	/* ZERO_PAGE() is not used here; allocate and tag a zeroed page. */
 	for (;;) {
 		abd_zero_page = __page_cache_alloc(gfp | __GFP_ZERO);
 		if (abd_zero_page != NULL)
 			break;
 		ABDSTAT_BUMP(abdstat_scatter_page_alloc_retry);
 		schedule_timeout_interruptible(1);
 	}
 	abd_mark_zfs_page(abd_zero_page);
 #else
 	abd_zero_page = ZERO_PAGE(0);
 #endif /* HAVE_ZERO_PAGE_GPL_ONLY */
 
 	while (sg_alloc_table(&table, nr_pages, gfp) != 0) {
 		ABDSTAT_BUMP(abdstat_scatter_sg_table_retry);
 		schedule_timeout_interruptible(1);
 	}
 	ASSERT3U(table.nents, ==, nr_pages);
 
 	abd_zero_scatter = abd_alloc_struct(SPA_MAXBLOCKSIZE);
 	abd_zero_scatter->abd_size = SPA_MAXBLOCKSIZE;
 	abd_zero_scatter->abd_flags |=
 	    ABD_FLAG_OWNER | ABD_FLAG_MULTI_CHUNK | ABD_FLAG_ZEROS;
 	ABD_SCATTER(abd_zero_scatter).abd_offset = 0;
 	ABD_SCATTER(abd_zero_scatter).abd_nents = nr_pages;
 	ABD_SCATTER(abd_zero_scatter).abd_sgl = table.sgl;
 
 	/* Every entry points at the same zero page. */
 	abd_for_each_sg(abd_zero_scatter, sg, nr_pages, i) {
 		sg_set_page(sg, abd_zero_page, PAGESIZE, 0);
 	}
 
 	/* Only one page of data is accounted for in the statistics. */
 	ABDSTAT_BUMP(abdstat_scatter_cnt);
 	ABDSTAT_INCR(abdstat_scatter_data_size, PAGESIZE);
 	ABDSTAT_BUMP(abdstat_scatter_page_multi_chunk);
 }
 
 #else /* _KERNEL */
 
 #ifndef PAGE_SHIFT
 #define	PAGE_SHIFT (highbit64(PAGESIZE)-1)
 #endif
 
 /*
  * Userspace stand-ins for the kernel primitives used by the shared code.
  * Mapping a chunk is a plain cast to void *, unmapping and the IRQ
  * save/restore pair only evaluate their argument, and nth_page() is byte
  * arithmetic in units of PAGESIZE.
  */
 #define	zfs_kmap_atomic(chunk)		((void *)chunk)
 #define	zfs_kunmap_atomic(addr)		do { (void)(addr); } while (0)
 #define	local_irq_save(flags)		do { (void)(flags); } while (0)
 #define	local_irq_restore(flags)	do { (void)(flags); } while (0)
 #define	nth_page(pg, i) \
 	((struct page *)((void *)(pg) + (i) * PAGESIZE))
 
 /*
  * Minimal userspace scatterlist entry.  An array of these forms a list; the
  * entry with end set is the last one.
  */
 struct scatterlist {
 	struct page *page;	/* backing page for this entry */
 	int length;		/* length recorded by sg_set_page() */
 	int end;		/* non-zero on the final entry */
 };
 
 /*
  * Zero an array of nr scatterlist entries and flag the last one as the end
  * of the list.
  */
 static void
 sg_init_table(struct scatterlist *sg, int nr)
 {
 	struct scatterlist *last = &sg[nr - 1];
 
 	memset(sg, 0, nr * sizeof (struct scatterlist));
 	last->end = 1;
 }
 
 /*
  * Free the scatterlist array of a scatter ABD.  This must be called if any
  * of the sg_table allocation functions are called.
  */
 static void
 abd_free_sg_table(abd_t *abd)
 {
 	int nents = ABD_SCATTER(abd).abd_nents;
 	size_t sgl_bytes = nents * sizeof (struct scatterlist);
 
 	vmem_free(ABD_SCATTER(abd).abd_sgl, sgl_bytes);
 }
 
 /*
  * Userspace version of for_each_sg(): visit nr entries starting at sgl,
  * using sg as the cursor and i as the counter.  The cursor advances with
  * sg_next(), so it becomes NULL after the entry whose end flag is set.
  */
 #define	for_each_sg(sgl, sg, nr, i)	\
 	for ((i) = 0, (sg) = (sgl); (i) < (nr); (i)++, (sg) = sg_next(sg))
 
 /*
  * Record a page and its length in a scatterlist entry.  The offset
  * argument is accepted so callers can use the same call shape as the kernel
  * code in this file, but it must be 0.
  */
 static inline void
 sg_set_page(struct scatterlist *sg, struct page *page, unsigned int len,
     unsigned int offset)
 {
 	/* currently we don't use offset */
 	ASSERT(offset == 0);
 
 	sg->length = len;
 	sg->page = page;
 }
 
 /* Returns the page stored in a scatterlist entry. */
 static inline struct page *
 sg_page(struct scatterlist *sg)
 {
 	struct page *pg = sg->page;
 
 	return (pg);
 }
 
 /*
  * Returns the entry following sg in its array, or NULL when sg is flagged
  * as the end of the list.
  */
 static inline struct scatterlist *
 sg_next(struct scatterlist *sg)
 {
 	return (sg->end ? NULL : sg + 1);
 }
 
 /*
  * Userspace variant: allocate a scatterlist array with one entry per
  * PAGESIZE chunk of size, and give each entry its own PAGESIZE buffer
  * obtained from umem_alloc_aligned().
  */
 void
 abd_alloc_chunks(abd_t *abd, size_t size)
 {
 	unsigned nr_pages = abd_chunkcnt_for_bytes(size);
 	size_t sgl_bytes = nr_pages * sizeof (struct scatterlist);
 	struct scatterlist *sg;
 	int i;
 
 	ABD_SCATTER(abd).abd_sgl = vmem_alloc(sgl_bytes, KM_SLEEP);
 	ABD_SCATTER(abd).abd_nents = nr_pages;
 	sg_init_table(ABD_SCATTER(abd).abd_sgl, nr_pages);
 
 	abd_for_each_sg(abd, sg, nr_pages, i) {
 		struct page *p;
 
 		p = umem_alloc_aligned(PAGESIZE, 64, KM_SLEEP);
 		sg_set_page(sg, p, PAGESIZE, 0);
 	}
 }
 
 /*
  * Userspace variant: free the PAGESIZE buffer behind every scatterlist
  * entry of the ABD, then free the scatterlist array.
  */
 void
 abd_free_chunks(abd_t *abd)
 {
 	struct scatterlist *sg;
 	int n = ABD_SCATTER(abd).abd_nents;
 	int i;
 
 	abd_for_each_sg(abd, sg, n, i) {
 		umem_free_aligned(nth_page(sg_page(sg), 0), PAGESIZE);
 	}
 
 	abd_free_sg_table(abd);
 }
 
 /*
  * Userspace variant: build abd_zero_scatter, a scatter ABD of
  * SPA_MAXBLOCKSIZE bytes in which every scatterlist entry refers to the one
  * zero-filled buffer abd_zero_page.
  */
 static void
 abd_alloc_zero_scatter(void)
 {
 	unsigned nr_pages = abd_chunkcnt_for_bytes(SPA_MAXBLOCKSIZE);
 	size_t sgl_bytes = nr_pages * sizeof (struct scatterlist);
 	struct scatterlist *sg;
 	int i;
 
 	abd_zero_page = umem_alloc_aligned(PAGESIZE, 64, KM_SLEEP);
 	memset(abd_zero_page, 0, PAGESIZE);
 
 	abd_zero_scatter = abd_alloc_struct(SPA_MAXBLOCKSIZE);
 	abd_zero_scatter->abd_size = SPA_MAXBLOCKSIZE;
 	abd_zero_scatter->abd_flags |=
 	    ABD_FLAG_OWNER | ABD_FLAG_MULTI_CHUNK | ABD_FLAG_ZEROS;
 	ABD_SCATTER(abd_zero_scatter).abd_offset = 0;
 	ABD_SCATTER(abd_zero_scatter).abd_nents = nr_pages;
 	ABD_SCATTER(abd_zero_scatter).abd_sgl = vmem_alloc(sgl_bytes, KM_SLEEP);
 
 	sg_init_table(ABD_SCATTER(abd_zero_scatter).abd_sgl, nr_pages);
 
 	/* Every entry points at the same zero buffer. */
 	abd_for_each_sg(abd_zero_scatter, sg, nr_pages, i) {
 		sg_set_page(sg, abd_zero_page, PAGESIZE, 0);
 	}
 
 	/* Only one page of data is accounted for in the statistics. */
 	ABDSTAT_BUMP(abdstat_scatter_cnt);
 	ABDSTAT_INCR(abdstat_scatter_data_size, PAGESIZE);
 	ABDSTAT_BUMP(abdstat_scatter_page_multi_chunk);
 }
 
 #endif /* _KERNEL */
 
 /*
  * Decide whether an allocation of size bytes should be linear.  The answer
  * is true when scatter ABDs are disabled (zfs_abd_scatter_enabled is 0) or
  * when size is below zfs_abd_scatter_min_size.
  */
 boolean_t
 abd_size_alloc_linear(size_t size)
 {
 	return (!(zfs_abd_scatter_enabled &&
 	    size >= zfs_abd_scatter_min_size));
 }
 
 /*
  * Add (ABDSTAT_INCR) or remove (ABDSTAT_DECR) one scatter ABD from the
  * scatter statistics.  "waste" is the gap between abd_size and abd_size
  * rounded up to a multiple of PAGESIZE; it is also reported to the ARC as
  * ARC_SPACE_ABD_CHUNK_WASTE.
  */
 void
 abd_update_scatter_stats(abd_t *abd, abd_stats_op_t op)
 {
 	int waste;
 
 	ASSERT(op == ABDSTAT_INCR || op == ABDSTAT_DECR);
 	waste = P2ROUNDUP(abd->abd_size, PAGESIZE) - abd->abd_size;
 
 	if (op != ABDSTAT_INCR) {
 		ABDSTAT_BUMPDOWN(abdstat_scatter_cnt);
 		ABDSTAT_INCR(abdstat_scatter_data_size, -(int)abd->abd_size);
 		ABDSTAT_INCR(abdstat_scatter_chunk_waste, -waste);
 		arc_space_return(waste, ARC_SPACE_ABD_CHUNK_WASTE);
 		return;
 	}
 
 	ABDSTAT_BUMP(abdstat_scatter_cnt);
 	ABDSTAT_INCR(abdstat_scatter_data_size, abd->abd_size);
 	ABDSTAT_INCR(abdstat_scatter_chunk_waste, waste);
 	arc_space_consume(waste, ARC_SPACE_ABD_CHUNK_WASTE);
 }
 
 /*
  * Add (ABDSTAT_INCR) or remove (ABDSTAT_DECR) one linear ABD from the
  * linear count and linear data size statistics.
  */
 void
 abd_update_linear_stats(abd_t *abd, abd_stats_op_t op)
 {
 	ASSERT(op == ABDSTAT_INCR || op == ABDSTAT_DECR);
 
 	if (op != ABDSTAT_INCR) {
 		ABDSTAT_BUMPDOWN(abdstat_linear_cnt);
 		ABDSTAT_INCR(abdstat_linear_data_size, -(int)abd->abd_size);
 		return;
 	}
 
 	ABDSTAT_BUMP(abdstat_linear_cnt);
 	ABDSTAT_INCR(abdstat_linear_data_size, abd->abd_size);
 }
 
 /*
  * Sanity-check a scatter ABD with assertions: it has at least one
  * scatterlist entry, its offset lies inside the first entry, and every
  * entry has a page.
  */
 void
 abd_verify_scatter(abd_t *abd)
 {
 	struct scatterlist *sg = NULL;
 	size_t n = ABD_SCATTER(abd).abd_nents;
 	int i = 0;
 
 	ASSERT3U(ABD_SCATTER(abd).abd_nents, >, 0);
 	ASSERT3U(ABD_SCATTER(abd).abd_offset, <,
 	    ABD_SCATTER(abd).abd_sgl->length);
 
 	abd_for_each_sg(abd, sg, n, i) {
 		ASSERT3P(sg_page(sg), !=, NULL);
 	}
 }
 
 /*
  * Tear down abd_zero_scatter and the zero page behind it, undoing
  * abd_alloc_zero_scatter().
  */
 static void
 abd_free_zero_scatter(void)
 {
 	/* Reverse the statistics recorded by abd_alloc_zero_scatter(). */
 	ABDSTAT_BUMPDOWN(abdstat_scatter_cnt);
 	ABDSTAT_INCR(abdstat_scatter_data_size, -(int)PAGESIZE);
 	ABDSTAT_BUMPDOWN(abdstat_scatter_page_multi_chunk);
 
 	abd_free_sg_table(abd_zero_scatter);
 	abd_free_struct(abd_zero_scatter);
 	abd_zero_scatter = NULL;
 	ASSERT3P(abd_zero_page, !=, NULL);
 #if defined(_KERNEL)
 #if defined(HAVE_ZERO_PAGE_GPL_ONLY)
 	/*
 	 * The page is only freed in the configuration in which
 	 * abd_alloc_zero_scatter() allocated it; otherwise it came from
 	 * ZERO_PAGE(0) and is left alone.
 	 */
 	abd_unmark_zfs_page(abd_zero_page);
 	__free_page(abd_zero_page);
 #endif /* HAVE_ZERO_PAGE_GPL_ONLY */
 #else
 	/* Userspace: the zero page came from umem_alloc_aligned(). */
 	umem_free_aligned(abd_zero_page, PAGESIZE);
 #endif /* _KERNEL */
 }
 
 /* Copy one abd_sums counter into the kstat entry of the same name. */
 #define	ABD_KSTAT_SYNC(name)	\
 	(as->name.value.ui64 = wmsum_value(&abd_sums.name))
 
 /*
  * kstat update callback installed by abd_init().  Writes are refused with
  * EACCES; otherwise every entry in ksp->ks_data is refreshed from the
  * matching abd_sums counter and 0 is returned.
  */
 static int
 abd_kstats_update(kstat_t *ksp, int rw)
 {
 	abd_stats_t *as = ksp->ks_data;
 
 	if (rw == KSTAT_WRITE)
 		return (EACCES);
 
 	ABD_KSTAT_SYNC(abdstat_struct_size);
 	ABD_KSTAT_SYNC(abdstat_linear_cnt);
 	ABD_KSTAT_SYNC(abdstat_linear_data_size);
 	ABD_KSTAT_SYNC(abdstat_scatter_cnt);
 	ABD_KSTAT_SYNC(abdstat_scatter_data_size);
 	ABD_KSTAT_SYNC(abdstat_scatter_chunk_waste);
 	for (int i = 0; i < ABD_MAX_ORDER; i++)
 		ABD_KSTAT_SYNC(abdstat_scatter_orders[i]);
 	ABD_KSTAT_SYNC(abdstat_scatter_page_multi_chunk);
 	ABD_KSTAT_SYNC(abdstat_scatter_page_multi_zone);
 	ABD_KSTAT_SYNC(abdstat_scatter_page_alloc_retry);
 	ABD_KSTAT_SYNC(abdstat_scatter_sg_table_retry);
 
 	return (0);
 }
 
 #undef	ABD_KSTAT_SYNC
 
 void
 abd_init(void)
 {
 	int i;
 
 	abd_cache = kmem_cache_create("abd_t", sizeof (abd_t),
 	    0, NULL, NULL, NULL, NULL, NULL, 0);
 
 	wmsum_init(&abd_sums.abdstat_struct_size, 0);
 	wmsum_init(&abd_sums.abdstat_linear_cnt, 0);
 	wmsum_init(&abd_sums.abdstat_linear_data_size, 0);
 	wmsum_init(&abd_sums.abdstat_scatter_cnt, 0);
 	wmsum_init(&abd_sums.abdstat_scatter_data_size, 0);
 	wmsum_init(&abd_sums.abdstat_scatter_chunk_waste, 0);
 	for (i = 0; i < ABD_MAX_ORDER; i++)
 		wmsum_init(&abd_sums.abdstat_scatter_orders[i], 0);
 	wmsum_init(&abd_sums.abdstat_scatter_page_multi_chunk, 0);
 	wmsum_init(&abd_sums.abdstat_scatter_page_multi_zone, 0);
 	wmsum_init(&abd_sums.abdstat_scatter_page_alloc_retry, 0);
 	wmsum_init(&abd_sums.abdstat_scatter_sg_table_retry, 0);
 
 	abd_ksp = kstat_create("zfs", 0, "abdstats", "misc", KSTAT_TYPE_NAMED,
 	    sizeof (abd_stats) / sizeof (kstat_named_t), KSTAT_FLAG_VIRTUAL);
 	if (abd_ksp != NULL) {
 		for (i = 0; i < ABD_MAX_ORDER; i++) {
 			snprintf(abd_stats.abdstat_scatter_orders[i].name,
 			    KSTAT_STRLEN, "scatter_order_%d", i);
 			abd_stats.abdstat_scatter_orders[i].data_type =
 			    KSTAT_DATA_UINT64;
 		}
 		abd_ksp->ks_data = &abd_stats;
 		abd_ksp->ks_update = abd_kstats_update;
 		kstat_install(abd_ksp);
 	}
 
 	abd_alloc_zero_scatter();
 }
 
 void
 abd_fini(void)
 {
 	abd_free_zero_scatter();
 
 	if (abd_ksp != NULL) {
 		kstat_delete(abd_ksp);
 		abd_ksp = NULL;
 	}
 
 	wmsum_fini(&abd_sums.abdstat_struct_size);
 	wmsum_fini(&abd_sums.abdstat_linear_cnt);
 	wmsum_fini(&abd_sums.abdstat_linear_data_size);
 	wmsum_fini(&abd_sums.abdstat_scatter_cnt);
 	wmsum_fini(&abd_sums.abdstat_scatter_data_size);
 	wmsum_fini(&abd_sums.abdstat_scatter_chunk_waste);
 	for (int i = 0; i < ABD_MAX_ORDER; i++)
 		wmsum_fini(&abd_sums.abdstat_scatter_orders[i]);
 	wmsum_fini(&abd_sums.abdstat_scatter_page_multi_chunk);
 	wmsum_fini(&abd_sums.abdstat_scatter_page_multi_zone);
 	wmsum_fini(&abd_sums.abdstat_scatter_page_alloc_retry);
 	wmsum_fini(&abd_sums.abdstat_scatter_sg_table_retry);
 
 	if (abd_cache) {
 		kmem_cache_destroy(abd_cache);
 		abd_cache = NULL;
 	}
 }
 
 void
 abd_free_linear_page(abd_t *abd)
 {
 	/* Transform it back into a scatter ABD for freeing */
 	struct scatterlist *sg = abd->abd_u.abd_linear.abd_sgl;
 	abd->abd_flags &= ~ABD_FLAG_LINEAR;
 	abd->abd_flags &= ~ABD_FLAG_LINEAR_PAGE;
 	ABD_SCATTER(abd).abd_nents = 1;
 	ABD_SCATTER(abd).abd_offset = 0;
 	ABD_SCATTER(abd).abd_sgl = sg;
 	abd_free_chunks(abd);
 
 	abd_update_scatter_stats(abd, ABDSTAT_DECR);
 }
 
 /*
  * If we're going to use this ABD for doing I/O using the block layer, the
  * consumer of the ABD data doesn't care if it's scattered or not, and we don't
  * plan to store this ABD in memory for a long period of time, we should
  * allocate the ABD type that requires the least data copying to do the I/O.
  *
  * On Linux the optimal thing to do would be to use abd_get_offset() and
  * construct a new ABD which shares the original pages thereby eliminating
  * the copy.  But for the moment a new linear ABD is allocated until this
  * performance optimization can be implemented.
  */
 abd_t *
 abd_alloc_for_io(size_t size, boolean_t is_metadata)
 {
 	return (abd_alloc(size, is_metadata));
 }
 
 abd_t *
 abd_get_offset_scatter(abd_t *abd, abd_t *sabd, size_t off,
     size_t size)
 {
 	(void) size;
 	int i = 0;
 	struct scatterlist *sg = NULL;
 
 	abd_verify(sabd);
 	ASSERT3U(off, <=, sabd->abd_size);
 
 	size_t new_offset = ABD_SCATTER(sabd).abd_offset + off;
 
 	if (abd == NULL)
 		abd = abd_alloc_struct(0);
 
 	/*
 	 * Even if this buf is filesystem metadata, we only track that
 	 * if we own the underlying data buffer, which is not true in
 	 * this case. Therefore, we don't ever use ABD_FLAG_META here.
 	 */
 
 	abd_for_each_sg(sabd, sg, ABD_SCATTER(sabd).abd_nents, i) {
 		if (new_offset < sg->length)
 			break;
 		new_offset -= sg->length;
 	}
 
 	ABD_SCATTER(abd).abd_sgl = sg;
 	ABD_SCATTER(abd).abd_offset = new_offset;
 	ABD_SCATTER(abd).abd_nents = ABD_SCATTER(sabd).abd_nents - i;
 
 	return (abd);
 }
 
 /*
  * Initialize the abd_iter.
  */
 void
 abd_iter_init(struct abd_iter *aiter, abd_t *abd)
 {
 	ASSERT(!abd_is_gang(abd));
 	abd_verify(abd);
 	memset(aiter, 0, sizeof (struct abd_iter));
 	aiter->iter_abd = abd;
 	if (!abd_is_linear(abd)) {
 		aiter->iter_offset = ABD_SCATTER(abd).abd_offset;
 		aiter->iter_sg = ABD_SCATTER(abd).abd_sgl;
 	}
 }
 
 /*
  * This is just a helper function to see if we have exhausted the
  * abd_iter and reached the end.
  */
 boolean_t
 abd_iter_at_end(struct abd_iter *aiter)
 {
 	ASSERT3U(aiter->iter_pos, <=, aiter->iter_abd->abd_size);
 	return (aiter->iter_pos == aiter->iter_abd->abd_size);
 }
 
 /*
  * Advance the iterator by a certain amount. Cannot be called when a chunk is
  * in use. This can be safely called when the aiter has already exhausted, in
  * which case this does nothing.
  */
 void
 abd_iter_advance(struct abd_iter *aiter, size_t amount)
 {
 	/*
 	 * Ensure that last chunk is not in use. abd_iterate_*() must clear
 	 * this state (directly or abd_iter_unmap()) before advancing.
 	 */
 	ASSERT3P(aiter->iter_mapaddr, ==, NULL);
 	ASSERT0(aiter->iter_mapsize);
 	ASSERT3P(aiter->iter_page, ==, NULL);
 	ASSERT0(aiter->iter_page_doff);
 	ASSERT0(aiter->iter_page_dsize);
 
 	/* There's nothing left to advance to, so do nothing */
 	if (abd_iter_at_end(aiter))
 		return;
 
 	aiter->iter_pos += amount;
 	aiter->iter_offset += amount;
 	if (!abd_is_linear(aiter->iter_abd)) {
 		while (aiter->iter_offset >= aiter->iter_sg->length) {
 			aiter->iter_offset -= aiter->iter_sg->length;
 			aiter->iter_sg = sg_next(aiter->iter_sg);
 			if (aiter->iter_sg == NULL) {
 				ASSERT0(aiter->iter_offset);
 				break;
 			}
 		}
 	}
 }
 
 /*
  * Map the current chunk into aiter. This can be safely called when the aiter
  * has already exhausted, in which case this does nothing.
  */
 void
 abd_iter_map(struct abd_iter *aiter)
 {
 	void *paddr;
 	size_t offset = 0;
 
 	ASSERT3P(aiter->iter_mapaddr, ==, NULL);
 	ASSERT0(aiter->iter_mapsize);
 
 	/* There's nothing left to iterate over, so do nothing */
 	if (abd_iter_at_end(aiter))
 		return;
 
 	if (abd_is_linear(aiter->iter_abd)) {
 		ASSERT3U(aiter->iter_pos, ==, aiter->iter_offset);
 		offset = aiter->iter_offset;
 		aiter->iter_mapsize = aiter->iter_abd->abd_size - offset;
 		paddr = ABD_LINEAR_BUF(aiter->iter_abd);
 	} else {
 		offset = aiter->iter_offset;
 		aiter->iter_mapsize = MIN(aiter->iter_sg->length - offset,
 		    aiter->iter_abd->abd_size - aiter->iter_pos);
 
 		paddr = zfs_kmap_atomic(sg_page(aiter->iter_sg));
 	}
 
 	aiter->iter_mapaddr = (char *)paddr + offset;
 }
 
 /*
  * Unmap the current chunk from aiter. This can be safely called when the aiter
  * has already exhausted, in which case this does nothing.
  */
 void
 abd_iter_unmap(struct abd_iter *aiter)
 {
 	/* There's nothing left to unmap, so do nothing */
 	if (abd_iter_at_end(aiter))
 		return;
 
 	if (!abd_is_linear(aiter->iter_abd)) {
 		/* LINTED E_FUNC_SET_NOT_USED */
 		zfs_kunmap_atomic(aiter->iter_mapaddr - aiter->iter_offset);
 	}
 
 	ASSERT3P(aiter->iter_mapaddr, !=, NULL);
 	ASSERT3U(aiter->iter_mapsize, >, 0);
 
 	aiter->iter_mapaddr = NULL;
 	aiter->iter_mapsize = 0;
 }
 
 void
 abd_cache_reap_now(void)
 {
 }
 
 #if defined(_KERNEL)
 /*
  * Yield the next page struct and data offset and size within it, without
  * mapping it into the address space.
  */
 void
 abd_iter_page(struct abd_iter *aiter)
 {
 	if (abd_iter_at_end(aiter)) {
 		aiter->iter_page = NULL;
 		aiter->iter_page_doff = 0;
 		aiter->iter_page_dsize = 0;
 		return;
 	}
 
 	struct page *page;
 	size_t doff, dsize;
 
 	if (abd_is_linear(aiter->iter_abd)) {
 		ASSERT3U(aiter->iter_pos, ==, aiter->iter_offset);
 
 		/* memory address at iter_pos */
 		void *paddr = ABD_LINEAR_BUF(aiter->iter_abd) + aiter->iter_pos;
 
 		/* struct page for address */
 		page = is_vmalloc_addr(paddr) ?
 		    vmalloc_to_page(paddr) : virt_to_page(paddr);
 
 		/* offset of address within the page */
 		doff = offset_in_page(paddr);
 
 		/* total data remaining in abd from this position */
 		dsize = aiter->iter_abd->abd_size - aiter->iter_offset;
 	} else {
 		ASSERT(!abd_is_gang(aiter->iter_abd));
 
 		/* current scatter page */
 		page = sg_page(aiter->iter_sg);
 
 		/* position within page */
 		doff = aiter->iter_offset;
 
 		/* remaining data in scatterlist */
 		dsize = MIN(aiter->iter_sg->length - aiter->iter_offset,
 		    aiter->iter_abd->abd_size - aiter->iter_pos);
 	}
 	ASSERT(page);
 
 	if (PageTail(page)) {
 		/*
 		 * This page is part of a "compound page", which is a group of
 		 * pages that can be referenced from a single struct page *.
 		 * Its organised as a "head" page, followed by a series of
 		 * "tail" pages.
 		 *
 		 * In OpenZFS, compound pages are allocated using the
 		 * __GFP_COMP flag, which we get from scatter ABDs and SPL
 		 * vmalloc slabs (ie >16K allocations). So a great many of the
 		 * IO buffers we get are going to be of this type.
 		 *
 		 * The tail pages are just regular PAGE_SIZE pages, and can be
 		 * safely used as-is. However, the head page has length
 		 * covering itself and all the tail pages. If this ABD chunk
 		 * spans multiple pages, then we can use the head page and a
 		 * >PAGE_SIZE length, which is far more efficient.
 		 *
 		 * To do this, we need to adjust the offset to be counted from
 		 * the head page. struct page for compound pages are stored
 		 * contiguously, so we can just adjust by a simple offset.
 		 */
 		struct page *head = compound_head(page);
 		doff += ((page - head) * PAGESIZE);
 		page = head;
 	}
 
 	/* final page and position within it */
 	aiter->iter_page = page;
 	aiter->iter_page_doff = doff;
 
 	/* amount of data in the chunk, up to the end of the page */
 	aiter->iter_page_dsize = MIN(dsize, page_size(page) - doff);
 }
 
+/*
+ * Note: the ABD BIO functions below are only needed to support vdev_classic.
+ * See the comments in vdev_disk.c.
+ */
+
 /*
  * bio_nr_pages for ABD.
  * @off is the offset in @abd
  */
 unsigned long
 abd_nr_pages_off(abd_t *abd, unsigned int size, size_t off)
 {
 	unsigned long pos;
 
 	if (abd_is_gang(abd)) {
 		unsigned long count = 0;
 
 		for (abd_t *cabd = abd_gang_get_offset(abd, &off);
 		    cabd != NULL && size != 0;
 		    cabd = list_next(&ABD_GANG(abd).abd_gang_chain, cabd)) {
 			ASSERT3U(off, <, cabd->abd_size);
 			int mysize = MIN(size, cabd->abd_size - off);
 			count += abd_nr_pages_off(cabd, mysize, off);
 			size -= mysize;
 			off = 0;
 		}
 		return (count);
 	}
 
 	if (abd_is_linear(abd))
 		pos = (unsigned long)abd_to_buf(abd) + off;
 	else
 		pos = ABD_SCATTER(abd).abd_offset + off;
 
 	return (((pos + size + PAGESIZE - 1) >> PAGE_SHIFT) -
 	    (pos >> PAGE_SHIFT));
 }
 
 static unsigned int
 bio_map(struct bio *bio, void *buf_ptr, unsigned int bio_size)
 {
 	unsigned int offset, size, i;
 	struct page *page;
 
 	offset = offset_in_page(buf_ptr);
 	for (i = 0; i < bio->bi_max_vecs; i++) {
 		size = PAGE_SIZE - offset;
 
 		if (bio_size <= 0)
 			break;
 
 		if (size > bio_size)
 			size = bio_size;
 
 		if (is_vmalloc_addr(buf_ptr))
 			page = vmalloc_to_page(buf_ptr);
 		else
 			page = virt_to_page(buf_ptr);
 
 		/*
 		 * Some network related block device uses tcp_sendpage, which
 		 * doesn't behave well when using 0-count page, this is a
 		 * safety net to catch them.
 		 */
 		ASSERT3S(page_count(page), >, 0);
 
 		if (bio_add_page(bio, page, size, offset) != size)
 			break;
 
 		buf_ptr += size;
 		bio_size -= size;
 		offset = 0;
 	}
 
 	return (bio_size);
 }
 
 /*
  * bio_map for gang ABD.
  */
 static unsigned int
 abd_gang_bio_map_off(struct bio *bio, abd_t *abd,
     unsigned int io_size, size_t off)
 {
 	ASSERT(abd_is_gang(abd));
 
 	for (abd_t *cabd = abd_gang_get_offset(abd, &off);
 	    cabd != NULL;
 	    cabd = list_next(&ABD_GANG(abd).abd_gang_chain, cabd)) {
 		ASSERT3U(off, <, cabd->abd_size);
 		int size = MIN(io_size, cabd->abd_size - off);
 		int remainder = abd_bio_map_off(bio, cabd, size, off);
 		io_size -= (size - remainder);
 		if (io_size == 0 || remainder > 0)
 			return (io_size);
 		off = 0;
 	}
 	ASSERT0(io_size);
 	return (io_size);
 }
 
 /*
  * bio_map for ABD.
  * @off is the offset in @abd
  * Remaining IO size is returned
  */
 unsigned int
 abd_bio_map_off(struct bio *bio, abd_t *abd,
     unsigned int io_size, size_t off)
 {
 	struct abd_iter aiter;
 
 	ASSERT3U(io_size, <=, abd->abd_size - off);
 	if (abd_is_linear(abd))
 		return (bio_map(bio, ((char *)abd_to_buf(abd)) + off, io_size));
 
 	ASSERT(!abd_is_linear(abd));
 	if (abd_is_gang(abd))
 		return (abd_gang_bio_map_off(bio, abd, io_size, off));
 
 	abd_iter_init(&aiter, abd);
 	abd_iter_advance(&aiter, off);
 
 	for (int i = 0; i < bio->bi_max_vecs; i++) {
 		struct page *pg;
 		size_t len, sgoff, pgoff;
 		struct scatterlist *sg;
 
 		if (io_size <= 0)
 			break;
 
 		sg = aiter.iter_sg;
 		sgoff = aiter.iter_offset;
 		pgoff = sgoff & (PAGESIZE - 1);
 		len = MIN(io_size, PAGESIZE - pgoff);
 		ASSERT(len > 0);
 
 		pg = nth_page(sg_page(sg), sgoff >> PAGE_SHIFT);
 		if (bio_add_page(bio, pg, len, pgoff) != len)
 			break;
 
 		io_size -= len;
 		abd_iter_advance(&aiter, len);
 	}
 
 	return (io_size);
 }
 
 /* Tunable Parameters */
 module_param(zfs_abd_scatter_enabled, int, 0644);
 MODULE_PARM_DESC(zfs_abd_scatter_enabled,
 	"Toggle whether ABD allocations must be linear.");
 module_param(zfs_abd_scatter_min_size, int, 0644);
 MODULE_PARM_DESC(zfs_abd_scatter_min_size,
 	"Minimum size of scatter allocations.");
 /* CSTYLED */
 module_param(zfs_abd_scatter_max_order, uint, 0644);
 MODULE_PARM_DESC(zfs_abd_scatter_max_order,
 	"Maximum order allocation used for a scatter ABD.");
 
 #endif /* _KERNEL */
diff --git a/module/os/linux/zfs/vdev_disk.c b/module/os/linux/zfs/vdev_disk.c
index b0bda5fa2012..957619b87afd 100644
--- a/module/os/linux/zfs/vdev_disk.c
+++ b/module/os/linux/zfs/vdev_disk.c
@@ -1,1176 +1,1187 @@
 /*
  * CDDL HEADER START
  *
  * The contents of this file are subject to the terms of the
  * Common Development and Distribution License (the "License").
  * You may not use this file except in compliance with the License.
  *
  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
  * or https://opensource.org/licenses/CDDL-1.0.
  * See the License for the specific language governing permissions
  * and limitations under the License.
  *
  * When distributing Covered Code, include this CDDL HEADER in each
  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  * If applicable, add the following below this CDDL HEADER, with the
  * fields enclosed by brackets "[]" replaced with your own identifying
  * information: Portions Copyright [yyyy] [name of copyright owner]
  *
  * CDDL HEADER END
  */
 /*
  * Copyright (C) 2008-2010 Lawrence Livermore National Security, LLC.
  * Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
  * Rewritten for Linux by Brian Behlendorf <behlendorf1@llnl.gov>.
  * LLNL-CODE-403049.
  * Copyright (c) 2012, 2019 by Delphix. All rights reserved.
  */
 
 #include <sys/zfs_context.h>
 #include <sys/spa_impl.h>
 #include <sys/vdev_disk.h>
 #include <sys/vdev_impl.h>
 #include <sys/vdev_trim.h>
 #include <sys/abd.h>
 #include <sys/fs/zfs.h>
 #include <sys/zio.h>
 #include <linux/blkpg.h>
 #include <linux/msdos_fs.h>
 #include <linux/vfs_compat.h>
 #ifdef HAVE_LINUX_BLK_CGROUP_HEADER
 #include <linux/blk-cgroup.h>
 #endif
 
 /*
  * Linux 6.8.x uses a bdev_handle as an instance/refcount for an underlying
  * block_device. Since it carries the block_device inside, its convenient to
  * just use the handle as a proxy. For pre-6.8, we just emulate this with
  * a cast, since we don't need any of the other fields inside the handle.
  */
 #ifdef HAVE_BDEV_OPEN_BY_PATH
 typedef struct bdev_handle zfs_bdev_handle_t;
 #define	BDH_BDEV(bdh)		((bdh)->bdev)
 #define	BDH_IS_ERR(bdh)		(IS_ERR(bdh))
 #define	BDH_PTR_ERR(bdh)	(PTR_ERR(bdh))
 #define	BDH_ERR_PTR(err)	(ERR_PTR(err))
 #else
 typedef void zfs_bdev_handle_t;
 #define	BDH_BDEV(bdh)		((struct block_device *)bdh)
 #define	BDH_IS_ERR(bdh)		(IS_ERR(BDH_BDEV(bdh)))
 #define	BDH_PTR_ERR(bdh)	(PTR_ERR(BDH_BDEV(bdh)))
 #define	BDH_ERR_PTR(err)	(ERR_PTR(err))
 #endif
 
 typedef struct vdev_disk {
 	zfs_bdev_handle_t		*vd_bdh;
 	krwlock_t			vd_lock;
 } vdev_disk_t;
 
 /*
  * Unique identifier for the exclusive vdev holder.
  */
 static void *zfs_vdev_holder = VDEV_HOLDER;
 
 /*
  * Wait up to zfs_vdev_open_timeout_ms milliseconds before determining the
  * device is missing. The missing path may be transient since the links
  * can be briefly removed and recreated in response to udev events.
  */
 static uint_t zfs_vdev_open_timeout_ms = 1000;
 
 /*
  * Size of the "reserved" partition, in blocks.
  */
 #define	EFI_MIN_RESV_SIZE	(16 * 1024)
 
-/*
- * Virtual device vector for disks.
- */
-typedef struct dio_request {
-	zio_t			*dr_zio;	/* Parent ZIO */
-	atomic_t		dr_ref;		/* References */
-	int			dr_error;	/* Bio error */
-	int			dr_bio_count;	/* Count of bio's */
-	struct bio		*dr_bio[];	/* Attached bio's */
-} dio_request_t;
-
 /*
  * BIO request failfast mask.
  */
 
 static unsigned int zfs_vdev_failfast_mask = 1;
 
 #ifdef HAVE_BLK_MODE_T
 static blk_mode_t
 #else
 static fmode_t
 #endif
 vdev_bdev_mode(spa_mode_t spa_mode, boolean_t exclusive)
 {
 #ifdef HAVE_BLK_MODE_T
 	blk_mode_t mode = 0;
 
 	if (spa_mode & SPA_MODE_READ)
 		mode |= BLK_OPEN_READ;
 
 	if (spa_mode & SPA_MODE_WRITE)
 		mode |= BLK_OPEN_WRITE;
 
 	if (exclusive)
 		mode |= BLK_OPEN_EXCL;
 #else
 	fmode_t mode = 0;
 
 	if (spa_mode & SPA_MODE_READ)
 		mode |= FMODE_READ;
 
 	if (spa_mode & SPA_MODE_WRITE)
 		mode |= FMODE_WRITE;
 
 	if (exclusive)
 		mode |= FMODE_EXCL;
 #endif
 
 	return (mode);
 }
 
 /*
  * Returns the usable capacity (in bytes) for the partition or disk.
  */
 static uint64_t
 bdev_capacity(struct block_device *bdev)
 {
 	return (i_size_read(bdev->bd_inode));
 }
 
 #if !defined(HAVE_BDEV_WHOLE)
 static inline struct block_device *
 bdev_whole(struct block_device *bdev)
 {
 	return (bdev->bd_contains);
 }
 #endif
 
 #if defined(HAVE_BDEVNAME)
 #define	vdev_bdevname(bdev, name)	bdevname(bdev, name)
 #else
 static inline void
 vdev_bdevname(struct block_device *bdev, char *name)
 {
 	snprintf(name, BDEVNAME_SIZE, "%pg", bdev);
 }
 #endif
 
 /*
  * Returns the maximum expansion capacity of the block device (in bytes).
  *
  * It is possible to expand a vdev when it has been created as a wholedisk
  * and the containing block device has increased in capacity.  Or when the
  * partition containing the pool has been manually increased in size.
  *
  * This function is only responsible for calculating the potential expansion
  * size so it can be reported by 'zpool list'.  The efi_use_whole_disk() is
  * responsible for verifying the expected partition layout in the wholedisk
  * case, and updating the partition table if appropriate.  Once the partition
  * size has been increased the additional capacity will be visible using
  * bdev_capacity().
  *
  * The returned maximum expansion capacity is always expected to be larger, or
  * at the very least equal, to its usable capacity to prevent overestimating
  * the pool expandsize.
  */
 static uint64_t
 bdev_max_capacity(struct block_device *bdev, uint64_t wholedisk)
 {
 	uint64_t psize;
 	int64_t available;
 
 	if (wholedisk && bdev != bdev_whole(bdev)) {
 		/*
 		 * When reporting maximum expansion capacity for a wholedisk
 		 * deduct any capacity which is expected to be lost due to
 		 * alignment restrictions.  Over reporting this value isn't
 		 * harmful and would only result in slightly less capacity
 		 * than expected post expansion.
 		 * The estimated available space may be slightly smaller than
 		 * bdev_capacity() for devices where the number of sectors is
 		 * not a multiple of the alignment size and the partition layout
 		 * is keeping less than PARTITION_END_ALIGNMENT bytes after the
 		 * "reserved" EFI partition: in such cases return the device
 		 * usable capacity.
 		 */
 		available = i_size_read(bdev_whole(bdev)->bd_inode) -
 		    ((EFI_MIN_RESV_SIZE + NEW_START_BLOCK +
 		    PARTITION_END_ALIGNMENT) << SECTOR_BITS);
 		psize = MAX(available, bdev_capacity(bdev));
 	} else {
 		psize = bdev_capacity(bdev);
 	}
 
 	return (psize);
 }
 
 static void
 vdev_disk_error(zio_t *zio)
 {
 	/*
 	 * This function can be called in interrupt context, for instance while
 	 * handling IRQs coming from a misbehaving disk device; use printk()
 	 * which is safe from any context.
 	 */
 	printk(KERN_WARNING "zio pool=%s vdev=%s error=%d type=%d "
 	    "offset=%llu size=%llu flags=%llu\n", spa_name(zio->io_spa),
 	    zio->io_vd->vdev_path, zio->io_error, zio->io_type,
 	    (u_longlong_t)zio->io_offset, (u_longlong_t)zio->io_size,
 	    zio->io_flags);
 }
 
 static void
 vdev_disk_kobj_evt_post(vdev_t *v)
 {
 	vdev_disk_t *vd = v->vdev_tsd;
 	if (vd && vd->vd_bdh) {
 		spl_signal_kobj_evt(BDH_BDEV(vd->vd_bdh));
 	} else {
 		vdev_dbgmsg(v, "vdev_disk_t is NULL for VDEV:%s\n",
 		    v->vdev_path);
 	}
 }
 
 static zfs_bdev_handle_t *
 vdev_blkdev_get_by_path(const char *path, spa_mode_t mode, void *holder)
 {
 #if defined(HAVE_BDEV_OPEN_BY_PATH)
 	return (bdev_open_by_path(path,
 	    vdev_bdev_mode(mode, B_TRUE), holder, NULL));
 #elif defined(HAVE_BLKDEV_GET_BY_PATH_4ARG)
 	return (blkdev_get_by_path(path,
 	    vdev_bdev_mode(mode, B_TRUE), holder, NULL));
 #else
 	return (blkdev_get_by_path(path,
 	    vdev_bdev_mode(mode, B_TRUE), holder));
 #endif
 }
 
 static void
 vdev_blkdev_put(zfs_bdev_handle_t *bdh, spa_mode_t mode, void *holder)
 {
 #if defined(HAVE_BDEV_RELEASE)
 	return (bdev_release(bdh));
 #elif defined(HAVE_BLKDEV_PUT_HOLDER)
 	return (blkdev_put(BDH_BDEV(bdh), holder));
 #else
 	return (blkdev_put(BDH_BDEV(bdh),
 	    vdev_bdev_mode(mode, B_TRUE)));
 #endif
 }
 
 static int
 vdev_disk_open(vdev_t *v, uint64_t *psize, uint64_t *max_psize,
     uint64_t *logical_ashift, uint64_t *physical_ashift)
 {
 	zfs_bdev_handle_t *bdh;
 #ifdef HAVE_BLK_MODE_T
 	blk_mode_t mode = vdev_bdev_mode(spa_mode(v->vdev_spa), B_FALSE);
 #else
 	fmode_t mode = vdev_bdev_mode(spa_mode(v->vdev_spa), B_FALSE);
 #endif
 	hrtime_t timeout = MSEC2NSEC(zfs_vdev_open_timeout_ms);
 	vdev_disk_t *vd;
 
 	/* Must have a pathname and it must be absolute. */
 	if (v->vdev_path == NULL || v->vdev_path[0] != '/') {
 		v->vdev_stat.vs_aux = VDEV_AUX_BAD_LABEL;
 		vdev_dbgmsg(v, "invalid vdev_path");
 		return (SET_ERROR(EINVAL));
 	}
 
 	/*
 	 * Reopen the device if it is currently open.  When expanding a
 	 * partition force re-scanning the partition table if userland
 	 * did not take care of this already. We need to do this while closed
 	 * in order to get an accurate updated block device size.  Then
 	 * since udev may need to recreate the device links increase the
 	 * open retry timeout before reporting the device as unavailable.
 	 */
 	vd = v->vdev_tsd;
 	if (vd) {
 		char disk_name[BDEVNAME_SIZE + 6] = "/dev/";
 		boolean_t reread_part = B_FALSE;
 
 		rw_enter(&vd->vd_lock, RW_WRITER);
 		bdh = vd->vd_bdh;
 		vd->vd_bdh = NULL;
 
 		if (bdh) {
 			struct block_device *bdev = BDH_BDEV(bdh);
 			if (v->vdev_expanding && bdev != bdev_whole(bdev)) {
 				vdev_bdevname(bdev_whole(bdev), disk_name + 5);
 				/*
 				 * If userland has BLKPG_RESIZE_PARTITION,
 				 * then it should have updated the partition
 				 * table already. We can detect this by
 				 * comparing our current physical size
 				 * with that of the device. If they are
 				 * the same, then we must not have
 				 * BLKPG_RESIZE_PARTITION or it failed to
 				 * update the partition table online. We
 				 * fallback to rescanning the partition
 				 * table from the kernel below. However,
 				 * if the capacity already reflects the
 				 * updated partition, then we skip
 				 * rescanning the partition table here.
 				 */
 				if (v->vdev_psize == bdev_capacity(bdev))
 					reread_part = B_TRUE;
 			}
 
 			vdev_blkdev_put(bdh, mode, zfs_vdev_holder);
 		}
 
 		if (reread_part) {
 			bdh = vdev_blkdev_get_by_path(disk_name, mode,
 			    zfs_vdev_holder);
 			if (!BDH_IS_ERR(bdh)) {
 				int error =
 				    vdev_bdev_reread_part(BDH_BDEV(bdh));
 				vdev_blkdev_put(bdh, mode, zfs_vdev_holder);
 				if (error == 0) {
 					timeout = MSEC2NSEC(
 					    zfs_vdev_open_timeout_ms * 2);
 				}
 			}
 		}
 	} else {
 		vd = kmem_zalloc(sizeof (vdev_disk_t), KM_SLEEP);
 
 		rw_init(&vd->vd_lock, NULL, RW_DEFAULT, NULL);
 		rw_enter(&vd->vd_lock, RW_WRITER);
 	}
 
 	/*
 	 * Devices are always opened by the path provided at configuration
 	 * time.  This means that if the provided path is a udev by-id path
 	 * then drives may be re-cabled without an issue.  If the provided
 	 * path is a udev by-path path, then the physical location information
 	 * will be preserved.  This can be critical for more complicated
 	 * configurations where drives are located in specific physical
 	 * locations to maximize the systems tolerance to component failure.
 	 *
 	 * Alternatively, you can provide your own udev rule to flexibly map
 	 * the drives as you see fit.  It is not advised that you use the
 	 * /dev/[hd]d devices which may be reordered due to probing order.
 	 * Devices in the wrong locations will be detected by the higher
 	 * level vdev validation.
 	 *
 	 * The specified paths may be briefly removed and recreated in
 	 * response to udev events.  This should be exceptionally unlikely
 	 * because the zpool command makes every effort to verify these paths
 	 * have already settled prior to reaching this point.  Therefore,
 	 * a ENOENT failure at this point is highly likely to be transient
 	 * and it is reasonable to sleep and retry before giving up.  In
 	 * practice delays have been observed to be on the order of 100ms.
 	 *
 	 * When ERESTARTSYS is returned it indicates the block device is
 	 * a zvol which could not be opened due to the deadlock detection
 	 * logic in zvol_open().  Extend the timeout and retry the open
 	 * subsequent attempts are expected to eventually succeed.
 	 */
 	hrtime_t start = gethrtime();
 	bdh = BDH_ERR_PTR(-ENXIO);
 	while (BDH_IS_ERR(bdh) && ((gethrtime() - start) < timeout)) {
 		bdh = vdev_blkdev_get_by_path(v->vdev_path, mode,
 		    zfs_vdev_holder);
 		if (unlikely(BDH_PTR_ERR(bdh) == -ENOENT)) {
 			/*
 			 * There is no point of waiting since device is removed
 			 * explicitly
 			 */
 			if (v->vdev_removed)
 				break;
 
 			schedule_timeout(MSEC_TO_TICK(10));
 		} else if (unlikely(BDH_PTR_ERR(bdh) == -ERESTARTSYS)) {
 			timeout = MSEC2NSEC(zfs_vdev_open_timeout_ms * 10);
 			continue;
 		} else if (BDH_IS_ERR(bdh)) {
 			break;
 		}
 	}
 
 	if (BDH_IS_ERR(bdh)) {
 		int error = -BDH_PTR_ERR(bdh);
 		vdev_dbgmsg(v, "open error=%d timeout=%llu/%llu", error,
 		    (u_longlong_t)(gethrtime() - start),
 		    (u_longlong_t)timeout);
 		vd->vd_bdh = NULL;
 		v->vdev_tsd = vd;
 		rw_exit(&vd->vd_lock);
 		return (SET_ERROR(error));
 	} else {
 		vd->vd_bdh = bdh;
 		v->vdev_tsd = vd;
 		rw_exit(&vd->vd_lock);
 	}
 
 	struct block_device *bdev = BDH_BDEV(vd->vd_bdh);
 
 	/*  Determine the physical block size */
 	int physical_block_size = bdev_physical_block_size(bdev);
 
 	/*  Determine the logical block size */
 	int logical_block_size = bdev_logical_block_size(bdev);
 
 	/* Clear the nowritecache bit, causes vdev_reopen() to try again. */
 	v->vdev_nowritecache = B_FALSE;
 
 	/* Set when device reports it supports TRIM. */
 	v->vdev_has_trim = bdev_discard_supported(bdev);
 
 	/* Set when device reports it supports secure TRIM. */
 	v->vdev_has_securetrim = bdev_secure_discard_supported(bdev);
 
 	/* Inform the ZIO pipeline that we are non-rotational */
 	v->vdev_nonrot = blk_queue_nonrot(bdev_get_queue(bdev));
 
 	/* Physical volume size in bytes for the partition */
 	*psize = bdev_capacity(bdev);
 
 	/* Physical volume size in bytes including possible expansion space */
 	*max_psize = bdev_max_capacity(bdev, v->vdev_wholedisk);
 
 	/* Based on the minimum sector size set the block size */
 	*physical_ashift = highbit64(MAX(physical_block_size,
 	    SPA_MINBLOCKSIZE)) - 1;
 
 	*logical_ashift = highbit64(MAX(logical_block_size,
 	    SPA_MINBLOCKSIZE)) - 1;
 
 	return (0);
 }
 
 static void
 vdev_disk_close(vdev_t *v)
 {
 	vdev_disk_t *vd = v->vdev_tsd;
 
 	if (v->vdev_reopening || vd == NULL)
 		return;
 
 	if (vd->vd_bdh != NULL) {
 		vdev_blkdev_put(vd->vd_bdh, spa_mode(v->vdev_spa),
 		    zfs_vdev_holder);
 	}
 
 	rw_destroy(&vd->vd_lock);
 	kmem_free(vd, sizeof (vdev_disk_t));
 	v->vdev_tsd = NULL;
 }
 
-static dio_request_t *
-vdev_disk_dio_alloc(int bio_count)
-{
-	dio_request_t *dr = kmem_zalloc(sizeof (dio_request_t) +
-	    sizeof (struct bio *) * bio_count, KM_SLEEP);
-	atomic_set(&dr->dr_ref, 0);
-	dr->dr_bio_count = bio_count;
-	dr->dr_error = 0;
-
-	for (int i = 0; i < dr->dr_bio_count; i++)
-		dr->dr_bio[i] = NULL;
-
-	return (dr);
-}
-
-static void
-vdev_disk_dio_free(dio_request_t *dr)
-{
-	int i;
-
-	for (i = 0; i < dr->dr_bio_count; i++)
-		if (dr->dr_bio[i])
-			bio_put(dr->dr_bio[i]);
-
-	kmem_free(dr, sizeof (dio_request_t) +
-	    sizeof (struct bio *) * dr->dr_bio_count);
-}
-
-static void
-vdev_disk_dio_get(dio_request_t *dr)
-{
-	atomic_inc(&dr->dr_ref);
-}
-
-static void
-vdev_disk_dio_put(dio_request_t *dr)
-{
-	int rc = atomic_dec_return(&dr->dr_ref);
-
-	/*
-	 * Free the dio_request when the last reference is dropped and
-	 * ensure zio_interpret is called only once with the correct zio
-	 */
-	if (rc == 0) {
-		zio_t *zio = dr->dr_zio;
-		int error = dr->dr_error;
-
-		vdev_disk_dio_free(dr);
-
-		if (zio) {
-			zio->io_error = error;
-			ASSERT3S(zio->io_error, >=, 0);
-			if (zio->io_error)
-				vdev_disk_error(zio);
-
-			zio_delay_interrupt(zio);
-		}
-	}
-}
-
-BIO_END_IO_PROTO(vdev_disk_physio_completion, bio, error)
-{
-	dio_request_t *dr = bio->bi_private;
-
-	if (dr->dr_error == 0) {
-#ifdef HAVE_1ARG_BIO_END_IO_T
-		dr->dr_error = BIO_END_IO_ERROR(bio);
-#else
-		if (error)
-			dr->dr_error = -(error);
-		else if (!test_bit(BIO_UPTODATE, &bio->bi_flags))
-			dr->dr_error = EIO;
-#endif
-	}
-
-	/* Drop reference acquired by __vdev_disk_physio */
-	vdev_disk_dio_put(dr);
-}
-
 static inline void
 vdev_submit_bio_impl(struct bio *bio)
 {
 #ifdef HAVE_1ARG_SUBMIT_BIO
 	(void) submit_bio(bio);
 #else
 	(void) submit_bio(bio_data_dir(bio), bio);
 #endif
 }
 
 /*
  * preempt_schedule_notrace is GPL-only which breaks the ZFS build, so
  * replace it with preempt_schedule under the following condition:
  */
 #if defined(CONFIG_ARM64) && \
     defined(CONFIG_PREEMPTION) && \
     defined(CONFIG_BLK_CGROUP)
 #define	preempt_schedule_notrace(x) preempt_schedule(x)
 #endif
 
 /*
  * As for the Linux 5.18 kernel bio_alloc() expects a block_device struct
  * as an argument removing the need to set it with bio_set_dev().  This
  * removes the need for all of the following compatibility code.
  */
 #if !defined(HAVE_BIO_ALLOC_4ARG)
 
 #ifdef HAVE_BIO_SET_DEV
 #if defined(CONFIG_BLK_CGROUP) && defined(HAVE_BIO_SET_DEV_GPL_ONLY)
 /*
  * The Linux 5.5 kernel updated percpu_ref_tryget() which is inlined by
  * blkg_tryget() to use rcu_read_lock() instead of rcu_read_lock_sched().
  * As a side effect the function was converted to GPL-only.  Define our
  * own version when needed which uses rcu_read_lock_sched().
  *
  * The Linux 5.17 kernel split linux/blk-cgroup.h into a private and a public
  * part, moving blkg_tryget into the private one. Define our own version.
  */
 #if defined(HAVE_BLKG_TRYGET_GPL_ONLY) || !defined(HAVE_BLKG_TRYGET)
 static inline bool
 vdev_blkg_tryget(struct blkcg_gq *blkg)
 {
 	struct percpu_ref *ref = &blkg->refcnt;
 	unsigned long __percpu *count;
 	bool rc;
 
 	rcu_read_lock_sched();
 
 	if (__ref_is_percpu(ref, &count)) {
 		this_cpu_inc(*count);
 		rc = true;
 	} else {
 #ifdef ZFS_PERCPU_REF_COUNT_IN_DATA
 		rc = atomic_long_inc_not_zero(&ref->data->count);
 #else
 		rc = atomic_long_inc_not_zero(&ref->count);
 #endif
 	}
 
 	rcu_read_unlock_sched();
 
 	return (rc);
 }
 #else
 #define	vdev_blkg_tryget(bg)	blkg_tryget(bg)
 #endif
 #ifdef HAVE_BIO_SET_DEV_MACRO
 /*
  * The Linux 5.0 kernel updated the bio_set_dev() macro so it calls the
  * GPL-only bio_associate_blkg() symbol thus inadvertently converting
  * the entire macro.  Provide a minimal version which always assigns the
  * request queue's root_blkg to the bio.
  */
 static inline void
 vdev_bio_associate_blkg(struct bio *bio)
 {
 #if defined(HAVE_BIO_BDEV_DISK)
 	struct request_queue *q = bio->bi_bdev->bd_disk->queue;
 #else
 	struct request_queue *q = bio->bi_disk->queue;
 #endif
 
 	ASSERT3P(q, !=, NULL);
 	ASSERT3P(bio->bi_blkg, ==, NULL);
 
 	if (q->root_blkg && vdev_blkg_tryget(q->root_blkg))
 		bio->bi_blkg = q->root_blkg;
 }
 
 #define	bio_associate_blkg vdev_bio_associate_blkg
 #else
 static inline void
 vdev_bio_set_dev(struct bio *bio, struct block_device *bdev)
 {
 #if defined(HAVE_BIO_BDEV_DISK)
 	struct request_queue *q = bdev->bd_disk->queue;
 #else
 	struct request_queue *q = bio->bi_disk->queue;
 #endif
 	bio_clear_flag(bio, BIO_REMAPPED);
 	if (bio->bi_bdev != bdev)
 		bio_clear_flag(bio, BIO_THROTTLED);
 	bio->bi_bdev = bdev;
 
 	ASSERT3P(q, !=, NULL);
 	ASSERT3P(bio->bi_blkg, ==, NULL);
 
 	if (q->root_blkg && vdev_blkg_tryget(q->root_blkg))
 		bio->bi_blkg = q->root_blkg;
 }
 #define	bio_set_dev		vdev_bio_set_dev
 #endif
 #endif
 #else
 /*
  * Provide a bio_set_dev() helper macro for pre-Linux 4.14 kernels.
  */
 static inline void
 bio_set_dev(struct bio *bio, struct block_device *bdev)
 {
 	bio->bi_bdev = bdev;
 }
 #endif /* HAVE_BIO_SET_DEV */
 #endif /* !HAVE_BIO_ALLOC_4ARG */
 
 static inline void
 vdev_submit_bio(struct bio *bio)
 {
 	struct bio_list *bio_list = current->bio_list;
 	current->bio_list = NULL;
 	vdev_submit_bio_impl(bio);
 	current->bio_list = bio_list;
 }
 
 static inline struct bio *
 vdev_bio_alloc(struct block_device *bdev, gfp_t gfp_mask,
     unsigned short nr_vecs)
 {
 	struct bio *bio;
 
 #ifdef HAVE_BIO_ALLOC_4ARG
 	bio = bio_alloc(bdev, nr_vecs, 0, gfp_mask);
 #else
 	bio = bio_alloc(gfp_mask, nr_vecs);
 	if (likely(bio != NULL))
 		bio_set_dev(bio, bdev);
 #endif
 
 	return (bio);
 }
 
+/* ========== */
+
+/*
+ * This is the classic, battle-tested BIO submission code.
+ *
+ * These functions have been renamed to vdev_classic_* to make it clear what
+ * they belong to, but their implementations are unchanged.
+ */
+
+/*
+ * State shared by all of the bios issued for a single zio.
+ */
+typedef struct dio_request {
+	zio_t			*dr_zio;	/* Parent ZIO */
+	atomic_t		dr_ref;		/* Outstanding references */
+	int			dr_error;	/* First bio error, or 0 */
+	int			dr_bio_count;	/* Slots in dr_bio[] */
+	struct bio		*dr_bio[];	/* Attached bios */
+} dio_request_t;
+
+static dio_request_t *
+vdev_classic_dio_alloc(int bio_count)
+{
+	dio_request_t *dr = kmem_zalloc(sizeof (dio_request_t) +
+	    sizeof (struct bio *) * bio_count, KM_SLEEP);
+	atomic_set(&dr->dr_ref, 0);	/* no references held yet */
+	dr->dr_bio_count = bio_count;
+	dr->dr_error = 0;
+	/* Every slot starts empty; vdev_classic_physio() fills them in. */
+	for (int i = 0; i < dr->dr_bio_count; i++)
+		dr->dr_bio[i] = NULL;
+
+	return (dr);
+}
+
+static void
+vdev_classic_dio_free(dio_request_t *dr)
+{
+	int i;
+
+	for (i = 0; i < dr->dr_bio_count; i++)
+		if (dr->dr_bio[i])	/* slot may never have been filled */
+			bio_put(dr->dr_bio[i]);
+	/* Size must mirror the kmem_zalloc() in vdev_classic_dio_alloc(). */
+	kmem_free(dr, sizeof (dio_request_t) +
+	    sizeof (struct bio *) * dr->dr_bio_count);
+}
+
+static void
+vdev_classic_dio_get(dio_request_t *dr)
+{
+	atomic_inc(&dr->dr_ref);	/* undone by vdev_classic_dio_put() */
+}
+
+static void
+vdev_classic_dio_put(dio_request_t *dr)
+{
+	int rc = atomic_dec_return(&dr->dr_ref);
+
+	/*
+	 * On the last put, free dr (copying out what is still needed first)
+	 * and call zio_delay_interrupt() only once for the parent zio.
+	 */
+	if (rc == 0) {
+		zio_t *zio = dr->dr_zio;
+		int error = dr->dr_error;
+
+		vdev_classic_dio_free(dr);	/* dr is invalid from here */
+
+		if (zio) {
+			zio->io_error = error;
+			ASSERT3S(zio->io_error, >=, 0);
+			if (zio->io_error)
+				vdev_disk_error(zio);
+
+			zio_delay_interrupt(zio);
+		}
+	}
+}
+
+BIO_END_IO_PROTO(vdev_classic_physio_completion, bio, error)
+{
+	dio_request_t *dr = bio->bi_private;
+
+	if (dr->dr_error == 0) {	/* keep only the first error */
+#ifdef HAVE_1ARG_BIO_END_IO_T
+		dr->dr_error = BIO_END_IO_ERROR(bio);
+#else
+		if (error)
+			dr->dr_error = -(error);
+		else if (!test_bit(BIO_UPTODATE, &bio->bi_flags))
+			dr->dr_error = EIO;
+#endif
+	}
+
+	/* Drop the reference vdev_classic_physio() took for this bio */
+	vdev_classic_dio_put(dr);
+}
+
 static inline unsigned int
-vdev_bio_max_segs(zio_t *zio, int bio_size, uint64_t abd_offset)
+vdev_classic_bio_max_segs(zio_t *zio, int bio_size, uint64_t abd_offset)
 {
 	unsigned long nr_segs = abd_nr_pages_off(zio->io_abd,
 	    bio_size, abd_offset);
 
 #ifdef HAVE_BIO_MAX_SEGS
 	return (bio_max_segs(nr_segs));
 #else
 	return (MIN(nr_segs, BIO_MAX_PAGES));
 #endif
 }
 
 static int
-__vdev_disk_physio(struct block_device *bdev, zio_t *zio,
+vdev_classic_physio(struct block_device *bdev, zio_t *zio,
     size_t io_size, uint64_t io_offset, int rw, int flags)
 {
 	dio_request_t *dr;
 	uint64_t abd_offset;
 	uint64_t bio_offset;
 	int bio_size;
 	int bio_count = 16;
 	int error = 0;
 	struct blk_plug plug;
 	unsigned short nr_vecs;
 
 	/*
 	 * Accessing outside the block device is never allowed.
 	 */
 	if (io_offset + io_size > bdev->bd_inode->i_size) {
 		vdev_dbgmsg(zio->io_vd,
 		    "Illegal access %llu size %llu, device size %llu",
 		    (u_longlong_t)io_offset,
 		    (u_longlong_t)io_size,
 		    (u_longlong_t)i_size_read(bdev->bd_inode));
 		return (SET_ERROR(EIO));
 	}
 
 retry:
-	dr = vdev_disk_dio_alloc(bio_count);
+	dr = vdev_classic_dio_alloc(bio_count);
 
 	if (!(zio->io_flags & (ZIO_FLAG_IO_RETRY | ZIO_FLAG_TRYHARD)) &&
 	    zio->io_vd->vdev_failfast == B_TRUE) {
 		bio_set_flags_failfast(bdev, &flags, zfs_vdev_failfast_mask & 1,
 		    zfs_vdev_failfast_mask & 2, zfs_vdev_failfast_mask & 4);
 	}
 
 	dr->dr_zio = zio;
 
 	/*
 	 * Since bio's can have up to BIO_MAX_PAGES=256 iovec's, each of which
 	 * is at least 512 bytes and at most PAGESIZE (typically 4K), one bio
 	 * can cover at least 128KB and at most 1MB.  When the required number
 	 * of iovec's exceeds this, we are forced to break the IO in multiple
 	 * bio's and wait for them all to complete.  This is likely if the
 	 * recordsize property is increased beyond 1MB.  The default
 	 * bio_count=16 should typically accommodate the maximum-size zio of
 	 * 16MB.
 	 */
 
 	abd_offset = 0;
 	bio_offset = io_offset;
 	bio_size = io_size;
 	for (int i = 0; i <= dr->dr_bio_count; i++) {
 
 		/* Finished constructing bio's for given buffer */
 		if (bio_size <= 0)
 			break;
 
 		/*
 		 * If additional bio's are required, we have to retry, but
 		 * this should be rare - see the comment above.
 		 */
 		if (dr->dr_bio_count == i) {
-			vdev_disk_dio_free(dr);
+			vdev_classic_dio_free(dr);
 			bio_count *= 2;
 			goto retry;
 		}
 
-		nr_vecs = vdev_bio_max_segs(zio, bio_size, abd_offset);
+		nr_vecs = vdev_classic_bio_max_segs(zio, bio_size, abd_offset);
 		dr->dr_bio[i] = vdev_bio_alloc(bdev, GFP_NOIO, nr_vecs);
 		if (unlikely(dr->dr_bio[i] == NULL)) {
-			vdev_disk_dio_free(dr);
+			vdev_classic_dio_free(dr);
 			return (SET_ERROR(ENOMEM));
 		}
 
-		/* Matching put called by vdev_disk_physio_completion */
-		vdev_disk_dio_get(dr);
+		/* Matching put called by vdev_classic_physio_completion */
+		vdev_classic_dio_get(dr);
 
 		BIO_BI_SECTOR(dr->dr_bio[i]) = bio_offset >> 9;
-		dr->dr_bio[i]->bi_end_io = vdev_disk_physio_completion;
+		dr->dr_bio[i]->bi_end_io = vdev_classic_physio_completion;
 		dr->dr_bio[i]->bi_private = dr;
 		bio_set_op_attrs(dr->dr_bio[i], rw, flags);
 
 		/* Remaining size is returned to become the new size */
 		bio_size = abd_bio_map_off(dr->dr_bio[i], zio->io_abd,
 		    bio_size, abd_offset);
 
 		/* Advance in buffer and construct another bio if needed */
 		abd_offset += BIO_BI_SIZE(dr->dr_bio[i]);
 		bio_offset += BIO_BI_SIZE(dr->dr_bio[i]);
 	}
 
 	/* Extra reference to protect dio_request during vdev_submit_bio */
-	vdev_disk_dio_get(dr);
+	vdev_classic_dio_get(dr);
 
 	if (dr->dr_bio_count > 1)
 		blk_start_plug(&plug);
 
 	/* Submit all bio's associated with this dio */
 	for (int i = 0; i < dr->dr_bio_count; i++) {
 		if (dr->dr_bio[i])
 			vdev_submit_bio(dr->dr_bio[i]);
 	}
 
 	if (dr->dr_bio_count > 1)
 		blk_finish_plug(&plug);
 
-	vdev_disk_dio_put(dr);
+	vdev_classic_dio_put(dr);
 
 	return (error);
 }
 
+/* ========== */
+
 BIO_END_IO_PROTO(vdev_disk_io_flush_completion, bio, error)
 {
 	zio_t *zio = bio->bi_private;
 #ifdef HAVE_1ARG_BIO_END_IO_T
 	zio->io_error = BIO_END_IO_ERROR(bio);
 #else
 	zio->io_error = -error;
 #endif
 
 	if (zio->io_error && (zio->io_error == EOPNOTSUPP))
 		zio->io_vd->vdev_nowritecache = B_TRUE;
 
 	bio_put(bio);
 	ASSERT3S(zio->io_error, >=, 0);
 	if (zio->io_error)
 		vdev_disk_error(zio);
 	zio_interrupt(zio);
 }
 
 static int
 vdev_disk_io_flush(struct block_device *bdev, zio_t *zio)
 {
 	struct request_queue *q;
 	struct bio *bio;
 
 	q = bdev_get_queue(bdev);
 	if (!q)
 		return (SET_ERROR(ENXIO));
 
 	bio = vdev_bio_alloc(bdev, GFP_NOIO, 0);
 	if (unlikely(bio == NULL))
 		return (SET_ERROR(ENOMEM));
 
 	bio->bi_end_io = vdev_disk_io_flush_completion;
 	bio->bi_private = zio;
 	bio_set_flush(bio);
 	vdev_submit_bio(bio);
 	invalidate_bdev(bdev);
 
 	return (0);
 }
 
 #if defined(HAVE_BLKDEV_ISSUE_SECURE_ERASE) || \
 	defined(HAVE_BLKDEV_ISSUE_DISCARD_ASYNC)
 BIO_END_IO_PROTO(vdev_disk_discard_end_io, bio, error)
 {
 	zio_t *zio = bio->bi_private;
 #ifdef HAVE_1ARG_BIO_END_IO_T
 	zio->io_error = BIO_END_IO_ERROR(bio);
 #else
 	zio->io_error = -error;
 #endif
 	bio_put(bio);
 	if (zio->io_error)
 		vdev_disk_error(zio);
 	zio_interrupt(zio);
 }
 
 static int
 vdev_issue_discard_trim(zio_t *zio, unsigned long flags)
 {
 	int ret;
 	struct bio *bio = NULL;
 
 #if defined(BLKDEV_DISCARD_SECURE)
 	ret = - __blkdev_issue_discard(
 	    BDH_BDEV(((vdev_disk_t *)zio->io_vd->vdev_tsd)->vd_bdh),
 	    zio->io_offset >> 9, zio->io_size >> 9, GFP_NOFS, flags, &bio);
 #else
 	(void) flags;
 	ret = - __blkdev_issue_discard(
 	    BDH_BDEV(((vdev_disk_t *)zio->io_vd->vdev_tsd)->vd_bdh),
 	    zio->io_offset >> 9, zio->io_size >> 9, GFP_NOFS, &bio);
 #endif
 	if (!ret && bio) {
 		bio->bi_private = zio;
 		bio->bi_end_io = vdev_disk_discard_end_io;
 		vdev_submit_bio(bio);
 	}
 	return (ret);
 }
 #endif
 
 static int
 vdev_disk_io_trim(zio_t *zio)
 {
 	unsigned long trim_flags = 0;
 	if (zio->io_trim_flags & ZIO_TRIM_SECURE) {
 #if defined(HAVE_BLKDEV_ISSUE_SECURE_ERASE)
 		return (-blkdev_issue_secure_erase(
 		    BDH_BDEV(((vdev_disk_t *)zio->io_vd->vdev_tsd)->vd_bdh),
 		    zio->io_offset >> 9, zio->io_size >> 9, GFP_NOFS));
 #elif defined(BLKDEV_DISCARD_SECURE)
 		trim_flags |= BLKDEV_DISCARD_SECURE;
 #endif
 	}
 #if defined(HAVE_BLKDEV_ISSUE_SECURE_ERASE) || \
 	defined(HAVE_BLKDEV_ISSUE_DISCARD_ASYNC)
 	return (vdev_issue_discard_trim(zio, trim_flags));
 #elif defined(HAVE_BLKDEV_ISSUE_DISCARD)
 	return (-blkdev_issue_discard(
 	    BDH_BDEV(((vdev_disk_t *)zio->io_vd->vdev_tsd)->vd_bdh),
 	    zio->io_offset >> 9, zio->io_size >> 9, GFP_NOFS, trim_flags));
 #else
 #error "Unsupported kernel"
 #endif
 }
 
 static void
 vdev_disk_io_start(zio_t *zio)
 {
 	vdev_t *v = zio->io_vd;
 	vdev_disk_t *vd = v->vdev_tsd;
 	int rw, error;
 
 	/*
 	 * If the vdev is closed, it's likely in the REMOVED or FAULTED state.
 	 * Nothing to be done here but return failure.
 	 */
 	if (vd == NULL) {
 		zio->io_error = ENXIO;
 		zio_interrupt(zio);
 		return;
 	}
 
 	rw_enter(&vd->vd_lock, RW_READER);
 
 	/*
 	 * If the vdev is closed, it's likely due to a failed reopen and is
 	 * in the UNAVAIL state.  Nothing to be done here but return failure.
 	 */
 	if (vd->vd_bdh == NULL) {
 		rw_exit(&vd->vd_lock);
 		zio->io_error = ENXIO;
 		zio_interrupt(zio);
 		return;
 	}
 
 	switch (zio->io_type) {
 	case ZIO_TYPE_IOCTL:
 
 		if (!vdev_readable(v)) {
 			rw_exit(&vd->vd_lock);
 			zio->io_error = SET_ERROR(ENXIO);
 			zio_interrupt(zio);
 			return;
 		}
 
 		switch (zio->io_cmd) {
 		case DKIOCFLUSHWRITECACHE:
 
 			if (zfs_nocacheflush)
 				break;
 
 			if (v->vdev_nowritecache) {
 				zio->io_error = SET_ERROR(ENOTSUP);
 				break;
 			}
 
 			error = vdev_disk_io_flush(BDH_BDEV(vd->vd_bdh), zio);
 			if (error == 0) {
 				rw_exit(&vd->vd_lock);
 				return;
 			}
 
 			zio->io_error = error;
 
 			break;
 
 		default:
 			zio->io_error = SET_ERROR(ENOTSUP);
 		}
 
 		rw_exit(&vd->vd_lock);
 		zio_execute(zio);
 		return;
 	case ZIO_TYPE_WRITE:
 		rw = WRITE;
 		break;
 
 	case ZIO_TYPE_READ:
 		rw = READ;
 		break;
 
 	case ZIO_TYPE_TRIM:
 		zio->io_error = vdev_disk_io_trim(zio);
 		rw_exit(&vd->vd_lock);
 #if defined(HAVE_BLKDEV_ISSUE_SECURE_ERASE)
 		if (zio->io_trim_flags & ZIO_TRIM_SECURE)
 			zio_interrupt(zio);
 #elif defined(HAVE_BLKDEV_ISSUE_DISCARD)
 		zio_interrupt(zio);
 #endif
 		return;
 
 	default:
 		rw_exit(&vd->vd_lock);
 		zio->io_error = SET_ERROR(ENOTSUP);
 		zio_interrupt(zio);
 		return;
 	}
 
 	zio->io_target_timestamp = zio_handle_io_delay(zio);
-	error = __vdev_disk_physio(BDH_BDEV(vd->vd_bdh), zio,
+	error = vdev_classic_physio(BDH_BDEV(vd->vd_bdh), zio,
 	    zio->io_size, zio->io_offset, rw, 0);
 	rw_exit(&vd->vd_lock);
 
 	if (error) {
 		zio->io_error = error;
 		zio_interrupt(zio);
 		return;
 	}
 }
 
 static void
 vdev_disk_io_done(zio_t *zio)
 {
 	/*
 	 * If the device returned EIO, we revalidate the media.  If it is
 	 * determined the media has changed this triggers the asynchronous
 	 * removal of the device from the configuration.
 	 */
 	if (zio->io_error == EIO) {
 		vdev_t *v = zio->io_vd;
 		vdev_disk_t *vd = v->vdev_tsd;
 
 		if (!zfs_check_disk_status(BDH_BDEV(vd->vd_bdh))) {
 			invalidate_bdev(BDH_BDEV(vd->vd_bdh));
 			v->vdev_remove_wanted = B_TRUE;
 			spa_async_request(zio->io_spa, SPA_ASYNC_REMOVE);
 		}
 	}
 }
 
 static void
 vdev_disk_hold(vdev_t *vd)
 {
 	ASSERT(spa_config_held(vd->vdev_spa, SCL_STATE, RW_WRITER));
 
 	/* We must have a pathname, and it must be absolute. */
 	if (vd->vdev_path == NULL || vd->vdev_path[0] != '/')
 		return;
 
 	/*
 	 * Only prefetch path and devid info if the device has
 	 * never been opened.
 	 */
 	if (vd->vdev_tsd != NULL)
 		return;
 
 }
 
 static void
 vdev_disk_rele(vdev_t *vd)
 {
 	ASSERT(spa_config_held(vd->vdev_spa, SCL_STATE, RW_WRITER));
 
 	/* XXX: Implement me as a vnode rele for the device */
 }
 
 vdev_ops_t vdev_disk_ops = {
 	.vdev_op_init = NULL,
 	.vdev_op_fini = NULL,
 	.vdev_op_open = vdev_disk_open,
 	.vdev_op_close = vdev_disk_close,
 	.vdev_op_asize = vdev_default_asize,
 	.vdev_op_min_asize = vdev_default_min_asize,
 	.vdev_op_min_alloc = NULL,
 	.vdev_op_io_start = vdev_disk_io_start,
 	.vdev_op_io_done = vdev_disk_io_done,
 	.vdev_op_state_change = NULL,
 	.vdev_op_need_resilver = NULL,
 	.vdev_op_hold = vdev_disk_hold,
 	.vdev_op_rele = vdev_disk_rele,
 	.vdev_op_remap = NULL,
 	.vdev_op_xlate = vdev_default_xlate,
 	.vdev_op_rebuild_asize = NULL,
 	.vdev_op_metaslab_init = NULL,
 	.vdev_op_config_generate = NULL,
 	.vdev_op_nparity = NULL,
 	.vdev_op_ndisks = NULL,
 	.vdev_op_type = VDEV_TYPE_DISK,		/* name of this vdev type */
 	.vdev_op_leaf = B_TRUE,			/* leaf vdev */
 	.vdev_op_kobj_evt_post = vdev_disk_kobj_evt_post
 };
 
 /*
  * The zfs_vdev_scheduler module option has been deprecated. Setting this
  * value no longer has any effect.  It has not yet been entirely removed
  * to allow the module to be loaded if this option is specified in the
  * /etc/modprobe.d/zfs.conf file.  The following warning will be logged.
  */
 static int
 param_set_vdev_scheduler(const char *val, zfs_kernel_param_t *kp)
 {
 	int error = param_set_charp(val, kp);
 	if (error == 0) {
 		printk(KERN_INFO "The 'zfs_vdev_scheduler' module option "
 		    "is not supported.\n");
 	}
 
 	return (error);
 }
 
 static const char *zfs_vdev_scheduler = "unused";
 module_param_call(zfs_vdev_scheduler, param_set_vdev_scheduler,
     param_get_charp, &zfs_vdev_scheduler, 0644);
 MODULE_PARM_DESC(zfs_vdev_scheduler, "I/O scheduler");
 
 int
 param_set_min_auto_ashift(const char *buf, zfs_kernel_param_t *kp)
 {
 	uint_t val;
 	int error;
 
 	error = kstrtouint(buf, 0, &val);
 	if (error < 0)
 		return (SET_ERROR(error));
 
 	if (val < ASHIFT_MIN || val > zfs_vdev_max_auto_ashift)
 		return (SET_ERROR(-EINVAL));
 
 	error = param_set_uint(buf, kp);
 	if (error < 0)
 		return (SET_ERROR(error));
 
 	return (0);
 }
 
 int
 param_set_max_auto_ashift(const char *buf, zfs_kernel_param_t *kp)
 {
 	uint_t val;
 	int error;
 
 	error = kstrtouint(buf, 0, &val);
 	if (error < 0)
 		return (SET_ERROR(error));
 
 	if (val > ASHIFT_MAX || val < zfs_vdev_min_auto_ashift)
 		return (SET_ERROR(-EINVAL));
 
 	error = param_set_uint(buf, kp);
 	if (error < 0)
 		return (SET_ERROR(error));
 
 	return (0);
 }
 
 ZFS_MODULE_PARAM(zfs_vdev, zfs_vdev_, open_timeout_ms, UINT, ZMOD_RW,
 	"Timeout before determining that a device is missing");
 
 ZFS_MODULE_PARAM(zfs_vdev, zfs_vdev_, failfast_mask, UINT, ZMOD_RW,
 	"Defines failfast mask: 1 - device, 2 - transport, 4 - driver");