Index: head/sys/arm/arm/busdma_machdep.c
===================================================================
--- head/sys/arm/arm/busdma_machdep.c	(revision 365705)
+++ head/sys/arm/arm/busdma_machdep.c	(revision 365706)
@@ -1,1781 +1,1750 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 2012-2015 Ian Lepore
  * Copyright (c) 2010 Mark Tinguely
  * Copyright (c) 2004 Olivier Houchard
  * Copyright (c) 2002 Peter Grehan
  * Copyright (c) 1997, 1998 Justin T. Gibbs.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions, and the following disclaimer,
  *    without modification, immediately at the beginning of the file.
  * 2. The name of the author may not be used to endorse or promote products
  *    derived from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  *  From i386/busdma_machdep.c 191438 2009-04-23 20:24:19Z jhb
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/malloc.h>
 #include <sys/bus.h>
 #include <sys/busdma_bufalloc.h>
 #include <sys/counter.h>
 #include <sys/interrupt.h>
 #include <sys/kernel.h>
 #include <sys/ktr.h>
 #include <sys/lock.h>
 #include <sys/memdesc.h>
 #include <sys/proc.h>
 #include <sys/mutex.h>
 #include <sys/sysctl.h>
 #include <sys/uio.h>
 
 #include <vm/vm.h>
 #include <vm/vm_param.h>
 #include <vm/vm_page.h>
 #include <vm/vm_phys.h>
 #include <vm/vm_map.h>
 #include <vm/vm_extern.h>
 #include <vm/vm_kern.h>
 
 #include <machine/atomic.h>
 #include <machine/bus.h>
 #include <machine/cpu.h>
 #include <machine/md_var.h>
 
 #define	BUSDMA_DCACHE_ALIGN	cpuinfo.dcache_line_size
 #define	BUSDMA_DCACHE_MASK	cpuinfo.dcache_line_mask
 
 #define	MAX_BPAGES		64
 #define	MAX_DMA_SEGMENTS	4096
 #define	BUS_DMA_EXCL_BOUNCE	BUS_DMA_BUS2
 #define	BUS_DMA_ALIGN_BOUNCE	BUS_DMA_BUS3
 #define	BUS_DMA_COULD_BOUNCE	(BUS_DMA_EXCL_BOUNCE | BUS_DMA_ALIGN_BOUNCE)
 #define	BUS_DMA_MIN_ALLOC_COMP	BUS_DMA_BUS4
 
 struct bounce_zone;
 
 struct bus_dma_tag {
 	bus_dma_tag_t		parent;
 	bus_size_t		alignment;
 	bus_addr_t		boundary;
 	bus_addr_t		lowaddr;
 	bus_addr_t		highaddr;
 	bus_dma_filter_t	*filter;
 	void			*filterarg;
 	bus_size_t		maxsize;
 	u_int			nsegments;
 	bus_size_t		maxsegsz;
 	int			flags;
 	int			ref_count;
 	int			map_count;
 	bus_dma_lock_t		*lockfunc;
 	void			*lockfuncarg;
 	struct bounce_zone	*bounce_zone;
 };
 
 struct bounce_page {
 	vm_offset_t	vaddr;		/* kva of bounce buffer */
 	bus_addr_t	busaddr;	/* Physical address */
 	vm_offset_t	datavaddr;	/* kva of client data */
 	vm_page_t	datapage;	/* physical page of client data */
 	vm_offset_t	dataoffs;	/* page offset of client data */
 	bus_size_t	datacount;	/* client data count */
 	STAILQ_ENTRY(bounce_page) links;
 };
 
 struct sync_list {
 	vm_offset_t	vaddr;		/* kva of client data */
 	bus_addr_t	paddr;		/* physical address */
 	vm_page_t	pages;		/* starting page of client data */
 	bus_size_t	datacount;	/* client data count */
 };
 
 int busdma_swi_pending;
 
 struct bounce_zone {
 	STAILQ_ENTRY(bounce_zone) links;
 	STAILQ_HEAD(bp_list, bounce_page) bounce_page_list;
 	int		total_bpages;
 	int		free_bpages;
 	int		reserved_bpages;
 	int		active_bpages;
 	int		total_bounced;
 	int		total_deferred;
 	int		map_count;
 	bus_size_t	alignment;
 	bus_addr_t	lowaddr;
 	char		zoneid[8];
 	char		lowaddrid[20];
 	struct sysctl_ctx_list sysctl_tree;
 	struct sysctl_oid *sysctl_tree_top;
 };
 
 static struct mtx bounce_lock;
 static int total_bpages;
 static int busdma_zonecount;
 static uint32_t tags_total;
 static uint32_t maps_total;
 static uint32_t maps_dmamem;
 static uint32_t maps_coherent;
 static counter_u64_t maploads_total;
 static counter_u64_t maploads_bounced;
 static counter_u64_t maploads_coherent;
 static counter_u64_t maploads_dmamem;
 static counter_u64_t maploads_mbuf;
 static counter_u64_t maploads_physmem;
 
 static STAILQ_HEAD(, bounce_zone) bounce_zone_list;
 
 SYSCTL_NODE(_hw, OID_AUTO, busdma, CTLFLAG_RD | CTLFLAG_MPSAFE, 0,
     "Busdma parameters");
 SYSCTL_UINT(_hw_busdma, OID_AUTO, tags_total, CTLFLAG_RD, &tags_total, 0,
    "Number of active tags");
 SYSCTL_UINT(_hw_busdma, OID_AUTO, maps_total, CTLFLAG_RD, &maps_total, 0,
    "Number of active maps");
 SYSCTL_UINT(_hw_busdma, OID_AUTO, maps_dmamem, CTLFLAG_RD, &maps_dmamem, 0,
    "Number of active maps for bus_dmamem_alloc buffers");
 SYSCTL_UINT(_hw_busdma, OID_AUTO, maps_coherent, CTLFLAG_RD, &maps_coherent, 0,
    "Number of active maps with BUS_DMA_COHERENT flag set");
 SYSCTL_COUNTER_U64(_hw_busdma, OID_AUTO, maploads_total, CTLFLAG_RD,
     &maploads_total, "Number of load operations performed");
 SYSCTL_COUNTER_U64(_hw_busdma, OID_AUTO, maploads_bounced, CTLFLAG_RD,
     &maploads_bounced, "Number of load operations that used bounce buffers");
 SYSCTL_COUNTER_U64(_hw_busdma, OID_AUTO, maploads_coherent, CTLFLAG_RD,
     &maploads_dmamem, "Number of load operations on BUS_DMA_COHERENT memory");
 SYSCTL_COUNTER_U64(_hw_busdma, OID_AUTO, maploads_dmamem, CTLFLAG_RD,
     &maploads_dmamem, "Number of load operations on bus_dmamem_alloc buffers");
 SYSCTL_COUNTER_U64(_hw_busdma, OID_AUTO, maploads_mbuf, CTLFLAG_RD,
     &maploads_mbuf, "Number of load operations for mbufs");
 SYSCTL_COUNTER_U64(_hw_busdma, OID_AUTO, maploads_physmem, CTLFLAG_RD,
     &maploads_physmem, "Number of load operations on physical buffers");
 SYSCTL_INT(_hw_busdma, OID_AUTO, total_bpages, CTLFLAG_RD, &total_bpages, 0,
    "Total bounce pages");
 
 struct bus_dmamap {
 	struct bp_list		bpages;
 	int			pagesneeded;
 	int			pagesreserved;
 	bus_dma_tag_t		dmat;
 	struct memdesc		mem;
 	bus_dmamap_callback_t	*callback;
 	void			*callback_arg;
 	int			flags;
 #define	DMAMAP_COHERENT		(1 << 0)
 #define	DMAMAP_DMAMEM_ALLOC	(1 << 1)
 #define	DMAMAP_MBUF		(1 << 2)
 	STAILQ_ENTRY(bus_dmamap) links;
 	bus_dma_segment_t	*segments;
 	int			sync_count;
 	struct sync_list	slist[];
 };
 
 static STAILQ_HEAD(, bus_dmamap) bounce_map_waitinglist;
 static STAILQ_HEAD(, bus_dmamap) bounce_map_callbacklist;
 
 static void init_bounce_pages(void *dummy);
 static int alloc_bounce_zone(bus_dma_tag_t dmat);
 static int alloc_bounce_pages(bus_dma_tag_t dmat, u_int numpages);
 static int reserve_bounce_pages(bus_dma_tag_t dmat, bus_dmamap_t map,
     int commit);
 static bus_addr_t add_bounce_page(bus_dma_tag_t dmat, bus_dmamap_t map,
     vm_offset_t vaddr, bus_addr_t addr, bus_size_t size);
 static void free_bounce_page(bus_dma_tag_t dmat, struct bounce_page *bpage);
 static void _bus_dmamap_count_pages(bus_dma_tag_t dmat, pmap_t pmap,
     bus_dmamap_t map, void *buf, bus_size_t buflen, int flags);
 static void _bus_dmamap_count_phys(bus_dma_tag_t dmat, bus_dmamap_t map,
     vm_paddr_t buf, bus_size_t buflen, int flags);
 static int _bus_dmamap_reserve_pages(bus_dma_tag_t dmat, bus_dmamap_t map,
     int flags);
 static void dma_preread_safe(vm_offset_t va, vm_paddr_t pa, vm_size_t size);
 static void dma_dcache_sync(struct sync_list *sl, bus_dmasync_op_t op);
 
 static busdma_bufalloc_t coherent_allocator;	/* Cache of coherent buffers */
 static busdma_bufalloc_t standard_allocator;	/* Cache of standard buffers */
 
 MALLOC_DEFINE(M_BUSDMA, "busdma", "busdma metadata");
 MALLOC_DEFINE(M_BOUNCE, "bounce", "busdma bounce pages");
 
 static void
 busdma_init(void *dummy)
 {
 	int uma_flags;
 
 	maploads_total    = counter_u64_alloc(M_WAITOK);
 	maploads_bounced  = counter_u64_alloc(M_WAITOK);
 	maploads_coherent = counter_u64_alloc(M_WAITOK);
 	maploads_dmamem   = counter_u64_alloc(M_WAITOK);
 	maploads_mbuf     = counter_u64_alloc(M_WAITOK);
 	maploads_physmem  = counter_u64_alloc(M_WAITOK);
 
 	uma_flags = 0;
 
 	/* Create a cache of buffers in standard (cacheable) memory. */
 	standard_allocator = busdma_bufalloc_create("buffer",
 	    BUSDMA_DCACHE_ALIGN,/* minimum_alignment */
 	    NULL,		/* uma_alloc func */
 	    NULL,		/* uma_free func */
 	    uma_flags);		/* uma_zcreate_flags */
 
 #ifdef INVARIANTS
 	/*
 	 * Force UMA zone to allocate service structures like
 	 * slabs using own allocator. uma_debug code performs
 	 * atomic ops on uma_slab_t fields and safety of this
 	 * operation is not guaranteed for write-back caches
 	 */
 	uma_flags = UMA_ZONE_NOTOUCH;
 #endif
 	/*
 	 * Create a cache of buffers in uncacheable memory, to implement the
 	 * BUS_DMA_COHERENT (and potentially BUS_DMA_NOCACHE) flag.
 	 */
 	coherent_allocator = busdma_bufalloc_create("coherent",
 	    BUSDMA_DCACHE_ALIGN,/* minimum_alignment */
 	    busdma_bufalloc_alloc_uncacheable,
 	    busdma_bufalloc_free_uncacheable,
 	    uma_flags);	/* uma_zcreate_flags */
 }
 
 /*
  * This init historically used SI_SUB_VM, but now the init code requires
  * malloc(9) using M_BUSDMA memory and the pcpu zones for counter(9), which get
  * set up by SI_SUB_KMEM and SI_ORDER_LAST, so we'll go right after that by
  * using SI_SUB_KMEM+1.
  */
 SYSINIT(busdma, SI_SUB_KMEM+1, SI_ORDER_FIRST, busdma_init, NULL);
 
 /*
  * This routine checks the exclusion zone constraints from a tag against the
  * physical RAM available on the machine.  If a tag specifies an exclusion zone
  * but there's no RAM in that zone, then we avoid allocating resources to bounce
  * a request, and we can use any memory allocator (as opposed to needing
  * kmem_alloc_contig() just because it can allocate pages in an address range).
  *
  * Most tags have BUS_SPACE_MAXADDR or BUS_SPACE_MAXADDR_32BIT (they are the
  * same value on 32-bit architectures) as their lowaddr constraint, and we can't
  * possibly have RAM at an address higher than the highest address we can
  * express, so we take a fast out.
  */
 static int
 exclusion_bounce_check(vm_offset_t lowaddr, vm_offset_t highaddr)
 {
 	int i;
 
 	if (lowaddr >= BUS_SPACE_MAXADDR)
 		return (0);
 
 	for (i = 0; phys_avail[i] && phys_avail[i + 1]; i += 2) {
 		if ((lowaddr >= phys_avail[i] && lowaddr < phys_avail[i + 1]) ||
 		    (lowaddr < phys_avail[i] && highaddr >= phys_avail[i]))
 			return (1);
 	}
 	return (0);
 }
 
 /*
  * Return true if the tag has an exclusion zone that could lead to bouncing.
  */
 static __inline int
 exclusion_bounce(bus_dma_tag_t dmat)
 {
 
 	return (dmat->flags & BUS_DMA_EXCL_BOUNCE);
 }
 
 /*
  * Return true if the given address does not fall on the alignment boundary.
  */
 static __inline int
 alignment_bounce(bus_dma_tag_t dmat, bus_addr_t addr)
 {
 
 	return (addr & (dmat->alignment - 1));
 }
 
 /*
  * Return true if the DMA should bounce because the start or end does not fall
  * on a cacheline boundary (which would require a partial cacheline flush).
  * COHERENT memory doesn't trigger cacheline flushes.  Memory allocated by
  * bus_dmamem_alloc() is always aligned to cacheline boundaries, and there's a
  * strict rule that such memory cannot be accessed by the CPU while DMA is in
  * progress (or by multiple DMA engines at once), so that it's always safe to do
  * full cacheline flushes even if that affects memory outside the range of a
  * given DMA operation that doesn't involve the full allocated buffer.  If we're
  * mapping an mbuf, that follows the same rules as a buffer we allocated.
  */
 static __inline int
 cacheline_bounce(bus_dmamap_t map, bus_addr_t addr, bus_size_t size)
 {
 
 	if (map->flags & (DMAMAP_DMAMEM_ALLOC | DMAMAP_COHERENT | DMAMAP_MBUF))
 		return (0);
 	return ((addr | size) & BUSDMA_DCACHE_MASK);
 }
 
 /*
  * Return true if we might need to bounce the DMA described by addr and size.
  *
  * This is used to quick-check whether we need to do the more expensive work of
  * checking the DMA page-by-page looking for alignment and exclusion bounces.
  *
  * Note that the addr argument might be either virtual or physical.  It doesn't
  * matter because we only look at the low-order bits, which are the same in both
  * address spaces and maximum alignment of generic buffer is limited up to page
  * size.
  * Bouncing of buffers allocated by bus_dmamem_alloc()is not necessary, these
  * always comply with the required rules (alignment, boundary, and address
  * range).
  */
 static __inline int
 might_bounce(bus_dma_tag_t dmat, bus_dmamap_t map, bus_addr_t addr,
     bus_size_t size)
 {
 
 	KASSERT(map->flags & DMAMAP_DMAMEM_ALLOC ||
 	    dmat->alignment <= PAGE_SIZE,
 	    ("%s: unsupported alignment (0x%08lx) for buffer not "
 	    "allocated by bus_dmamem_alloc()",
 	    __func__, dmat->alignment));
 
 	return (!(map->flags & DMAMAP_DMAMEM_ALLOC) &&
 	    ((dmat->flags & BUS_DMA_EXCL_BOUNCE) ||
 	    alignment_bounce(dmat, addr) ||
 	    cacheline_bounce(map, addr, size)));
 }
 
 /*
  * Return true if we must bounce the DMA described by paddr and size.
  *
  * Bouncing can be triggered by DMA that doesn't begin and end on cacheline
  * boundaries, or doesn't begin on an alignment boundary, or falls within the
  * exclusion zone of any tag in the ancestry chain.
  *
  * For exclusions, walk the chain of tags comparing paddr to the exclusion zone
  * within each tag.  If the tag has a filter function, use it to decide whether
  * the DMA needs to bounce, otherwise any DMA within the zone bounces.
  */
 static int
 must_bounce(bus_dma_tag_t dmat, bus_dmamap_t map, bus_addr_t paddr,
     bus_size_t size)
 {
 
 	if (cacheline_bounce(map, paddr, size))
 		return (1);
 
 	/*
 	 *  The tag already contains ancestors' alignment restrictions so this
 	 *  check doesn't need to be inside the loop.
 	 */
 	if (alignment_bounce(dmat, paddr))
 		return (1);
 
 	/*
 	 * Even though each tag has an exclusion zone that is a superset of its
 	 * own and all its ancestors' exclusions, the exclusion zone of each tag
 	 * up the chain must be checked within the loop, because the busdma
 	 * rules say the filter function is called only when the address lies
 	 * within the low-highaddr range of the tag that filterfunc belongs to.
 	 */
 	while (dmat != NULL && exclusion_bounce(dmat)) {
 		if ((paddr >= dmat->lowaddr && paddr <= dmat->highaddr) &&
 		    (dmat->filter == NULL ||
 		    dmat->filter(dmat->filterarg, paddr) != 0))
 			return (1);
 		dmat = dmat->parent;
 	}
 
 	return (0);
 }
 
 /*
  * Convenience function for manipulating driver locks from busdma (during
  * busdma_swi, for example).  Drivers that don't provide their own locks
  * should specify &Giant to dmat->lockfuncarg.  Drivers that use their own
  * non-mutex locking scheme don't have to use this at all.
  */
 void
 busdma_lock_mutex(void *arg, bus_dma_lock_op_t op)
 {
 	struct mtx *dmtx;
 
 	dmtx = (struct mtx *)arg;
 	switch (op) {
 	case BUS_DMA_LOCK:
 		mtx_lock(dmtx);
 		break;
 	case BUS_DMA_UNLOCK:
 		mtx_unlock(dmtx);
 		break;
 	default:
 		panic("Unknown operation 0x%x for busdma_lock_mutex!", op);
 	}
 }
 
 /*
  * dflt_lock should never get called.  It gets put into the dma tag when
  * lockfunc == NULL, which is only valid if the maps that are associated
  * with the tag are meant to never be defered.
  * XXX Should have a way to identify which driver is responsible here.
  */
 static void
 dflt_lock(void *arg, bus_dma_lock_op_t op)
 {
 
 	panic("driver error: busdma dflt_lock called");
 }
 
 /*
  * Allocate a device specific dma_tag.
  */
 int
 bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
     bus_addr_t boundary, bus_addr_t lowaddr, bus_addr_t highaddr,
     bus_dma_filter_t *filter, void *filterarg, bus_size_t maxsize,
     int nsegments, bus_size_t maxsegsz, int flags, bus_dma_lock_t *lockfunc,
     void *lockfuncarg, bus_dma_tag_t *dmat)
 {
 	bus_dma_tag_t newtag;
 	int error = 0;
 
 	/* Basic sanity checking. */
 	KASSERT(boundary == 0 || powerof2(boundary),
 	    ("dma tag boundary %lu, must be a power of 2", boundary));
 	KASSERT(boundary == 0 || boundary >= maxsegsz,
 	    ("dma tag boundary %lu is < maxsegsz %lu\n", boundary, maxsegsz));
 	KASSERT(alignment != 0 && powerof2(alignment),
 	    ("dma tag alignment %lu, must be non-zero power of 2", alignment));
 	KASSERT(maxsegsz != 0, ("dma tag maxsegsz must not be zero"));
 
 	/* Return a NULL tag on failure */
 	*dmat = NULL;
 
 	newtag = (bus_dma_tag_t)malloc(sizeof(*newtag), M_BUSDMA,
 	    M_ZERO | M_NOWAIT);
 	if (newtag == NULL) {
 		CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 		    __func__, newtag, 0, error);
 		return (ENOMEM);
 	}
 
 	newtag->parent = parent;
 	newtag->alignment = alignment;
 	newtag->boundary = boundary;
 	newtag->lowaddr = trunc_page((vm_paddr_t)lowaddr) + (PAGE_SIZE - 1);
 	newtag->highaddr = trunc_page((vm_paddr_t)highaddr) +
 	    (PAGE_SIZE - 1);
 	newtag->filter = filter;
 	newtag->filterarg = filterarg;
 	newtag->maxsize = maxsize;
 	newtag->nsegments = nsegments;
 	newtag->maxsegsz = maxsegsz;
 	newtag->flags = flags;
 	newtag->ref_count = 1; /* Count ourself */
 	newtag->map_count = 0;
 	if (lockfunc != NULL) {
 		newtag->lockfunc = lockfunc;
 		newtag->lockfuncarg = lockfuncarg;
 	} else {
 		newtag->lockfunc = dflt_lock;
 		newtag->lockfuncarg = NULL;
 	}
 
 	/* Take into account any restrictions imposed by our parent tag */
 	if (parent != NULL) {
 		newtag->lowaddr = MIN(parent->lowaddr, newtag->lowaddr);
 		newtag->highaddr = MAX(parent->highaddr, newtag->highaddr);
 		newtag->alignment = MAX(parent->alignment, newtag->alignment);
 		newtag->flags |= parent->flags & BUS_DMA_COULD_BOUNCE;
 		newtag->flags |= parent->flags & BUS_DMA_COHERENT;
 		if (newtag->boundary == 0)
 			newtag->boundary = parent->boundary;
 		else if (parent->boundary != 0)
 			newtag->boundary = MIN(parent->boundary,
 					       newtag->boundary);
 		if (newtag->filter == NULL) {
 			/*
 			 * Short circuit to looking at our parent directly
 			 * since we have encapsulated all of its information
 			 */
 			newtag->filter = parent->filter;
 			newtag->filterarg = parent->filterarg;
 			newtag->parent = parent->parent;
 		}
 		if (newtag->parent != NULL)
 			atomic_add_int(&parent->ref_count, 1);
 	}
 
 	if (exclusion_bounce_check(newtag->lowaddr, newtag->highaddr))
 		newtag->flags |= BUS_DMA_EXCL_BOUNCE;
 	if (alignment_bounce(newtag, 1))
 		newtag->flags |= BUS_DMA_ALIGN_BOUNCE;
 
 	/*
 	 * Any request can auto-bounce due to cacheline alignment, in addition
 	 * to any alignment or boundary specifications in the tag, so if the
 	 * ALLOCNOW flag is set, there's always work to do.
 	 */
 	if ((flags & BUS_DMA_ALLOCNOW) != 0) {
 		struct bounce_zone *bz;
 		/*
 		 * Round size up to a full page, and add one more page because
 		 * there can always be one more boundary crossing than the
 		 * number of pages in a transfer.
 		 */
 		maxsize = roundup2(maxsize, PAGE_SIZE) + PAGE_SIZE;
 
 		if ((error = alloc_bounce_zone(newtag)) != 0) {
 			free(newtag, M_BUSDMA);
 			return (error);
 		}
 		bz = newtag->bounce_zone;
 
 		if (ptoa(bz->total_bpages) < maxsize) {
 			int pages;
 
 			pages = atop(maxsize) - bz->total_bpages;
 
 			/* Add pages to our bounce pool */
 			if (alloc_bounce_pages(newtag, pages) < pages)
 				error = ENOMEM;
 		}
 		/* Performed initial allocation */
 		newtag->flags |= BUS_DMA_MIN_ALLOC_COMP;
 	} else
 		newtag->bounce_zone = NULL;
 
 	if (error != 0) {
 		free(newtag, M_BUSDMA);
 	} else {
 		atomic_add_32(&tags_total, 1);
 		*dmat = newtag;
 	}
 	CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 	    __func__, newtag, (newtag != NULL ? newtag->flags : 0), error);
 	return (error);
 }
 
 void
-bus_dma_template_init(bus_dma_tag_template_t *t, bus_dma_tag_t parent)
-{
-
-	if (t == NULL)
-		return;
-
-	t->parent = parent;
-	t->alignment = 1;
-	t->boundary = 0;
-	t->lowaddr = t->highaddr = BUS_SPACE_MAXADDR;
-	t->maxsize = t->maxsegsize = BUS_SPACE_MAXSIZE;
-	t->nsegments = BUS_SPACE_UNRESTRICTED;
-	t->lockfunc = NULL;
-	t->lockfuncarg = NULL;
-	t->flags = 0;
-}
-
-int
-bus_dma_template_tag(bus_dma_tag_template_t *t, bus_dma_tag_t *dmat)
-{
-
-	if (t == NULL || dmat == NULL)
-		return (EINVAL);
-
-	return (bus_dma_tag_create(t->parent, t->alignment, t->boundary,
-	    t->lowaddr, t->highaddr, NULL, NULL, t->maxsize,
-	    t->nsegments, t->maxsegsize, t->flags, t->lockfunc, t->lockfuncarg,
-	    dmat));
-}
-
-void
-bus_dma_template_clone(bus_dma_tag_template_t *t, bus_dma_tag_t dmat)
+bus_dma_template_clone(bus_dma_template_t *t, bus_dma_tag_t dmat)
 {
 
 	if (t == NULL || dmat == NULL)
 		return;
 
 	t->parent = dmat->parent;
 	t->alignment = dmat->alignment;
 	t->boundary = dmat->boundary;
 	t->lowaddr = dmat->lowaddr;
 	t->highaddr = dmat->highaddr;
 	t->maxsize = dmat->maxsize;
 	t->nsegments = dmat->nsegments;
 	t->maxsegsize = dmat->maxsegsz;
 	t->flags = dmat->flags;
 	t->lockfunc = dmat->lockfunc;
 	t->lockfuncarg = dmat->lockfuncarg;
 }
 
 int
 bus_dma_tag_set_domain(bus_dma_tag_t dmat, int domain)
 {
 
 	return (0);
 }
 
 int
 bus_dma_tag_destroy(bus_dma_tag_t dmat)
 {
 	bus_dma_tag_t dmat_copy;
 	int error;
 
 	error = 0;
 	dmat_copy = dmat;
 
 	if (dmat != NULL) {
 		if (dmat->map_count != 0) {
 			error = EBUSY;
 			goto out;
 		}
 
 		while (dmat != NULL) {
 			bus_dma_tag_t parent;
 
 			parent = dmat->parent;
 			atomic_subtract_int(&dmat->ref_count, 1);
 			if (dmat->ref_count == 0) {
 				atomic_subtract_32(&tags_total, 1);
 				free(dmat, M_BUSDMA);
 				/*
 				 * Last reference count, so
 				 * release our reference
 				 * count on our parent.
 				 */
 				dmat = parent;
 			} else
 				dmat = NULL;
 		}
 	}
 out:
 	CTR3(KTR_BUSDMA, "%s tag %p error %d", __func__, dmat_copy, error);
 	return (error);
 }
 
 static int
 allocate_bz_and_pages(bus_dma_tag_t dmat, bus_dmamap_t mapp)
 {
 	struct bounce_zone *bz;
 	int maxpages;
 	int error;
 
 	if (dmat->bounce_zone == NULL)
 		if ((error = alloc_bounce_zone(dmat)) != 0)
 			return (error);
 	bz = dmat->bounce_zone;
 	/* Initialize the new map */
 	STAILQ_INIT(&(mapp->bpages));
 
 	/*
 	 * Attempt to add pages to our pool on a per-instance basis up to a sane
 	 * limit.  Even if the tag isn't flagged as COULD_BOUNCE due to
 	 * alignment and boundary constraints, it could still auto-bounce due to
 	 * cacheline alignment, which requires at most two bounce pages.
 	 */
 	if (dmat->flags & BUS_DMA_COULD_BOUNCE)
 		maxpages = MAX_BPAGES;
 	else
 		maxpages = 2 * bz->map_count;
 	if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0 ||
 	    (bz->map_count > 0 && bz->total_bpages < maxpages)) {
 		int pages;
 
 		pages = atop(roundup2(dmat->maxsize, PAGE_SIZE)) + 1;
 		pages = MIN(maxpages - bz->total_bpages, pages);
 		pages = MAX(pages, 2);
 		if (alloc_bounce_pages(dmat, pages) < pages)
 			return (ENOMEM);
 
 		if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0)
 			dmat->flags |= BUS_DMA_MIN_ALLOC_COMP;
 	}
 	bz->map_count++;
 	return (0);
 }
 
 static bus_dmamap_t
 allocate_map(bus_dma_tag_t dmat, int mflags)
 {
 	int mapsize, segsize;
 	bus_dmamap_t map;
 
 	/*
 	 * Allocate the map.  The map structure ends with an embedded
 	 * variable-sized array of sync_list structures.  Following that
 	 * we allocate enough extra space to hold the array of bus_dma_segments.
 	 */
 	KASSERT(dmat->nsegments <= MAX_DMA_SEGMENTS,
 	   ("cannot allocate %u dma segments (max is %u)",
 	    dmat->nsegments, MAX_DMA_SEGMENTS));
 	segsize = sizeof(struct bus_dma_segment) * dmat->nsegments;
 	mapsize = sizeof(*map) + sizeof(struct sync_list) * dmat->nsegments;
 	map = malloc(mapsize + segsize, M_BUSDMA, mflags | M_ZERO);
 	if (map == NULL) {
 		CTR3(KTR_BUSDMA, "%s: tag %p error %d", __func__, dmat, ENOMEM);
 		return (NULL);
 	}
 	map->segments = (bus_dma_segment_t *)((uintptr_t)map + mapsize);
 	STAILQ_INIT(&map->bpages);
 	return (map);
 }
 
 /*
  * Allocate a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 int
 bus_dmamap_create(bus_dma_tag_t dmat, int flags, bus_dmamap_t *mapp)
 {
 	bus_dmamap_t map;
 	int error = 0;
 
 	*mapp = map = allocate_map(dmat, M_NOWAIT);
 	if (map == NULL) {
 		CTR3(KTR_BUSDMA, "%s: tag %p error %d", __func__, dmat, ENOMEM);
 		return (ENOMEM);
 	}
 
 	/*
 	 * Bouncing might be required if the driver asks for an exclusion
 	 * region, a data alignment that is stricter than 1, or DMA that begins
 	 * or ends with a partial cacheline.  Whether bouncing will actually
 	 * happen can't be known until mapping time, but we need to pre-allocate
 	 * resources now because we might not be allowed to at mapping time.
 	 */
 	error = allocate_bz_and_pages(dmat, map);
 	if (error != 0) {
 		free(map, M_BUSDMA);
 		*mapp = NULL;
 		return (error);
 	}
 	if (map->flags & DMAMAP_COHERENT)
 		atomic_add_32(&maps_coherent, 1);
 	atomic_add_32(&maps_total, 1);
 	dmat->map_count++;
 
 	return (0);
 }
 
 /*
  * Destroy a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 int
 bus_dmamap_destroy(bus_dma_tag_t dmat, bus_dmamap_t map)
 {
 
 	if (STAILQ_FIRST(&map->bpages) != NULL || map->sync_count != 0) {
 		CTR3(KTR_BUSDMA, "%s: tag %p error %d",
 		    __func__, dmat, EBUSY);
 		return (EBUSY);
 	}
 	if (dmat->bounce_zone)
 		dmat->bounce_zone->map_count--;
 	if (map->flags & DMAMAP_COHERENT)
 		atomic_subtract_32(&maps_coherent, 1);
 	atomic_subtract_32(&maps_total, 1);
 	free(map, M_BUSDMA);
 	dmat->map_count--;
 	CTR2(KTR_BUSDMA, "%s: tag %p error 0", __func__, dmat);
 	return (0);
 }
 
 /*
  * Allocate a piece of memory that can be efficiently mapped into bus device
  * space based on the constraints listed in the dma tag.  Returns a pointer to
  * the allocated memory, and a pointer to an associated bus_dmamap.
  */
 int
 bus_dmamem_alloc(bus_dma_tag_t dmat, void **vaddr, int flags,
     bus_dmamap_t *mapp)
 {
 	busdma_bufalloc_t ba;
 	struct busdma_bufzone *bufzone;
 	bus_dmamap_t map;
 	vm_memattr_t memattr;
 	int mflags;
 
 	if (flags & BUS_DMA_NOWAIT)
 		mflags = M_NOWAIT;
 	else
 		mflags = M_WAITOK;
 	if (flags & BUS_DMA_ZERO)
 		mflags |= M_ZERO;
 
 	*mapp = map = allocate_map(dmat, mflags);
 	if (map == NULL) {
 		CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 		    __func__, dmat, dmat->flags, ENOMEM);
 		return (ENOMEM);
 	}
 	map->flags = DMAMAP_DMAMEM_ALLOC;
 
 	/* For coherent memory, set the map flag that disables sync ops. */
 	if (flags & BUS_DMA_COHERENT)
 		map->flags |= DMAMAP_COHERENT;
 
 	/*
 	 * Choose a busdma buffer allocator based on memory type flags.
 	 * If the tag's COHERENT flag is set, that means normal memory
 	 * is already coherent, use the normal allocator.
 	 */
 	if ((flags & BUS_DMA_COHERENT) &&
 	    ((dmat->flags & BUS_DMA_COHERENT) == 0)) {
 		memattr = VM_MEMATTR_UNCACHEABLE;
 		ba = coherent_allocator;
 	} else {
 		memattr = VM_MEMATTR_DEFAULT;
 		ba = standard_allocator;
 	}
 
 	/*
 	 * Try to find a bufzone in the allocator that holds a cache of buffers
 	 * of the right size for this request.  If the buffer is too big to be
 	 * held in the allocator cache, this returns NULL.
 	 */
 	bufzone = busdma_bufalloc_findzone(ba, dmat->maxsize);
 
 	/*
 	 * Allocate the buffer from the uma(9) allocator if...
 	 *  - It's small enough to be in the allocator (bufzone not NULL).
 	 *  - The alignment constraint isn't larger than the allocation size
 	 *    (the allocator aligns buffers to their size boundaries).
 	 *  - There's no need to handle lowaddr/highaddr exclusion zones.
 	 * else allocate non-contiguous pages if...
 	 *  - The page count that could get allocated doesn't exceed
 	 *    nsegments also when the maximum segment size is less
 	 *    than PAGE_SIZE.
 	 *  - The alignment constraint isn't larger than a page boundary.
 	 *  - There are no boundary-crossing constraints.
 	 * else allocate a block of contiguous pages because one or more of the
 	 * constraints is something that only the contig allocator can fulfill.
 	 */
 	if (bufzone != NULL && dmat->alignment <= bufzone->size &&
 	    !exclusion_bounce(dmat)) {
 		*vaddr = uma_zalloc(bufzone->umazone, mflags);
 	} else if (dmat->nsegments >=
 	    howmany(dmat->maxsize, MIN(dmat->maxsegsz, PAGE_SIZE)) &&
 	    dmat->alignment <= PAGE_SIZE &&
 	    (dmat->boundary % PAGE_SIZE) == 0) {
 		*vaddr = (void *)kmem_alloc_attr(dmat->maxsize, mflags, 0,
 		    dmat->lowaddr, memattr);
 	} else {
 		*vaddr = (void *)kmem_alloc_contig(dmat->maxsize, mflags, 0,
 		    dmat->lowaddr, dmat->alignment, dmat->boundary, memattr);
 	}
 	if (*vaddr == NULL) {
 		CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 		    __func__, dmat, dmat->flags, ENOMEM);
 		free(map, M_BUSDMA);
 		*mapp = NULL;
 		return (ENOMEM);
 	}
 	if (map->flags & DMAMAP_COHERENT)
 		atomic_add_32(&maps_coherent, 1);
 	atomic_add_32(&maps_dmamem, 1);
 	atomic_add_32(&maps_total, 1);
 	dmat->map_count++;
 
 	CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 	    __func__, dmat, dmat->flags, 0);
 	return (0);
 }
 
 /*
  * Free a piece of memory that was allocated via bus_dmamem_alloc, along with
  * its associated map.
  */
 void
 bus_dmamem_free(bus_dma_tag_t dmat, void *vaddr, bus_dmamap_t map)
 {
 	struct busdma_bufzone *bufzone;
 	busdma_bufalloc_t ba;
 
 	if ((map->flags & DMAMAP_COHERENT) &&
 	    ((dmat->flags & BUS_DMA_COHERENT) == 0))
 		ba = coherent_allocator;
 	else
 		ba = standard_allocator;
 
 	bufzone = busdma_bufalloc_findzone(ba, dmat->maxsize);
 
 	if (bufzone != NULL && dmat->alignment <= bufzone->size &&
 	    !exclusion_bounce(dmat))
 		uma_zfree(bufzone->umazone, vaddr);
 	else
 		kmem_free((vm_offset_t)vaddr, dmat->maxsize);
 
 	dmat->map_count--;
 	if (map->flags & DMAMAP_COHERENT)
 		atomic_subtract_32(&maps_coherent, 1);
 	atomic_subtract_32(&maps_total, 1);
 	atomic_subtract_32(&maps_dmamem, 1);
 	free(map, M_BUSDMA);
 	CTR3(KTR_BUSDMA, "%s: tag %p flags 0x%x", __func__, dmat, dmat->flags);
 }
 
 static void
 _bus_dmamap_count_phys(bus_dma_tag_t dmat, bus_dmamap_t map, vm_paddr_t buf,
     bus_size_t buflen, int flags)
 {
 	bus_addr_t curaddr;
 	bus_size_t sgsize;
 
 	if (map->pagesneeded == 0) {
 		CTR5(KTR_BUSDMA, "lowaddr= %d, boundary= %d, alignment= %d"
 		    " map= %p, pagesneeded= %d",
 		    dmat->lowaddr, dmat->boundary, dmat->alignment,
 		    map, map->pagesneeded);
 		/*
 		 * Count the number of bounce pages
 		 * needed in order to complete this transfer
 		 */
 		curaddr = buf;
 		while (buflen != 0) {
 			sgsize = MIN(buflen, dmat->maxsegsz);
 			if (must_bounce(dmat, map, curaddr, sgsize) != 0) {
 				sgsize = MIN(sgsize,
 				    PAGE_SIZE - (curaddr & PAGE_MASK));
 				map->pagesneeded++;
 			}
 			curaddr += sgsize;
 			buflen -= sgsize;
 		}
 		CTR1(KTR_BUSDMA, "pagesneeded= %d", map->pagesneeded);
 	}
 }
 
 static void
 _bus_dmamap_count_pages(bus_dma_tag_t dmat, pmap_t pmap, bus_dmamap_t map,
     void *buf, bus_size_t buflen, int flags)
 {
 	vm_offset_t vaddr;
 	vm_offset_t vendaddr;
 	bus_addr_t paddr;
 
 	if (map->pagesneeded == 0) {
 		CTR5(KTR_BUSDMA, "lowaddr= %d, boundary= %d, alignment= %d"
 		    " map= %p, pagesneeded= %d",
 		    dmat->lowaddr, dmat->boundary, dmat->alignment,
 		    map, map->pagesneeded);
 		/*
 		 * Count the number of bounce pages
 		 * needed in order to complete this transfer
 		 */
 		vaddr = (vm_offset_t)buf;
 		vendaddr = (vm_offset_t)buf + buflen;
 
 		while (vaddr < vendaddr) {
 			if (__predict_true(pmap == kernel_pmap))
 				paddr = pmap_kextract(vaddr);
 			else
 				paddr = pmap_extract(pmap, vaddr);
 			if (must_bounce(dmat, map, paddr,
 			    min(vendaddr - vaddr, (PAGE_SIZE - ((vm_offset_t)vaddr &
 			    PAGE_MASK)))) != 0) {
 				map->pagesneeded++;
 			}
 			vaddr += (PAGE_SIZE - ((vm_offset_t)vaddr & PAGE_MASK));
 		}
 		CTR1(KTR_BUSDMA, "pagesneeded= %d", map->pagesneeded);
 	}
 }
 
 static int
 _bus_dmamap_reserve_pages(bus_dma_tag_t dmat, bus_dmamap_t map, int flags)
 {
 
 	/* Reserve Necessary Bounce Pages */
 	mtx_lock(&bounce_lock);
 	if (flags & BUS_DMA_NOWAIT) {
 		if (reserve_bounce_pages(dmat, map, 0) != 0) {
 			map->pagesneeded = 0;
 			mtx_unlock(&bounce_lock);
 			return (ENOMEM);
 		}
 	} else {
 		if (reserve_bounce_pages(dmat, map, 1) != 0) {
 			/* Queue us for resources */
 			STAILQ_INSERT_TAIL(&bounce_map_waitinglist, map, links);
 			mtx_unlock(&bounce_lock);
 			return (EINPROGRESS);
 		}
 	}
 	mtx_unlock(&bounce_lock);
 
 	return (0);
 }
 
 /*
  * Add a single contiguous physical range to the segment list.
  */
 static int
 _bus_dmamap_addseg(bus_dma_tag_t dmat, bus_dmamap_t map, bus_addr_t curaddr,
     bus_size_t sgsize, bus_dma_segment_t *segs, int *segp)
 {
 	bus_addr_t baddr, bmask;
 	int seg;
 
 	/*
 	 * Make sure we don't cross any boundaries.
 	 */
 	bmask = ~(dmat->boundary - 1);
 	if (dmat->boundary > 0) {
 		baddr = (curaddr + dmat->boundary) & bmask;
 		if (sgsize > (baddr - curaddr))
 			sgsize = (baddr - curaddr);
 	}
 
 	/*
 	 * Insert chunk into a segment, coalescing with
 	 * previous segment if possible.
 	 */
 	seg = *segp;
 	if (seg == -1) {
 		seg = 0;
 		segs[seg].ds_addr = curaddr;
 		segs[seg].ds_len = sgsize;
 	} else {
 		if (curaddr == segs[seg].ds_addr + segs[seg].ds_len &&
 		    (segs[seg].ds_len + sgsize) <= dmat->maxsegsz &&
 		    (dmat->boundary == 0 ||
 		    (segs[seg].ds_addr & bmask) == (curaddr & bmask)))
 			segs[seg].ds_len += sgsize;
 		else {
 			if (++seg >= dmat->nsegments)
 				return (0);
 			segs[seg].ds_addr = curaddr;
 			segs[seg].ds_len = sgsize;
 		}
 	}
 	*segp = seg;
 	return (sgsize);
 }
 
 /*
  * Utility function to load a physical buffer.  segp contains
  * the starting segment on entrace, and the ending segment on exit.
  */
 int
 _bus_dmamap_load_phys(bus_dma_tag_t dmat, bus_dmamap_t map, vm_paddr_t buf,
     bus_size_t buflen, int flags, bus_dma_segment_t *segs, int *segp)
 {
 	bus_addr_t curaddr;
 	bus_addr_t sl_end = 0;
 	bus_size_t sgsize;
 	struct sync_list *sl;
 	int error;
 
 	if (segs == NULL)
 		segs = map->segments;
 
 	counter_u64_add(maploads_total, 1);
 	counter_u64_add(maploads_physmem, 1);
 
 	if (might_bounce(dmat, map, (bus_addr_t)buf, buflen)) {
 		_bus_dmamap_count_phys(dmat, map, buf, buflen, flags);
 		if (map->pagesneeded != 0) {
 			counter_u64_add(maploads_bounced, 1);
 			error = _bus_dmamap_reserve_pages(dmat, map, flags);
 			if (error)
 				return (error);
 		}
 	}
 
 	sl = map->slist + map->sync_count - 1;
 
 	while (buflen > 0) {
 		curaddr = buf;
 		sgsize = MIN(buflen, dmat->maxsegsz);
 		if (map->pagesneeded != 0 && must_bounce(dmat, map, curaddr,
 		    sgsize)) {
 			sgsize = MIN(sgsize, PAGE_SIZE - (curaddr & PAGE_MASK));
 			curaddr = add_bounce_page(dmat, map, 0, curaddr,
 			    sgsize);
 		} else if ((dmat->flags & BUS_DMA_COHERENT) == 0) {
 			if (map->sync_count > 0)
 				sl_end = sl->paddr + sl->datacount;
 
 			if (map->sync_count == 0 || curaddr != sl_end) {
 				if (++map->sync_count > dmat->nsegments)
 					break;
 				sl++;
 				sl->vaddr = 0;
 				sl->paddr = curaddr;
 				sl->datacount = sgsize;
 				sl->pages = PHYS_TO_VM_PAGE(curaddr);
 				KASSERT(sl->pages != NULL,
 				    ("%s: page at PA:0x%08lx is not in "
 				    "vm_page_array", __func__, curaddr));
 			} else
 				sl->datacount += sgsize;
 		}
 		sgsize = _bus_dmamap_addseg(dmat, map, curaddr, sgsize, segs,
 		    segp);
 		if (sgsize == 0)
 			break;
 		buf += sgsize;
 		buflen -= sgsize;
 	}
 
 	/*
 	 * Did we fit?
 	 */
 	if (buflen != 0) {
 		bus_dmamap_unload(dmat, map);
 		return (EFBIG); /* XXX better return value here? */
 	}
 	return (0);
 }
 
 int
 _bus_dmamap_load_ma(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct vm_page **ma, bus_size_t tlen, int ma_offs, int flags,
     bus_dma_segment_t *segs, int *segp)
 {
 
 	return (bus_dmamap_load_ma_triv(dmat, map, ma, tlen, ma_offs, flags,
 	    segs, segp));
 }
 
 /*
  * Utility function to load a linear buffer.  segp contains
  * the starting segment on entrance, and the ending segment on exit.
  */
 int
 _bus_dmamap_load_buffer(bus_dma_tag_t dmat, bus_dmamap_t map, void *buf,
     bus_size_t buflen, pmap_t pmap, int flags, bus_dma_segment_t *segs,
     int *segp)
 {
 	bus_size_t sgsize;
 	bus_addr_t curaddr;
 	bus_addr_t sl_pend = 0;
 	vm_offset_t kvaddr, vaddr, sl_vend = 0;
 	struct sync_list *sl;
 	int error;
 
 	counter_u64_add(maploads_total, 1);
 	if (map->flags & DMAMAP_COHERENT)
 		counter_u64_add(maploads_coherent, 1);
 	if (map->flags & DMAMAP_DMAMEM_ALLOC)
 		counter_u64_add(maploads_dmamem, 1);
 
 	if (segs == NULL)
 		segs = map->segments;
 
 	if (flags & BUS_DMA_LOAD_MBUF) {
 		counter_u64_add(maploads_mbuf, 1);
 		map->flags |= DMAMAP_MBUF;
 	}
 
 	if (might_bounce(dmat, map, (bus_addr_t)buf, buflen)) {
 		_bus_dmamap_count_pages(dmat, pmap, map, buf, buflen, flags);
 		if (map->pagesneeded != 0) {
 			counter_u64_add(maploads_bounced, 1);
 			error = _bus_dmamap_reserve_pages(dmat, map, flags);
 			if (error)
 				return (error);
 		}
 	}
 
 	sl = map->slist + map->sync_count - 1;
 	vaddr = (vm_offset_t)buf;
 
 	while (buflen > 0) {
 		/*
 		 * Get the physical address for this segment.
 		 */
 		if (__predict_true(pmap == kernel_pmap)) {
 			curaddr = pmap_kextract(vaddr);
 			kvaddr = vaddr;
 		} else {
 			curaddr = pmap_extract(pmap, vaddr);
 			kvaddr = 0;
 		}
 
 		/*
 		 * Compute the segment size, and adjust counts.
 		 */
 		sgsize = PAGE_SIZE - (curaddr & PAGE_MASK);
 		if (sgsize > dmat->maxsegsz)
 			sgsize = dmat->maxsegsz;
 		if (buflen < sgsize)
 			sgsize = buflen;
 
 		if (map->pagesneeded != 0 && must_bounce(dmat, map, curaddr,
 		    sgsize)) {
 			curaddr = add_bounce_page(dmat, map, kvaddr, curaddr,
 			    sgsize);
 		} else if ((dmat->flags & BUS_DMA_COHERENT) == 0) {
 			if (map->sync_count > 0) {
 				sl_pend = sl->paddr + sl->datacount;
 				sl_vend = sl->vaddr + sl->datacount;
 			}
 
 			if (map->sync_count == 0 ||
 			    (kvaddr != 0 && kvaddr != sl_vend) ||
 			    (curaddr != sl_pend)) {
 				if (++map->sync_count > dmat->nsegments)
 					goto cleanup;
 				sl++;
 				sl->vaddr = kvaddr;
 				sl->paddr = curaddr;
 				if (kvaddr != 0) {
 					sl->pages = NULL;
 				} else {
 					sl->pages = PHYS_TO_VM_PAGE(curaddr);
 					KASSERT(sl->pages != NULL,
 					    ("%s: page at PA:0x%08lx is not "
 					    "in vm_page_array", __func__,
 					    curaddr));
 				}
 				sl->datacount = sgsize;
 			} else
 				sl->datacount += sgsize;
 		}
 		sgsize = _bus_dmamap_addseg(dmat, map, curaddr, sgsize, segs,
 		    segp);
 		if (sgsize == 0)
 			break;
 		vaddr += sgsize;
 		buflen -= sgsize;
 	}
 
 cleanup:
 	/*
 	 * Did we fit?
 	 */
 	if (buflen != 0) {
 		bus_dmamap_unload(dmat, map);
 		return (EFBIG); /* XXX better return value here? */
 	}
 	return (0);
 }
 
 void
 _bus_dmamap_waitok(bus_dma_tag_t dmat, bus_dmamap_t map, struct memdesc *mem,
     bus_dmamap_callback_t *callback, void *callback_arg)
 {
 
 	map->mem = *mem;
 	map->dmat = dmat;
 	map->callback = callback;
 	map->callback_arg = callback_arg;
 }
 
 bus_dma_segment_t *
 _bus_dmamap_complete(bus_dma_tag_t dmat, bus_dmamap_t map,
     bus_dma_segment_t *segs, int nsegs, int error)
 {
 
 	if (segs == NULL)
 		segs = map->segments;
 	return (segs);
 }
 
 /*
  * Release the mapping held by map.
  */
 void
 bus_dmamap_unload(bus_dma_tag_t dmat, bus_dmamap_t map)
 {
 	struct bounce_page *bpage;
 	struct bounce_zone *bz;
 
 	if ((bz = dmat->bounce_zone) != NULL) {
 		while ((bpage = STAILQ_FIRST(&map->bpages)) != NULL) {
 			STAILQ_REMOVE_HEAD(&map->bpages, links);
 			free_bounce_page(dmat, bpage);
 		}
 
 		bz = dmat->bounce_zone;
 		bz->free_bpages += map->pagesreserved;
 		bz->reserved_bpages -= map->pagesreserved;
 		map->pagesreserved = 0;
 		map->pagesneeded = 0;
 	}
 	map->sync_count = 0;
 	map->flags &= ~DMAMAP_MBUF;
 }
 
 static void
 dma_preread_safe(vm_offset_t va, vm_paddr_t pa, vm_size_t size)
 {
 	/*
 	 * Write back any partial cachelines immediately before and
 	 * after the DMA region.  We don't need to round the address
 	 * down to the nearest cacheline or specify the exact size,
 	 * as dcache_wb_poc() will do the rounding for us and works
 	 * at cacheline granularity.
 	 */
 	if (va & BUSDMA_DCACHE_MASK)
 		dcache_wb_poc(va, pa, 1);
 	if ((va + size) & BUSDMA_DCACHE_MASK)
 		dcache_wb_poc(va + size, pa + size, 1);
 
 	dcache_inv_poc_dma(va, pa, size);
 }
 
 static void
 dma_dcache_sync(struct sync_list *sl, bus_dmasync_op_t op)
 {
 	uint32_t len, offset;
 	vm_page_t m;
 	vm_paddr_t pa;
 	vm_offset_t va, tempva;
 	bus_size_t size;
 
 	offset = sl->paddr & PAGE_MASK;
 	m = sl->pages;
 	size = sl->datacount;
 	pa = sl->paddr;
 
 	for ( ; size != 0; size -= len, pa += len, offset = 0, ++m) {
 		tempva = 0;
 		if (sl->vaddr == 0) {
 			len = min(PAGE_SIZE - offset, size);
 			tempva = pmap_quick_enter_page(m);
 			va = tempva | offset;
 			KASSERT(pa == (VM_PAGE_TO_PHYS(m) | offset),
 			    ("unexpected vm_page_t phys: 0x%08x != 0x%08x",
 			    VM_PAGE_TO_PHYS(m) | offset, pa));
 		} else {
 			len = sl->datacount;
 			va = sl->vaddr;
 		}
 
 		switch (op) {
 		case BUS_DMASYNC_PREWRITE:
 		case BUS_DMASYNC_PREWRITE | BUS_DMASYNC_PREREAD:
 			dcache_wb_poc(va, pa, len);
 			break;
 		case BUS_DMASYNC_PREREAD:
 			/*
 			 * An mbuf may start in the middle of a cacheline. There
 			 * will be no cpu writes to the beginning of that line
 			 * (which contains the mbuf header) while dma is in
 			 * progress.  Handle that case by doing a writeback of
 			 * just the first cacheline before invalidating the
 			 * overall buffer.  Any mbuf in a chain may have this
 			 * misalignment.  Buffers which are not mbufs bounce if
 			 * they are not aligned to a cacheline.
 			 */
 			dma_preread_safe(va, pa, len);
 			break;
 		case BUS_DMASYNC_POSTREAD:
 		case BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE:
 			dcache_inv_poc(va, pa, len);
 			break;
 		default:
 			panic("unsupported combination of sync operations: "
                               "0x%08x\n", op);
 		}
 
 		if (tempva != 0)
 			pmap_quick_remove_page(tempva);
 	}
 }
 
 void
 bus_dmamap_sync(bus_dma_tag_t dmat, bus_dmamap_t map, bus_dmasync_op_t op)
 {
 	struct bounce_page *bpage;
 	struct sync_list *sl, *end;
 	vm_offset_t datavaddr, tempvaddr;
 
 	if (op == BUS_DMASYNC_POSTWRITE)
 		return;
 
 	/*
 	 * If the buffer was from user space, it is possible that this is not
 	 * the same vm map, especially on a POST operation.  It's not clear that
 	 * dma on userland buffers can work at all right now.  To be safe, until
 	 * we're able to test direct userland dma, panic on a map mismatch.
 	 */
 	if ((bpage = STAILQ_FIRST(&map->bpages)) != NULL) {
 		CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x op 0x%x "
 		    "performing bounce", __func__, dmat, dmat->flags, op);
 
 		/*
 		 * For PREWRITE do a writeback.  Clean the caches from the
 		 * innermost to the outermost levels.
 		 */
 		if (op & BUS_DMASYNC_PREWRITE) {
 			while (bpage != NULL) {
 				tempvaddr = 0;
 				datavaddr = bpage->datavaddr;
 				if (datavaddr == 0) {
 					tempvaddr = pmap_quick_enter_page(
 					    bpage->datapage);
 					datavaddr = tempvaddr | bpage->dataoffs;
 				}
 				bcopy((void *)datavaddr, (void *)bpage->vaddr,
 				    bpage->datacount);
 				if (tempvaddr != 0)
 					pmap_quick_remove_page(tempvaddr);
 				if ((dmat->flags & BUS_DMA_COHERENT) == 0)
 					dcache_wb_poc(bpage->vaddr,
 					    bpage->busaddr, bpage->datacount);
 				bpage = STAILQ_NEXT(bpage, links);
 			}
 			dmat->bounce_zone->total_bounced++;
 		}
 
 		/*
 		 * Do an invalidate for PREREAD unless a writeback was already
 		 * done above due to PREWRITE also being set.  The reason for a
 		 * PREREAD invalidate is to prevent dirty lines currently in the
 		 * cache from being evicted during the DMA.  If a writeback was
 		 * done due to PREWRITE also being set there will be no dirty
 		 * lines and the POSTREAD invalidate handles the rest. The
 		 * invalidate is done from the innermost to outermost level. If
 		 * L2 were done first, a dirty cacheline could be automatically
 		 * evicted from L1 before we invalidated it, re-dirtying the L2.
 		 */
 		if ((op & BUS_DMASYNC_PREREAD) && !(op & BUS_DMASYNC_PREWRITE)) {
 			bpage = STAILQ_FIRST(&map->bpages);
 			while (bpage != NULL) {
 				if ((dmat->flags & BUS_DMA_COHERENT) == 0)
 					dcache_inv_poc_dma(bpage->vaddr,
 					    bpage->busaddr, bpage->datacount);
 				bpage = STAILQ_NEXT(bpage, links);
 			}
 		}
 
 		/*
 		 * Re-invalidate the caches on a POSTREAD, even though they were
 		 * already invalidated at PREREAD time.  Aggressive prefetching
 		 * due to accesses to other data near the dma buffer could have
 		 * brought buffer data into the caches which is now stale.  The
 		 * caches are invalidated from the outermost to innermost; the
 		 * prefetches could be happening right now, and if L1 were
 		 * invalidated first, stale L2 data could be prefetched into L1.
 		 */
 		if (op & BUS_DMASYNC_POSTREAD) {
 			while (bpage != NULL) {
 				if ((dmat->flags & BUS_DMA_COHERENT) == 0)
 					dcache_inv_poc(bpage->vaddr,
 					    bpage->busaddr, bpage->datacount);
 				tempvaddr = 0;
 				datavaddr = bpage->datavaddr;
 				if (datavaddr == 0) {
 					tempvaddr = pmap_quick_enter_page(
 					    bpage->datapage);
 					datavaddr = tempvaddr | bpage->dataoffs;
 				}
 				bcopy((void *)bpage->vaddr, (void *)datavaddr,
 				    bpage->datacount);
 				if (tempvaddr != 0)
 					pmap_quick_remove_page(tempvaddr);
 				bpage = STAILQ_NEXT(bpage, links);
 			}
 			dmat->bounce_zone->total_bounced++;
 		}
 	}
 
 	/*
 	 * For COHERENT memory no cache maintenance is necessary, but ensure all
 	 * writes have reached memory for the PREWRITE case.  No action is
 	 * needed for a PREREAD without PREWRITE also set, because that would
 	 * imply that the cpu had written to the COHERENT buffer and expected
 	 * the dma device to see that change, and by definition a PREWRITE sync
 	 * is required to make that happen.
 	 */
 	if (map->flags & DMAMAP_COHERENT) {
 		if (op & BUS_DMASYNC_PREWRITE) {
 			dsb();
 			if ((dmat->flags & BUS_DMA_COHERENT) == 0)
 				cpu_l2cache_drain_writebuf();
 		}
 		return;
 	}
 
 	/*
 	 * Cache maintenance for normal (non-COHERENT non-bounce) buffers.  All
 	 * the comments about the sequences for flushing cache levels in the
 	 * bounce buffer code above apply here as well.  In particular, the fact
 	 * that the sequence is inner-to-outer for PREREAD invalidation and
 	 * outer-to-inner for POSTREAD invalidation is not a mistake.
 	 */
 	if (map->sync_count != 0) {
 		sl = &map->slist[0];
 		end = &map->slist[map->sync_count];
 		CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x op 0x%x "
 		    "performing sync", __func__, dmat, dmat->flags, op);
 
 		for ( ; sl != end; ++sl)
 			dma_dcache_sync(sl, op);
 	}
 }
 
 static void
 init_bounce_pages(void *dummy __unused)
 {
 
 	total_bpages = 0;
 	STAILQ_INIT(&bounce_zone_list);
 	STAILQ_INIT(&bounce_map_waitinglist);
 	STAILQ_INIT(&bounce_map_callbacklist);
 	mtx_init(&bounce_lock, "bounce pages lock", NULL, MTX_DEF);
 }
 SYSINIT(bpages, SI_SUB_LOCK, SI_ORDER_ANY, init_bounce_pages, NULL);
 
 static struct sysctl_ctx_list *
 busdma_sysctl_tree(struct bounce_zone *bz)
 {
 
 	return (&bz->sysctl_tree);
 }
 
 static struct sysctl_oid *
 busdma_sysctl_tree_top(struct bounce_zone *bz)
 {
 
 	return (bz->sysctl_tree_top);
 }
 
 static int
 alloc_bounce_zone(bus_dma_tag_t dmat)
 {
 	struct bounce_zone *bz;
 
 	/* Check to see if we already have a suitable zone */
 	STAILQ_FOREACH(bz, &bounce_zone_list, links) {
 		if ((dmat->alignment <= bz->alignment) &&
 		    (dmat->lowaddr >= bz->lowaddr)) {
 			dmat->bounce_zone = bz;
 			return (0);
 		}
 	}
 
 	if ((bz = (struct bounce_zone *)malloc(sizeof(*bz), M_BUSDMA,
 	    M_NOWAIT | M_ZERO)) == NULL)
 		return (ENOMEM);
 
 	STAILQ_INIT(&bz->bounce_page_list);
 	bz->free_bpages = 0;
 	bz->reserved_bpages = 0;
 	bz->active_bpages = 0;
 	bz->lowaddr = dmat->lowaddr;
 	bz->alignment = MAX(dmat->alignment, PAGE_SIZE);
 	bz->map_count = 0;
 	snprintf(bz->zoneid, 8, "zone%d", busdma_zonecount);
 	busdma_zonecount++;
 	snprintf(bz->lowaddrid, 18, "%#jx", (uintmax_t)bz->lowaddr);
 	STAILQ_INSERT_TAIL(&bounce_zone_list, bz, links);
 	dmat->bounce_zone = bz;
 
 	sysctl_ctx_init(&bz->sysctl_tree);
 	bz->sysctl_tree_top = SYSCTL_ADD_NODE(&bz->sysctl_tree,
 	    SYSCTL_STATIC_CHILDREN(_hw_busdma), OID_AUTO, bz->zoneid,
 	    CTLFLAG_RD | CTLFLAG_MPSAFE, 0, "");
 	if (bz->sysctl_tree_top == NULL) {
 		sysctl_ctx_free(&bz->sysctl_tree);
 		return (0);	/* XXX error code? */
 	}
 
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_bpages", CTLFLAG_RD, &bz->total_bpages, 0,
 	    "Total bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "free_bpages", CTLFLAG_RD, &bz->free_bpages, 0,
 	    "Free bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "reserved_bpages", CTLFLAG_RD, &bz->reserved_bpages, 0,
 	    "Reserved bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "active_bpages", CTLFLAG_RD, &bz->active_bpages, 0,
 	    "Active bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_bounced", CTLFLAG_RD, &bz->total_bounced, 0,
 	    "Total bounce requests (pages bounced)");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_deferred", CTLFLAG_RD, &bz->total_deferred, 0,
 	    "Total bounce requests that were deferred");
 	SYSCTL_ADD_STRING(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "lowaddr", CTLFLAG_RD, bz->lowaddrid, 0, "");
 	SYSCTL_ADD_ULONG(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "alignment", CTLFLAG_RD, &bz->alignment, "");
 
 	return (0);
 }
 
 static int
 alloc_bounce_pages(bus_dma_tag_t dmat, u_int numpages)
 {
 	struct bounce_zone *bz;
 	int count;
 
 	bz = dmat->bounce_zone;
 	count = 0;
 	while (numpages > 0) {
 		struct bounce_page *bpage;
 
 		bpage = (struct bounce_page *)malloc(sizeof(*bpage), M_BUSDMA,
 		    M_NOWAIT | M_ZERO);
 
 		if (bpage == NULL)
 			break;
 		bpage->vaddr = (vm_offset_t)contigmalloc(PAGE_SIZE, M_BOUNCE,
 		    M_NOWAIT, 0ul, bz->lowaddr, PAGE_SIZE, 0);
 		if (bpage->vaddr == 0) {
 			free(bpage, M_BUSDMA);
 			break;
 		}
 		bpage->busaddr = pmap_kextract(bpage->vaddr);
 		mtx_lock(&bounce_lock);
 		STAILQ_INSERT_TAIL(&bz->bounce_page_list, bpage, links);
 		total_bpages++;
 		bz->total_bpages++;
 		bz->free_bpages++;
 		mtx_unlock(&bounce_lock);
 		count++;
 		numpages--;
 	}
 	return (count);
 }
 
 static int
 reserve_bounce_pages(bus_dma_tag_t dmat, bus_dmamap_t map, int commit)
 {
 	struct bounce_zone *bz;
 	int pages;
 
 	mtx_assert(&bounce_lock, MA_OWNED);
 	bz = dmat->bounce_zone;
 	pages = MIN(bz->free_bpages, map->pagesneeded - map->pagesreserved);
 	if (commit == 0 && map->pagesneeded > (map->pagesreserved + pages))
 		return (map->pagesneeded - (map->pagesreserved + pages));
 	bz->free_bpages -= pages;
 	bz->reserved_bpages += pages;
 	map->pagesreserved += pages;
 	pages = map->pagesneeded - map->pagesreserved;
 
 	return (pages);
 }
 
 static bus_addr_t
 add_bounce_page(bus_dma_tag_t dmat, bus_dmamap_t map, vm_offset_t vaddr,
     bus_addr_t addr, bus_size_t size)
 {
 	struct bounce_zone *bz;
 	struct bounce_page *bpage;
 
 	KASSERT(dmat->bounce_zone != NULL, ("no bounce zone in dma tag"));
 	KASSERT(map != NULL, ("add_bounce_page: bad map %p", map));
 
 	bz = dmat->bounce_zone;
 	if (map->pagesneeded == 0)
 		panic("add_bounce_page: map doesn't need any pages");
 	map->pagesneeded--;
 
 	if (map->pagesreserved == 0)
 		panic("add_bounce_page: map doesn't need any pages");
 	map->pagesreserved--;
 
 	mtx_lock(&bounce_lock);
 	bpage = STAILQ_FIRST(&bz->bounce_page_list);
 	if (bpage == NULL)
 		panic("add_bounce_page: free page list is empty");
 
 	STAILQ_REMOVE_HEAD(&bz->bounce_page_list, links);
 	bz->reserved_bpages--;
 	bz->active_bpages++;
 	mtx_unlock(&bounce_lock);
 
 	if (dmat->flags & BUS_DMA_KEEP_PG_OFFSET) {
 		/* Page offset needs to be preserved. */
 		bpage->vaddr |= addr & PAGE_MASK;
 		bpage->busaddr |= addr & PAGE_MASK;
 	}
 	bpage->datavaddr = vaddr;
 	bpage->datapage = PHYS_TO_VM_PAGE(addr);
 	bpage->dataoffs = addr & PAGE_MASK;
 	bpage->datacount = size;
 	STAILQ_INSERT_TAIL(&(map->bpages), bpage, links);
 	return (bpage->busaddr);
 }
 
 static void
 free_bounce_page(bus_dma_tag_t dmat, struct bounce_page *bpage)
 {
 	struct bus_dmamap *map;
 	struct bounce_zone *bz;
 
 	bz = dmat->bounce_zone;
 	bpage->datavaddr = 0;
 	bpage->datacount = 0;
 	if (dmat->flags & BUS_DMA_KEEP_PG_OFFSET) {
 		/*
 		 * Reset the bounce page to start at offset 0.  Other uses
 		 * of this bounce page may need to store a full page of
 		 * data and/or assume it starts on a page boundary.
 		 */
 		bpage->vaddr &= ~PAGE_MASK;
 		bpage->busaddr &= ~PAGE_MASK;
 	}
 
 	mtx_lock(&bounce_lock);
 	STAILQ_INSERT_HEAD(&bz->bounce_page_list, bpage, links);
 	bz->free_bpages++;
 	bz->active_bpages--;
 	if ((map = STAILQ_FIRST(&bounce_map_waitinglist)) != NULL) {
 		if (reserve_bounce_pages(map->dmat, map, 1) == 0) {
 			STAILQ_REMOVE_HEAD(&bounce_map_waitinglist, links);
 			STAILQ_INSERT_TAIL(&bounce_map_callbacklist,
 			    map, links);
 			busdma_swi_pending = 1;
 			bz->total_deferred++;
 			swi_sched(vm_ih, 0);
 		}
 	}
 	mtx_unlock(&bounce_lock);
 }
 
 void
 busdma_swi(void)
 {
 	bus_dma_tag_t dmat;
 	struct bus_dmamap *map;
 
 	mtx_lock(&bounce_lock);
 	while ((map = STAILQ_FIRST(&bounce_map_callbacklist)) != NULL) {
 		STAILQ_REMOVE_HEAD(&bounce_map_callbacklist, links);
 		mtx_unlock(&bounce_lock);
 		dmat = map->dmat;
 		dmat->lockfunc(dmat->lockfuncarg, BUS_DMA_LOCK);
 		bus_dmamap_load_mem(map->dmat, map, &map->mem, map->callback,
 		    map->callback_arg, BUS_DMA_WAITOK);
 		dmat->lockfunc(dmat->lockfuncarg, BUS_DMA_UNLOCK);
 		mtx_lock(&bounce_lock);
 	}
 	mtx_unlock(&bounce_lock);
 }
Index: head/sys/arm64/arm64/busdma_machdep.c
===================================================================
--- head/sys/arm64/arm64/busdma_machdep.c	(revision 365705)
+++ head/sys/arm64/arm64/busdma_machdep.c	(revision 365706)
@@ -1,285 +1,254 @@
 /*-
  * Copyright (c) 1997, 1998 Justin T. Gibbs.
  * Copyright (c) 2013, 2015 The FreeBSD Foundation
  * All rights reserved.
  *
  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
  * under sponsorship from the FreeBSD Foundation.
  *
  * Portions of this software were developed by Semihalf
  * under sponsorship of the FreeBSD Foundation.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions, and the following disclaimer,
  *    without modification, immediately at the beginning of the file.
  * 2. The name of the author may not be used to endorse or promote products
  *    derived from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/malloc.h>
 #include <sys/bus.h>
 #include <sys/kernel.h>
 #include <sys/ktr.h>
 #include <sys/lock.h>
 #include <sys/memdesc.h>
 #include <sys/mutex.h>
 #include <sys/uio.h>
 #include <vm/vm.h>
 #include <vm/vm_extern.h>
 #include <vm/pmap.h>
 
 #include <machine/bus.h>
 #include <arm64/include/bus_dma_impl.h>
 
 /*
  * Convenience function for manipulating driver locks from busdma (during
  * busdma_swi, for example).  Drivers that don't provide their own locks
  * should specify &Giant to dmat->lockfuncarg.  Drivers that use their own
  * non-mutex locking scheme don't have to use this at all.
  */
 void
 busdma_lock_mutex(void *arg, bus_dma_lock_op_t op)
 {
 	struct mtx *dmtx;
 
 	dmtx = (struct mtx *)arg;
 	switch (op) {
 	case BUS_DMA_LOCK:
 		mtx_lock(dmtx);
 		break;
 	case BUS_DMA_UNLOCK:
 		mtx_unlock(dmtx);
 		break;
 	default:
 		panic("Unknown operation 0x%x for busdma_lock_mutex!", op);
 	}
 }
 
 /*
  * dflt_lock should never get called.  It gets put into the dma tag when
  * lockfunc == NULL, which is only valid if the maps that are associated
  * with the tag are meant to never be defered.
  * XXX Should have a way to identify which driver is responsible here.
  */
 void
 bus_dma_dflt_lock(void *arg, bus_dma_lock_op_t op)
 {
 
 	panic("driver error: busdma dflt_lock called");
 }
 
 /*
  * Return true if a match is made.
  *
  * To find a match walk the chain of bus_dma_tag_t's looking for 'paddr'.
  *
  * If paddr is within the bounds of the dma tag then call the filter callback
  * to check for a match, if there is no filter callback then assume a match.
  */
 int
 bus_dma_run_filter(struct bus_dma_tag_common *tc, bus_addr_t paddr)
 {
 	int retval;
 
 	retval = 0;
 	do {
 		if (((paddr > tc->lowaddr && paddr <= tc->highaddr) ||
 		    ((paddr & (tc->alignment - 1)) != 0)) &&
 		    (tc->filter == NULL ||
 		    (*tc->filter)(tc->filterarg, paddr) != 0))
 			retval = 1;
 
 		tc = tc->parent;		
 	} while (retval == 0 && tc != NULL);
 	return (retval);
 }
 
 int
 common_bus_dma_tag_create(struct bus_dma_tag_common *parent,
     bus_size_t alignment, bus_addr_t boundary, bus_addr_t lowaddr,
     bus_addr_t highaddr, bus_dma_filter_t *filter, void *filterarg,
     bus_size_t maxsize, int nsegments, bus_size_t maxsegsz, int flags,
     bus_dma_lock_t *lockfunc, void *lockfuncarg, size_t sz, void **dmat)
 {
 	void *newtag;
 	struct bus_dma_tag_common *common;
 
 	KASSERT(sz >= sizeof(struct bus_dma_tag_common), ("sz"));
 	/* Return a NULL tag on failure */
 	*dmat = NULL;
 	/* Basic sanity checking */
 	if (boundary != 0 && boundary < maxsegsz)
 		maxsegsz = boundary;
 	if (maxsegsz == 0)
 		return (EINVAL);
 
 	newtag = malloc(sz, M_DEVBUF, M_ZERO | M_NOWAIT);
 	if (newtag == NULL) {
 		CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 		    __func__, newtag, 0, ENOMEM);
 		return (ENOMEM);
 	}
 
 	common = newtag;
 	common->impl = &bus_dma_bounce_impl;
 	common->parent = parent;
 	common->alignment = alignment;
 	common->boundary = boundary;
 	common->lowaddr = trunc_page((vm_paddr_t)lowaddr) + (PAGE_SIZE - 1);
 	common->highaddr = trunc_page((vm_paddr_t)highaddr) + (PAGE_SIZE - 1);
 	common->filter = filter;
 	common->filterarg = filterarg;
 	common->maxsize = maxsize;
 	common->nsegments = nsegments;
 	common->maxsegsz = maxsegsz;
 	common->flags = flags;
 	common->ref_count = 1; /* Count ourself */
 	if (lockfunc != NULL) {
 		common->lockfunc = lockfunc;
 		common->lockfuncarg = lockfuncarg;
 	} else {
 		common->lockfunc = bus_dma_dflt_lock;
 		common->lockfuncarg = NULL;
 	}
 
 	/* Take into account any restrictions imposed by our parent tag */
 	if (parent != NULL) {
 		common->impl = parent->impl;
 		common->lowaddr = MIN(parent->lowaddr, common->lowaddr);
 		common->highaddr = MAX(parent->highaddr, common->highaddr);
 		if (common->boundary == 0)
 			common->boundary = parent->boundary;
 		else if (parent->boundary != 0) {
 			common->boundary = MIN(parent->boundary,
 			    common->boundary);
 		}
 		if (common->filter == NULL) {
 			/*
 			 * Short circuit looking at our parent directly
 			 * since we have encapsulated all of its information
 			 */
 			common->filter = parent->filter;
 			common->filterarg = parent->filterarg;
 			common->parent = parent->parent;
 		}
 		atomic_add_int(&parent->ref_count, 1);
 	}
 	*dmat = common;
 	return (0);
 }
 
 /*
  * Allocate a device specific dma_tag.
  */
 int
 bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
     bus_addr_t boundary, bus_addr_t lowaddr, bus_addr_t highaddr,
     bus_dma_filter_t *filter, void *filterarg, bus_size_t maxsize,
     int nsegments, bus_size_t maxsegsz, int flags, bus_dma_lock_t *lockfunc,
     void *lockfuncarg, bus_dma_tag_t *dmat)
 {
 	struct bus_dma_tag_common *tc;
 	int error;
 
 	if (parent == NULL) {
 		error = bus_dma_bounce_impl.tag_create(parent, alignment,
 		    boundary, lowaddr, highaddr, filter, filterarg, maxsize,
 		    nsegments, maxsegsz, flags, lockfunc, lockfuncarg, dmat);
 	} else {
 		tc = (struct bus_dma_tag_common *)parent;
 		error = tc->impl->tag_create(parent, alignment,
 		    boundary, lowaddr, highaddr, filter, filterarg, maxsize,
 		    nsegments, maxsegsz, flags, lockfunc, lockfuncarg, dmat);
 	}
 	return (error);
 }
 
 void
-bus_dma_template_init(bus_dma_tag_template_t *t, bus_dma_tag_t parent)
-{
-
-	if (t == NULL)
-		return;
-
-	t->parent = parent;
-	t->alignment = 1;
-	t->boundary = 0;
-	t->lowaddr = t->highaddr = BUS_SPACE_MAXADDR;
-	t->maxsize = t->maxsegsize = BUS_SPACE_MAXSIZE;
-	t->nsegments = BUS_SPACE_UNRESTRICTED;
-	t->lockfunc = NULL;
-	t->lockfuncarg = NULL;
-	t->flags = 0;
-}
-
-int
-bus_dma_template_tag(bus_dma_tag_template_t *t, bus_dma_tag_t *dmat)
-{
-
-	if (t == NULL || dmat == NULL)
-		return (EINVAL);
-
-	return (bus_dma_tag_create(t->parent, t->alignment, t->boundary,
-	    t->lowaddr, t->highaddr, NULL, NULL, t->maxsize,
-	    t->nsegments, t->maxsegsize, t->flags, t->lockfunc, t->lockfuncarg,
-	    dmat));
-}
-
-void
-bus_dma_template_clone(bus_dma_tag_template_t *t, bus_dma_tag_t dmat)
+bus_dma_template_clone(bus_dma_template_t *t, bus_dma_tag_t dmat)
 {
 	struct bus_dma_tag_common *common;
 
 	if (t == NULL || dmat == NULL)
 		return;
 
 	common = (struct bus_dma_tag_common *)dmat;
 
 	t->parent = (bus_dma_tag_t)common->parent;
 	t->alignment = common->alignment;
 	t->boundary = common->boundary;
 	t->lowaddr = common->lowaddr;
 	t->highaddr = common->highaddr;
 	t->maxsize = common->maxsize;
 	t->nsegments = common->nsegments;
 	t->maxsegsize = common->maxsegsz;
 	t->flags = common->flags;
 	t->lockfunc = common->lockfunc;
 	t->lockfuncarg = common->lockfuncarg;
 }
 
 int
 bus_dma_tag_destroy(bus_dma_tag_t dmat)
 {
 	struct bus_dma_tag_common *tc;
 
 	tc = (struct bus_dma_tag_common *)dmat;
 	return (tc->impl->tag_destroy(dmat));
 }
 
 int
 bus_dma_tag_set_domain(bus_dma_tag_t dmat, int domain)
 {
 
 	return (0);
 }
Index: head/sys/dev/mpr/mpr.c
===================================================================
--- head/sys/dev/mpr/mpr.c	(revision 365705)
+++ head/sys/dev/mpr/mpr.c	(revision 365706)
@@ -1,3985 +1,3981 @@
 /*-
  * Copyright (c) 2009 Yahoo! Inc.
  * Copyright (c) 2011-2015 LSI Corp.
  * Copyright (c) 2013-2016 Avago Technologies
  * Copyright 2000-2020 Broadcom Inc.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * Broadcom Inc. (LSI) MPT-Fusion Host Adapter FreeBSD
  *
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 /* Communications core for Avago Technologies (LSI) MPT3 */
 
 /* TODO Move headers to mprvar */
 #include <sys/types.h>
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/selinfo.h>
 #include <sys/lock.h>
 #include <sys/mutex.h>
 #include <sys/module.h>
 #include <sys/bus.h>
 #include <sys/conf.h>
 #include <sys/bio.h>
 #include <sys/malloc.h>
 #include <sys/uio.h>
 #include <sys/sysctl.h>
 #include <sys/smp.h>
 #include <sys/queue.h>
 #include <sys/kthread.h>
 #include <sys/taskqueue.h>
 #include <sys/endian.h>
 #include <sys/eventhandler.h>
 #include <sys/sbuf.h>
 #include <sys/priv.h>
 
 #include <machine/bus.h>
 #include <machine/resource.h>
 #include <sys/rman.h>
 #include <sys/proc.h>
 
 #include <dev/pci/pcivar.h>
 
 #include <cam/cam.h>
 #include <cam/cam_ccb.h>
 #include <cam/scsi/scsi_all.h>
 
 #include <dev/mpr/mpi/mpi2_type.h>
 #include <dev/mpr/mpi/mpi2.h>
 #include <dev/mpr/mpi/mpi2_ioc.h>
 #include <dev/mpr/mpi/mpi2_sas.h>
 #include <dev/mpr/mpi/mpi2_pci.h>
 #include <dev/mpr/mpi/mpi2_cnfg.h>
 #include <dev/mpr/mpi/mpi2_init.h>
 #include <dev/mpr/mpi/mpi2_tool.h>
 #include <dev/mpr/mpr_ioctl.h>
 #include <dev/mpr/mprvar.h>
 #include <dev/mpr/mpr_table.h>
 #include <dev/mpr/mpr_sas.h>
 
 static int mpr_diag_reset(struct mpr_softc *sc, int sleep_flag);
 static int mpr_init_queues(struct mpr_softc *sc);
 static void mpr_resize_queues(struct mpr_softc *sc);
 static int mpr_message_unit_reset(struct mpr_softc *sc, int sleep_flag);
 static int mpr_transition_operational(struct mpr_softc *sc);
 static int mpr_iocfacts_allocate(struct mpr_softc *sc, uint8_t attaching);
 static void mpr_iocfacts_free(struct mpr_softc *sc);
 static void mpr_startup(void *arg);
 static int mpr_send_iocinit(struct mpr_softc *sc);
 static int mpr_alloc_queues(struct mpr_softc *sc);
 static int mpr_alloc_hw_queues(struct mpr_softc *sc);
 static int mpr_alloc_replies(struct mpr_softc *sc);
 static int mpr_alloc_requests(struct mpr_softc *sc);
 static int mpr_alloc_nvme_prp_pages(struct mpr_softc *sc);
 static int mpr_attach_log(struct mpr_softc *sc);
 static __inline void mpr_complete_command(struct mpr_softc *sc,
     struct mpr_command *cm);
 static void mpr_dispatch_event(struct mpr_softc *sc, uintptr_t data,
     MPI2_EVENT_NOTIFICATION_REPLY *reply);
 static void mpr_config_complete(struct mpr_softc *sc, struct mpr_command *cm);
 static void mpr_periodic(void *);
 static int mpr_reregister_events(struct mpr_softc *sc);
 static void mpr_enqueue_request(struct mpr_softc *sc, struct mpr_command *cm);
 static int mpr_get_iocfacts(struct mpr_softc *sc, MPI2_IOC_FACTS_REPLY *facts);
 static int mpr_wait_db_ack(struct mpr_softc *sc, int timeout, int sleep_flag);
 static int mpr_debug_sysctl(SYSCTL_HANDLER_ARGS);
 static int mpr_dump_reqs(SYSCTL_HANDLER_ARGS);
 static void mpr_parse_debug(struct mpr_softc *sc, char *list);
 
 SYSCTL_NODE(_hw, OID_AUTO, mpr, CTLFLAG_RD | CTLFLAG_MPSAFE, 0,
     "MPR Driver Parameters");
 
 MALLOC_DEFINE(M_MPR, "mpr", "mpr driver memory");
 
 /*
  * Do a "Diagnostic Reset" aka a hard reset.  This should get the chip out of
  * any state and back to its initialization state machine.
  */
 static char mpt2_reset_magic[] = { 0x00, 0x0f, 0x04, 0x0b, 0x02, 0x07, 0x0d };
 
 /* 
  * Added this union to smoothly convert le64toh cm->cm_desc.Words.
  * Compiler only supports uint64_t to be passed as an argument.
  * Otherwise it will throw this error:
  * "aggregate value used where an integer was expected"
  */
 typedef union _reply_descriptor {
         u64 word;
         struct {
                 u32 low;
                 u32 high;
         } u;
 } reply_descriptor, request_descriptor;
 
 /* Rate limit chain-fail messages to 1 per minute */
 static struct timeval mpr_chainfail_interval = { 60, 0 };
 
 /* 
  * sleep_flag can be either CAN_SLEEP or NO_SLEEP.
  * If this function is called from process context, it can sleep
  * and there is no harm to sleep, in case if this fuction is called
  * from Interrupt handler, we can not sleep and need NO_SLEEP flag set.
  * based on sleep flags driver will call either msleep, pause or DELAY.
  * msleep and pause are of same variant, but pause is used when mpr_mtx
  * is not hold by driver.
  */
 static int
 mpr_diag_reset(struct mpr_softc *sc,int sleep_flag)
 {
 	uint32_t reg;
 	int i, error, tries = 0;
 	uint8_t first_wait_done = FALSE;
 
 	mpr_dprint(sc, MPR_INIT, "%s entered\n", __func__);
 
 	/* Clear any pending interrupts */
 	mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	/*
 	 * Force NO_SLEEP for threads prohibited to sleep
  	 * e.a Thread from interrupt handler are prohibited to sleep.
  	 */
 	if (curthread->td_no_sleeping)
 		sleep_flag = NO_SLEEP;
 
 	mpr_dprint(sc, MPR_INIT, "sequence start, sleep_flag=%d\n", sleep_flag);
 	/* Push the magic sequence */
 	error = ETIMEDOUT;
 	while (tries++ < 20) {
 		for (i = 0; i < sizeof(mpt2_reset_magic); i++)
 			mpr_regwrite(sc, MPI2_WRITE_SEQUENCE_OFFSET,
 			    mpt2_reset_magic[i]);
 
 		/* wait 100 msec */
 		if (mtx_owned(&sc->mpr_mtx) && sleep_flag == CAN_SLEEP)
 			msleep(&sc->msleep_fake_chan, &sc->mpr_mtx, 0,
 			    "mprdiag", hz/10);
 		else if (sleep_flag == CAN_SLEEP)
 			pause("mprdiag", hz/10);
 		else
 			DELAY(100 * 1000);
 
 		reg = mpr_regread(sc, MPI2_HOST_DIAGNOSTIC_OFFSET);
 		if (reg & MPI2_DIAG_DIAG_WRITE_ENABLE) {
 			error = 0;
 			break;
 		}
 	}
 	if (error) {
 		mpr_dprint(sc, MPR_INIT, "sequence failed, error=%d, exit\n",
 		    error);
 		return (error);
 	}
 
 	/* Send the actual reset.  XXX need to refresh the reg? */
 	reg |= MPI2_DIAG_RESET_ADAPTER;
 	mpr_dprint(sc, MPR_INIT, "sequence success, sending reset, reg= 0x%x\n",
 	    reg);
 	mpr_regwrite(sc, MPI2_HOST_DIAGNOSTIC_OFFSET, reg);
 
 	/* Wait up to 300 seconds in 50ms intervals */
 	error = ETIMEDOUT;
 	for (i = 0; i < 6000; i++) {
 		/*
 		 * Wait 50 msec. If this is the first time through, wait 256
 		 * msec to satisfy Diag Reset timing requirements.
 		 */
 		if (first_wait_done) {
 			if (mtx_owned(&sc->mpr_mtx) && sleep_flag == CAN_SLEEP)
 				msleep(&sc->msleep_fake_chan, &sc->mpr_mtx, 0,
 				    "mprdiag", hz/20);
 			else if (sleep_flag == CAN_SLEEP)
 				pause("mprdiag", hz/20);
 			else
 				DELAY(50 * 1000);
 		} else {
 			DELAY(256 * 1000);
 			first_wait_done = TRUE;
 		}
 		/*
 		 * Check for the RESET_ADAPTER bit to be cleared first, then
 		 * wait for the RESET state to be cleared, which takes a little
 		 * longer.
 		 */
 		reg = mpr_regread(sc, MPI2_HOST_DIAGNOSTIC_OFFSET);
 		if (reg & MPI2_DIAG_RESET_ADAPTER) {
 			continue;
 		}
 		reg = mpr_regread(sc, MPI2_DOORBELL_OFFSET);
 		if ((reg & MPI2_IOC_STATE_MASK) != MPI2_IOC_STATE_RESET) {
 			error = 0;
 			break;
 		}
 	}
 	if (error) {
 		mpr_dprint(sc, MPR_INIT, "reset failed, error= %d, exit\n",
 		    error);
 		return (error);
 	}
 
 	mpr_regwrite(sc, MPI2_WRITE_SEQUENCE_OFFSET, 0x0);
 	mpr_dprint(sc, MPR_INIT, "diag reset success, exit\n");
 
 	return (0);
 }
 
 static int
 mpr_message_unit_reset(struct mpr_softc *sc, int sleep_flag)
 {
 	int error;
 
 	MPR_FUNCTRACE(sc);
 
 	mpr_dprint(sc, MPR_INIT, "%s entered\n", __func__);
 
 	error = 0;
 	mpr_regwrite(sc, MPI2_DOORBELL_OFFSET,
 	    MPI2_FUNCTION_IOC_MESSAGE_UNIT_RESET <<
 	    MPI2_DOORBELL_FUNCTION_SHIFT);
 
 	if (mpr_wait_db_ack(sc, 5, sleep_flag) != 0) {
 		mpr_dprint(sc, MPR_INIT|MPR_FAULT,
 		    "Doorbell handshake failed\n");
 		error = ETIMEDOUT;
 	}
 
 	mpr_dprint(sc, MPR_INIT, "%s exit\n", __func__);
 	return (error);
 }
 
 static int
 mpr_transition_ready(struct mpr_softc *sc)
 {
 	uint32_t reg, state;
 	int error, tries = 0;
 	int sleep_flags;
 
 	MPR_FUNCTRACE(sc);
 	/* If we are in attach call, do not sleep */
 	sleep_flags = (sc->mpr_flags & MPR_FLAGS_ATTACH_DONE)
 	    ? CAN_SLEEP : NO_SLEEP;
 
 	error = 0;
 
 	mpr_dprint(sc, MPR_INIT, "%s entered, sleep_flags= %d\n",
 	    __func__, sleep_flags);
 
 	while (tries++ < 1200) {
 		reg = mpr_regread(sc, MPI2_DOORBELL_OFFSET);
 		mpr_dprint(sc, MPR_INIT, "  Doorbell= 0x%x\n", reg);
 
 		/*
 		 * Ensure the IOC is ready to talk.  If it's not, try
 		 * resetting it.
 		 */
 		if (reg & MPI2_DOORBELL_USED) {
 			mpr_dprint(sc, MPR_INIT, "  Not ready, sending diag "
 			    "reset\n");
 			mpr_diag_reset(sc, sleep_flags);
 			DELAY(50000);
 			continue;
 		}
 
 		/* Is the adapter owned by another peer? */
 		if ((reg & MPI2_DOORBELL_WHO_INIT_MASK) ==
 		    (MPI2_WHOINIT_PCI_PEER << MPI2_DOORBELL_WHO_INIT_SHIFT)) {
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT, "IOC is under the "
 			    "control of another peer host, aborting "
 			    "initialization.\n");
 			error = ENXIO;
 			break;
 		}
 		
 		state = reg & MPI2_IOC_STATE_MASK;
 		if (state == MPI2_IOC_STATE_READY) {
 			/* Ready to go! */
 			error = 0;
 			break;
 		} else if (state == MPI2_IOC_STATE_FAULT) {
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT, "IOC in fault "
 			    "state 0x%x, resetting\n",
 			    state & MPI2_DOORBELL_FAULT_CODE_MASK);
 			mpr_diag_reset(sc, sleep_flags);
 		} else if (state == MPI2_IOC_STATE_OPERATIONAL) {
 			/* Need to take ownership */
 			mpr_message_unit_reset(sc, sleep_flags);
 		} else if (state == MPI2_IOC_STATE_RESET) {
 			/* Wait a bit, IOC might be in transition */
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT,
 			    "IOC in unexpected reset state\n");
 		} else {
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT,
 			    "IOC in unknown state 0x%x\n", state);
 			error = EINVAL;
 			break;
 		}
 
 		/* Wait 50ms for things to settle down. */
 		DELAY(50000);
 	}
 
 	if (error)
 		mpr_dprint(sc, MPR_INIT|MPR_FAULT,
 		    "Cannot transition IOC to ready\n");
 	mpr_dprint(sc, MPR_INIT, "%s exit\n", __func__);
 	return (error);
 }
 
 static int
 mpr_transition_operational(struct mpr_softc *sc)
 {
 	uint32_t reg, state;
 	int error;
 
 	MPR_FUNCTRACE(sc);
 
 	error = 0;
 	reg = mpr_regread(sc, MPI2_DOORBELL_OFFSET);
 	mpr_dprint(sc, MPR_INIT, "%s entered, Doorbell= 0x%x\n", __func__, reg);
 
 	state = reg & MPI2_IOC_STATE_MASK;
 	if (state != MPI2_IOC_STATE_READY) {
 		mpr_dprint(sc, MPR_INIT, "IOC not ready\n");
 		if ((error = mpr_transition_ready(sc)) != 0) {
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT, 
 			    "failed to transition ready, exit\n");
 			return (error);
 		}
 	}
 
 	error = mpr_send_iocinit(sc);
 	mpr_dprint(sc, MPR_INIT, "%s exit\n", __func__);
 
 	return (error);
 }
 
 static void
 mpr_resize_queues(struct mpr_softc *sc)
 {
 	u_int reqcr, prireqcr, maxio, sges_per_frame, chain_seg_size;
 
 	/*
 	 * Size the queues. Since the reply queues always need one free
 	 * entry, we'll deduct one reply message here.  The LSI documents
 	 * suggest instead to add a count to the request queue, but I think
 	 * that it's better to deduct from reply queue.
 	 */
 	prireqcr = MAX(1, sc->max_prireqframes);
 	prireqcr = MIN(prireqcr, sc->facts->HighPriorityCredit);
 
 	reqcr = MAX(2, sc->max_reqframes);
 	reqcr = MIN(reqcr, sc->facts->RequestCredit);
 
 	sc->num_reqs = prireqcr + reqcr;
 	sc->num_prireqs = prireqcr;
 	sc->num_replies = MIN(sc->max_replyframes + sc->max_evtframes,
 	    sc->facts->MaxReplyDescriptorPostQueueDepth) - 1;
 
 	/* Store the request frame size in bytes rather than as 32bit words */
 	sc->reqframesz = sc->facts->IOCRequestFrameSize * 4;
 
 	/*
 	 * Gen3 and beyond uses the IOCMaxChainSegmentSize from IOC Facts to
 	 * get the size of a Chain Frame.  Previous versions use the size as a
 	 * Request Frame for the Chain Frame size.  If IOCMaxChainSegmentSize
 	 * is 0, use the default value.  The IOCMaxChainSegmentSize is the
 	 * number of 16-byte elelements that can fit in a Chain Frame, which is
 	 * the size of an IEEE Simple SGE.
 	 */
 	if (sc->facts->MsgVersion >= MPI2_VERSION_02_05) {
 		chain_seg_size = htole16(sc->facts->IOCMaxChainSegmentSize);
 		if (chain_seg_size == 0)
 			chain_seg_size = MPR_DEFAULT_CHAIN_SEG_SIZE;
 		sc->chain_frame_size = chain_seg_size *
 		    MPR_MAX_CHAIN_ELEMENT_SIZE;
 	} else {
 		sc->chain_frame_size = sc->reqframesz;
 	}
 
 	/*
 	 * Max IO Size is Page Size * the following:
 	 * ((SGEs per frame - 1 for chain element) * Max Chain Depth)
 	 * + 1 for no chain needed in last frame
 	 *
 	 * If user suggests a Max IO size to use, use the smaller of the
 	 * user's value and the calculated value as long as the user's
 	 * value is larger than 0. The user's value is in pages.
 	 */
 	sges_per_frame = sc->chain_frame_size/sizeof(MPI2_IEEE_SGE_SIMPLE64)-1;
 	maxio = (sges_per_frame * sc->facts->MaxChainDepth + 1) * PAGE_SIZE;
 
 	/*
 	 * If I/O size limitation requested then use it and pass up to CAM.
 	 * If not, use MAXPHYS as an optimization hint, but report HW limit.
 	 */
 	if (sc->max_io_pages > 0) {
 		maxio = min(maxio, sc->max_io_pages * PAGE_SIZE);
 		sc->maxio = maxio;
 	} else {
 		sc->maxio = maxio;
 		maxio = min(maxio, MAXPHYS);
 	}
 
 	sc->num_chains = (maxio / PAGE_SIZE + sges_per_frame - 2) /
 	    sges_per_frame * reqcr;
 	if (sc->max_chains > 0 && sc->max_chains < sc->num_chains)
 		sc->num_chains = sc->max_chains;
 
 	/*
 	 * Figure out the number of MSIx-based queues.  If the firmware or
 	 * user has done something crazy and not allowed enough credit for
 	 * the queues to be useful then don't enable multi-queue.
 	 */
 	if (sc->facts->MaxMSIxVectors < 2)
 		sc->msi_msgs = 1;
 
 	if (sc->msi_msgs > 1) {
 		sc->msi_msgs = MIN(sc->msi_msgs, mp_ncpus);
 		sc->msi_msgs = MIN(sc->msi_msgs, sc->facts->MaxMSIxVectors);
 		if (sc->num_reqs / sc->msi_msgs < 2)
 			sc->msi_msgs = 1;
 	}
 
 	mpr_dprint(sc, MPR_INIT, "Sized queues to q=%d reqs=%d replies=%d\n",
 	    sc->msi_msgs, sc->num_reqs, sc->num_replies);
 }
 
 /*
  * This is called during attach and when re-initializing due to a Diag Reset.
  * IOC Facts is used to allocate many of the structures needed by the driver.
  * If called from attach, de-allocation is not required because the driver has
  * not allocated any structures yet, but if called from a Diag Reset, previously
  * allocated structures based on IOC Facts will need to be freed and re-
  * allocated bases on the latest IOC Facts.
  */
 static int
 mpr_iocfacts_allocate(struct mpr_softc *sc, uint8_t attaching)
 {
 	int error;
 	Mpi2IOCFactsReply_t saved_facts;
 	uint8_t saved_mode, reallocating;
 
 	mpr_dprint(sc, MPR_INIT|MPR_TRACE, "%s entered\n", __func__);
 
 	/* Save old IOC Facts and then only reallocate if Facts have changed */
 	if (!attaching) {
 		bcopy(sc->facts, &saved_facts, sizeof(MPI2_IOC_FACTS_REPLY));
 	}
 
 	/*
 	 * Get IOC Facts.  In all cases throughout this function, panic if doing
 	 * a re-initialization and only return the error if attaching so the OS
 	 * can handle it.
 	 */
 	if ((error = mpr_get_iocfacts(sc, sc->facts)) != 0) {
 		if (attaching) {
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT, "Failed to get "
 			    "IOC Facts with error %d, exit\n", error);
 			return (error);
 		} else {
 			panic("%s failed to get IOC Facts with error %d\n",
 			    __func__, error);
 		}
 	}
 
 	MPR_DPRINT_PAGE(sc, MPR_XINFO, iocfacts, sc->facts);
 
 	snprintf(sc->fw_version, sizeof(sc->fw_version), 
 	    "%02d.%02d.%02d.%02d", 
 	    sc->facts->FWVersion.Struct.Major,
 	    sc->facts->FWVersion.Struct.Minor,
 	    sc->facts->FWVersion.Struct.Unit,
 	    sc->facts->FWVersion.Struct.Dev);
 
 	snprintf(sc->msg_version, sizeof(sc->msg_version), "%d.%d",
 	    (sc->facts->MsgVersion & MPI2_IOCFACTS_MSGVERSION_MAJOR_MASK) >>
 	    MPI2_IOCFACTS_MSGVERSION_MAJOR_SHIFT,
 	    (sc->facts->MsgVersion & MPI2_IOCFACTS_MSGVERSION_MINOR_MASK) >>
 	    MPI2_IOCFACTS_MSGVERSION_MINOR_SHIFT);
 
 	mpr_dprint(sc, MPR_INFO, "Firmware: %s, Driver: %s\n", sc->fw_version,
 	    MPR_DRIVER_VERSION);
 	mpr_dprint(sc, MPR_INFO,
 	    "IOCCapabilities: %b\n", sc->facts->IOCCapabilities,
 	    "\20" "\3ScsiTaskFull" "\4DiagTrace" "\5SnapBuf" "\6ExtBuf"
 	    "\7EEDP" "\10BiDirTarg" "\11Multicast" "\14TransRetry" "\15IR"
 	    "\16EventReplay" "\17RaidAccel" "\20MSIXIndex" "\21HostDisc"
 	    "\22FastPath" "\23RDPQArray" "\24AtomicReqDesc" "\25PCIeSRIOV");
 
 	/*
 	 * If the chip doesn't support event replay then a hard reset will be
 	 * required to trigger a full discovery.  Do the reset here then
 	 * retransition to Ready.  A hard reset might have already been done,
 	 * but it doesn't hurt to do it again.  Only do this if attaching, not
 	 * for a Diag Reset.
 	 */
 	if (attaching && ((sc->facts->IOCCapabilities &
 	    MPI2_IOCFACTS_CAPABILITY_EVENT_REPLAY) == 0)) {
 		mpr_dprint(sc, MPR_INIT, "No event replay, resetting\n");
 		mpr_diag_reset(sc, NO_SLEEP);
 		if ((error = mpr_transition_ready(sc)) != 0) {
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT, "Failed to "
 			    "transition to ready with error %d, exit\n",
 			    error);
 			return (error);
 		}
 	}
 
 	/*
 	 * Set flag if IR Firmware is loaded.  If the RAID Capability has
 	 * changed from the previous IOC Facts, log a warning, but only if
 	 * checking this after a Diag Reset and not during attach.
 	 */
 	saved_mode = sc->ir_firmware;
 	if (sc->facts->IOCCapabilities &
 	    MPI2_IOCFACTS_CAPABILITY_INTEGRATED_RAID)
 		sc->ir_firmware = 1;
 	if (!attaching) {
 		if (sc->ir_firmware != saved_mode) {
 			mpr_dprint(sc, MPR_INIT|MPR_FAULT, "new IR/IT mode "
 			    "in IOC Facts does not match previous mode\n");
 		}
 	}
 
 	/* Only deallocate and reallocate if relevant IOC Facts have changed */
 	reallocating = FALSE;
 	sc->mpr_flags &= ~MPR_FLAGS_REALLOCATED;
 
 	if ((!attaching) &&
 	    ((saved_facts.MsgVersion != sc->facts->MsgVersion) ||
 	    (saved_facts.HeaderVersion != sc->facts->HeaderVersion) ||
 	    (saved_facts.MaxChainDepth != sc->facts->MaxChainDepth) ||
 	    (saved_facts.RequestCredit != sc->facts->RequestCredit) ||
 	    (saved_facts.ProductID != sc->facts->ProductID) ||
 	    (saved_facts.IOCCapabilities != sc->facts->IOCCapabilities) ||
 	    (saved_facts.IOCRequestFrameSize !=
 	    sc->facts->IOCRequestFrameSize) ||
 	    (saved_facts.IOCMaxChainSegmentSize !=
 	    sc->facts->IOCMaxChainSegmentSize) ||
 	    (saved_facts.MaxTargets != sc->facts->MaxTargets) ||
 	    (saved_facts.MaxSasExpanders != sc->facts->MaxSasExpanders) ||
 	    (saved_facts.MaxEnclosures != sc->facts->MaxEnclosures) ||
 	    (saved_facts.HighPriorityCredit != sc->facts->HighPriorityCredit) ||
 	    (saved_facts.MaxReplyDescriptorPostQueueDepth !=
 	    sc->facts->MaxReplyDescriptorPostQueueDepth) ||
 	    (saved_facts.ReplyFrameSize != sc->facts->ReplyFrameSize) ||
 	    (saved_facts.MaxVolumes != sc->facts->MaxVolumes) ||
 	    (saved_facts.MaxPersistentEntries !=
 	    sc->facts->MaxPersistentEntries))) {
 		reallocating = TRUE;
 
 		/* Record that we reallocated everything */
 		sc->mpr_flags |= MPR_FLAGS_REALLOCATED;
 	}
 
 	/*
 	 * Some things should be done if attaching or re-allocating after a Diag
 	 * Reset, but are not needed after a Diag Reset if the FW has not
 	 * changed.
 	 */
 	if (attaching || reallocating) {
 		/*
 		 * Check if controller supports FW diag buffers and set flag to
 		 * enable each type.
 		 */
 		if (sc->facts->IOCCapabilities &
 		    MPI2_IOCFACTS_CAPABILITY_DIAG_TRACE_BUFFER)
 			sc->fw_diag_buffer_list[MPI2_DIAG_BUF_TYPE_TRACE].
 			    enabled = TRUE;
 		if (sc->facts->IOCCapabilities &
 		    MPI2_IOCFACTS_CAPABILITY_SNAPSHOT_BUFFER)
 			sc->fw_diag_buffer_list[MPI2_DIAG_BUF_TYPE_SNAPSHOT].
 			    enabled = TRUE;
 		if (sc->facts->IOCCapabilities &
 		    MPI2_IOCFACTS_CAPABILITY_EXTENDED_BUFFER)
 			sc->fw_diag_buffer_list[MPI2_DIAG_BUF_TYPE_EXTENDED].
 			    enabled = TRUE;
 
 		/*
 		 * Set flags for some supported items.
 		 */
 		if (sc->facts->IOCCapabilities & MPI2_IOCFACTS_CAPABILITY_EEDP)
 			sc->eedp_enabled = TRUE;
 		if (sc->facts->IOCCapabilities & MPI2_IOCFACTS_CAPABILITY_TLR)
 			sc->control_TLR = TRUE;
 		if ((sc->facts->IOCCapabilities &
 		    MPI26_IOCFACTS_CAPABILITY_ATOMIC_REQ) &&
 		    (sc->mpr_flags & MPR_FLAGS_SEA_IOC))
 			sc->atomic_desc_capable = TRUE;
 
 		mpr_resize_queues(sc);
 
 		/*
 		 * Initialize all Tail Queues
 		 */
 		TAILQ_INIT(&sc->req_list);
 		TAILQ_INIT(&sc->high_priority_req_list);
 		TAILQ_INIT(&sc->chain_list);
 		TAILQ_INIT(&sc->prp_page_list);
 		TAILQ_INIT(&sc->tm_list);
 	}
 
 	/*
 	 * If doing a Diag Reset and the FW is significantly different
 	 * (reallocating will be set above in IOC Facts comparison), then all
 	 * buffers based on the IOC Facts will need to be freed before they are
 	 * reallocated.
 	 */
 	if (reallocating) {
 		mpr_iocfacts_free(sc);
 		mprsas_realloc_targets(sc, saved_facts.MaxTargets +
 		    saved_facts.MaxVolumes);
 	}
 
 	/*
 	 * Any deallocation has been completed.  Now start reallocating
 	 * if needed.  Will only need to reallocate if attaching or if the new
 	 * IOC Facts are different from the previous IOC Facts after a Diag
 	 * Reset. Targets have already been allocated above if needed.
 	 */
 	error = 0;
 	while (attaching || reallocating) {
 		if ((error = mpr_alloc_hw_queues(sc)) != 0)
 			break;
 		if ((error = mpr_alloc_replies(sc)) != 0)
 			break;
 		if ((error = mpr_alloc_requests(sc)) != 0)
 			break;
 		if ((error = mpr_alloc_queues(sc)) != 0)
 			break;
 		break;
 	}
 	if (error) {
 		mpr_dprint(sc, MPR_INIT|MPR_ERROR,
 		    "Failed to alloc queues with error %d\n", error);
 		mpr_free(sc);
 		return (error);
 	}
 
 	/* Always initialize the queues */
 	bzero(sc->free_queue, sc->fqdepth * 4);
 	mpr_init_queues(sc);
 
 	/*
 	 * Always get the chip out of the reset state, but only panic if not
 	 * attaching.  If attaching and there is an error, that is handled by
 	 * the OS.
 	 */
 	error = mpr_transition_operational(sc);
 	if (error != 0) {
 		mpr_dprint(sc, MPR_INIT|MPR_FAULT, "Failed to "
 		    "transition to operational with error %d\n", error);
 		mpr_free(sc);
 		return (error);
 	}
 
 	/*
 	 * Finish the queue initialization.
 	 * These are set here instead of in mpr_init_queues() because the
 	 * IOC resets these values during the state transition in
 	 * mpr_transition_operational().  The free index is set to 1
 	 * because the corresponding index in the IOC is set to 0, and the
 	 * IOC treats the queues as full if both are set to the same value.
 	 * Hence the reason that the queue can't hold all of the possible
 	 * replies.
 	 */
 	sc->replypostindex = 0;
 	mpr_regwrite(sc, MPI2_REPLY_FREE_HOST_INDEX_OFFSET, sc->replyfreeindex);
 	mpr_regwrite(sc, MPI2_REPLY_POST_HOST_INDEX_OFFSET, 0);
 
 	/*
 	 * Attach the subsystems so they can prepare their event masks.
 	 * XXX Should be dynamic so that IM/IR and user modules can attach
 	 */
 	error = 0;
 	while (attaching) {
 		mpr_dprint(sc, MPR_INIT, "Attaching subsystems\n");
 		if ((error = mpr_attach_log(sc)) != 0)
 			break;
 		if ((error = mpr_attach_sas(sc)) != 0)
 			break;
 		if ((error = mpr_attach_user(sc)) != 0)
 			break;
 		break;
 	}
 	if (error) {
 		mpr_dprint(sc, MPR_INIT|MPR_ERROR,
 		    "Failed to attach all subsystems: error %d\n", error);
 		mpr_free(sc);
 		return (error);
 	}
 
 	/*
 	 * XXX If the number of MSI-X vectors changes during re-init, this
 	 * won't see it and adjust.
 	 */
 	if (attaching && (error = mpr_pci_setup_interrupts(sc)) != 0) {
 		mpr_dprint(sc, MPR_INIT|MPR_ERROR,
 		    "Failed to setup interrupts\n");
 		mpr_free(sc);
 		return (error);
 	}
 
 	return (error);
 }
 
 /*
  * This is called if memory is being free (during detach for example) and when
  * buffers need to be reallocated due to a Diag Reset.
  */
 static void
 mpr_iocfacts_free(struct mpr_softc *sc)
 {
 	struct mpr_command *cm;
 	int i;
 
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 
 	if (sc->free_busaddr != 0)
 		bus_dmamap_unload(sc->queues_dmat, sc->queues_map);
 	if (sc->free_queue != NULL)
 		bus_dmamem_free(sc->queues_dmat, sc->free_queue,
 		    sc->queues_map);
 	if (sc->queues_dmat != NULL)
 		bus_dma_tag_destroy(sc->queues_dmat);
 
 	if (sc->chain_frames != NULL) {
 		bus_dmamap_unload(sc->chain_dmat, sc->chain_map);
 		bus_dmamem_free(sc->chain_dmat, sc->chain_frames,
 		    sc->chain_map);
 	}
 	if (sc->chain_dmat != NULL)
 		bus_dma_tag_destroy(sc->chain_dmat);
 
 	if (sc->sense_busaddr != 0)
 		bus_dmamap_unload(sc->sense_dmat, sc->sense_map);
 	if (sc->sense_frames != NULL)
 		bus_dmamem_free(sc->sense_dmat, sc->sense_frames,
 		    sc->sense_map);
 	if (sc->sense_dmat != NULL)
 		bus_dma_tag_destroy(sc->sense_dmat);
 
 	if (sc->prp_page_busaddr != 0)
 		bus_dmamap_unload(sc->prp_page_dmat, sc->prp_page_map);
 	if (sc->prp_pages != NULL)
 		bus_dmamem_free(sc->prp_page_dmat, sc->prp_pages,
 		    sc->prp_page_map);
 	if (sc->prp_page_dmat != NULL)
 		bus_dma_tag_destroy(sc->prp_page_dmat);
 
 	if (sc->reply_busaddr != 0)
 		bus_dmamap_unload(sc->reply_dmat, sc->reply_map);
 	if (sc->reply_frames != NULL)
 		bus_dmamem_free(sc->reply_dmat, sc->reply_frames,
 		    sc->reply_map);
 	if (sc->reply_dmat != NULL)
 		bus_dma_tag_destroy(sc->reply_dmat);
 
 	if (sc->req_busaddr != 0)
 		bus_dmamap_unload(sc->req_dmat, sc->req_map);
 	if (sc->req_frames != NULL)
 		bus_dmamem_free(sc->req_dmat, sc->req_frames, sc->req_map);
 	if (sc->req_dmat != NULL)
 		bus_dma_tag_destroy(sc->req_dmat);
 
 	if (sc->chains != NULL)
 		free(sc->chains, M_MPR);
 	if (sc->prps != NULL)
 		free(sc->prps, M_MPR);
 	if (sc->commands != NULL) {
 		for (i = 1; i < sc->num_reqs; i++) {
 			cm = &sc->commands[i];
 			bus_dmamap_destroy(sc->buffer_dmat, cm->cm_dmamap);
 		}
 		free(sc->commands, M_MPR);
 	}
 	if (sc->buffer_dmat != NULL)
 		bus_dma_tag_destroy(sc->buffer_dmat);
 
 	mpr_pci_free_interrupts(sc);
 	free(sc->queues, M_MPR);
 	sc->queues = NULL;
 }
 
 /* 
  * The terms diag reset and hard reset are used interchangeably in the MPI
  * docs to mean resetting the controller chip.  In this code diag reset
  * cleans everything up, and the hard reset function just sends the reset
  * sequence to the chip.  This should probably be refactored so that every
  * subsystem gets a reset notification of some sort, and can clean up
  * appropriately.
  */
 int
 mpr_reinit(struct mpr_softc *sc)
 {
 	int error;
 	struct mprsas_softc *sassc;
 
 	sassc = sc->sassc;
 
 	MPR_FUNCTRACE(sc);
 
 	mtx_assert(&sc->mpr_mtx, MA_OWNED);
 
 	mpr_dprint(sc, MPR_INIT|MPR_INFO, "Reinitializing controller\n");
 	if (sc->mpr_flags & MPR_FLAGS_DIAGRESET) {
 		mpr_dprint(sc, MPR_INIT, "Reset already in progress\n");
 		return 0;
 	}
 
 	/*
 	 * Make sure the completion callbacks can recognize they're getting
 	 * a NULL cm_reply due to a reset.
 	 */
 	sc->mpr_flags |= MPR_FLAGS_DIAGRESET;
 
 	/*
 	 * Mask interrupts here.
 	 */
 	mpr_dprint(sc, MPR_INIT, "Masking interrupts and resetting\n");
 	mpr_mask_intr(sc);
 
 	error = mpr_diag_reset(sc, CAN_SLEEP);
 	if (error != 0) {
 		panic("%s hard reset failed with error %d\n", __func__, error);
 	}
 
 	/* Restore the PCI state, including the MSI-X registers */
 	mpr_pci_restore(sc);
 
 	/* Give the I/O subsystem special priority to get itself prepared */
 	mprsas_handle_reinit(sc);
 
 	/*
 	 * Get IOC Facts and allocate all structures based on this information.
 	 * The attach function will also call mpr_iocfacts_allocate at startup.
 	 * If relevant values have changed in IOC Facts, this function will free
 	 * all of the memory based on IOC Facts and reallocate that memory.
 	 */
 	if ((error = mpr_iocfacts_allocate(sc, FALSE)) != 0) {
 		panic("%s IOC Facts based allocation failed with error %d\n",
 		    __func__, error);
 	}
 
 	/*
 	 * Mapping structures will be re-allocated after getting IOC Page8, so
 	 * free these structures here.
 	 */
 	mpr_mapping_exit(sc);
 
 	/*
 	 * The static page function currently read is IOC Page8.  Others can be
 	 * added in future.  It's possible that the values in IOC Page8 have
 	 * changed after a Diag Reset due to user modification, so always read
 	 * these.  Interrupts are masked, so unmask them before getting config
 	 * pages.
 	 */
 	mpr_unmask_intr(sc);
 	sc->mpr_flags &= ~MPR_FLAGS_DIAGRESET;
 	mpr_base_static_config_pages(sc);
 
 	/*
 	 * Some mapping info is based in IOC Page8 data, so re-initialize the
 	 * mapping tables.
 	 */
 	mpr_mapping_initialize(sc);
 
 	/*
 	 * Restart will reload the event masks clobbered by the reset, and
 	 * then enable the port.
 	 */
 	mpr_reregister_events(sc);
 
 	/* the end of discovery will release the simq, so we're done. */
 	mpr_dprint(sc, MPR_INIT|MPR_XINFO, "Finished sc %p post %u free %u\n", 
 	    sc, sc->replypostindex, sc->replyfreeindex);
 	mprsas_release_simq_reinit(sassc);
 	mpr_dprint(sc, MPR_INIT, "%s exit error= %d\n", __func__, error);
 
 	return 0;
 }
 
 /* Wait for the chip to ACK a word that we've put into its FIFO 
  * Wait for <timeout> seconds. In single loop wait for busy loop
  * for 500 microseconds.
  * Total is [ 0.5 * (2000 * <timeout>) ] in miliseconds.
  * */
 static int
 mpr_wait_db_ack(struct mpr_softc *sc, int timeout, int sleep_flag)
 {
 	u32 cntdn, count;
 	u32 int_status;
 	u32 doorbell;
 
 	count = 0;
 	cntdn = (sleep_flag == CAN_SLEEP) ? 1000*timeout : 2000*timeout;
 	do {
 		int_status = mpr_regread(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET);
 		if (!(int_status & MPI2_HIS_SYS2IOC_DB_STATUS)) {
 			mpr_dprint(sc, MPR_TRACE, "%s: successful count(%d), "
 			    "timeout(%d)\n", __func__, count, timeout);
 			return 0;
 		} else if (int_status & MPI2_HIS_IOC2SYS_DB_STATUS) {
 			doorbell = mpr_regread(sc, MPI2_DOORBELL_OFFSET);
 			if ((doorbell & MPI2_IOC_STATE_MASK) ==
 			    MPI2_IOC_STATE_FAULT) {
 				mpr_dprint(sc, MPR_FAULT,
 				    "fault_state(0x%04x)!\n", doorbell);
 				return (EFAULT);
 			}
 		} else if (int_status == 0xFFFFFFFF)
 			goto out;
 			
 		/*
 		 * If it can sleep, sleep for 1 milisecond, else busy loop for
  		 * 0.5 milisecond
 		 */
 		if (mtx_owned(&sc->mpr_mtx) && sleep_flag == CAN_SLEEP)
 			msleep(&sc->msleep_fake_chan, &sc->mpr_mtx, 0, "mprdba",
 			    hz/1000);
 		else if (sleep_flag == CAN_SLEEP)
 			pause("mprdba", hz/1000);
 		else
 			DELAY(500);
 		count++;
 	} while (--cntdn);
 
 out:
 	mpr_dprint(sc, MPR_FAULT, "%s: failed due to timeout count(%d), "
 		"int_status(%x)!\n", __func__, count, int_status);
 	return (ETIMEDOUT);
 }
 
 /* Wait for the chip to signal that the next word in its FIFO can be fetched */
 static int
 mpr_wait_db_int(struct mpr_softc *sc)
 {
 	int retry;
 
 	for (retry = 0; retry < MPR_DB_MAX_WAIT; retry++) {
 		if ((mpr_regread(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET) &
 		    MPI2_HIS_IOC2SYS_DB_STATUS) != 0)
 			return (0);
 		DELAY(2000);
 	}
 	return (ETIMEDOUT);
 }
 
 /* Step through the synchronous command state machine, i.e. "Doorbell mode" */
 static int
 mpr_request_sync(struct mpr_softc *sc, void *req, MPI2_DEFAULT_REPLY *reply,
     int req_sz, int reply_sz, int timeout)
 {
 	uint32_t *data32;
 	uint16_t *data16;
 	int i, count, ioc_sz, residual;
 	int sleep_flags = CAN_SLEEP;
 
 	if (curthread->td_no_sleeping)
 		sleep_flags = NO_SLEEP;
 
 	/* Step 1 */
 	mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	/* Step 2 */
 	if (mpr_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_USED)
 		return (EBUSY);
 
 	/* Step 3
 	 * Announce that a message is coming through the doorbell.  Messages
 	 * are pushed at 32bit words, so round up if needed.
 	 */
 	count = (req_sz + 3) / 4;
 	mpr_regwrite(sc, MPI2_DOORBELL_OFFSET,
 	    (MPI2_FUNCTION_HANDSHAKE << MPI2_DOORBELL_FUNCTION_SHIFT) |
 	    (count << MPI2_DOORBELL_ADD_DWORDS_SHIFT));
 
 	/* Step 4 */
 	if (mpr_wait_db_int(sc) ||
 	    (mpr_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_USED) == 0) {
 		mpr_dprint(sc, MPR_FAULT, "Doorbell failed to activate\n");
 		return (ENXIO);
 	}
 	mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	if (mpr_wait_db_ack(sc, 5, sleep_flags) != 0) {
 		mpr_dprint(sc, MPR_FAULT, "Doorbell handshake failed\n");
 		return (ENXIO);
 	}
 
 	/* Step 5 */
 	/* Clock out the message data synchronously in 32-bit dwords*/
 	data32 = (uint32_t *)req;
 	for (i = 0; i < count; i++) {
 		mpr_regwrite(sc, MPI2_DOORBELL_OFFSET, htole32(data32[i]));
 		if (mpr_wait_db_ack(sc, 5, sleep_flags) != 0) {
 			mpr_dprint(sc, MPR_FAULT,
 			    "Timeout while writing doorbell\n");
 			return (ENXIO);
 		}
 	}
 
 	/* Step 6 */
 	/* Clock in the reply in 16-bit words.  The total length of the
 	 * message is always in the 4th byte, so clock out the first 2 words
 	 * manually, then loop the rest.
 	 */
 	data16 = (uint16_t *)reply;
 	if (mpr_wait_db_int(sc) != 0) {
 		mpr_dprint(sc, MPR_FAULT, "Timeout reading doorbell 0\n");
 		return (ENXIO);
 	}
 	data16[0] =
 	    mpr_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_DATA_MASK;
 	mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	if (mpr_wait_db_int(sc) != 0) {
 		mpr_dprint(sc, MPR_FAULT, "Timeout reading doorbell 1\n");
 		return (ENXIO);
 	}
 	data16[1] =
 	    mpr_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_DATA_MASK;
 	mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	/* Number of 32bit words in the message */
 	ioc_sz = reply->MsgLength;
 
 	/*
 	 * Figure out how many 16bit words to clock in without overrunning.
 	 * The precision loss with dividing reply_sz can safely be
 	 * ignored because the messages can only be multiples of 32bits.
 	 */
 	residual = 0;
 	count = MIN((reply_sz / 4), ioc_sz) * 2;
 	if (count < ioc_sz * 2) {
 		residual = ioc_sz * 2 - count;
 		mpr_dprint(sc, MPR_ERROR, "Driver error, throwing away %d "
 		    "residual message words\n", residual);
 	}
 
 	for (i = 2; i < count; i++) {
 		if (mpr_wait_db_int(sc) != 0) {
 			mpr_dprint(sc, MPR_FAULT,
 			    "Timeout reading doorbell %d\n", i);
 			return (ENXIO);
 		}
 		data16[i] = mpr_regread(sc, MPI2_DOORBELL_OFFSET) &
 		    MPI2_DOORBELL_DATA_MASK;
 		mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	}
 
 	/*
 	 * Pull out residual words that won't fit into the provided buffer.
 	 * This keeps the chip from hanging due to a driver programming
 	 * error.
 	 */
 	while (residual--) {
 		if (mpr_wait_db_int(sc) != 0) {
 			mpr_dprint(sc, MPR_FAULT, "Timeout reading doorbell\n");
 			return (ENXIO);
 		}
 		(void)mpr_regread(sc, MPI2_DOORBELL_OFFSET);
 		mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	}
 
 	/* Step 7 */
 	if (mpr_wait_db_int(sc) != 0) {
 		mpr_dprint(sc, MPR_FAULT, "Timeout waiting to exit doorbell\n");
 		return (ENXIO);
 	}
 	if (mpr_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_USED)
 		mpr_dprint(sc, MPR_FAULT, "Warning, doorbell still active\n");
 	mpr_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	return (0);
 }
 
 static void
 mpr_enqueue_request(struct mpr_softc *sc, struct mpr_command *cm)
 {
 	request_descriptor rd;
 
 	MPR_FUNCTRACE(sc);
 	mpr_dprint(sc, MPR_TRACE, "SMID %u cm %p ccb %p\n",
 	    cm->cm_desc.Default.SMID, cm, cm->cm_ccb);
 
 	if (sc->mpr_flags & MPR_FLAGS_ATTACH_DONE && !(sc->mpr_flags &
 	    MPR_FLAGS_SHUTDOWN))
 		mtx_assert(&sc->mpr_mtx, MA_OWNED);
 
 	if (++sc->io_cmds_active > sc->io_cmds_highwater)
 		sc->io_cmds_highwater++;
 
 	KASSERT(cm->cm_state == MPR_CM_STATE_BUSY, ("command not busy\n"));
 	cm->cm_state = MPR_CM_STATE_INQUEUE;
 
 	if (sc->atomic_desc_capable) {
 		rd.u.low = cm->cm_desc.Words.Low;
 		mpr_regwrite(sc, MPI26_ATOMIC_REQUEST_DESCRIPTOR_POST_OFFSET,
 		    rd.u.low);
 	} else {
 		rd.u.low = cm->cm_desc.Words.Low;
 		rd.u.high = cm->cm_desc.Words.High;
 		rd.word = htole64(rd.word);
 		mpr_regwrite(sc, MPI2_REQUEST_DESCRIPTOR_POST_LOW_OFFSET,
 		    rd.u.low);
 		mpr_regwrite(sc, MPI2_REQUEST_DESCRIPTOR_POST_HIGH_OFFSET,
 		    rd.u.high);
 	}
 }
 
 /*
  * Just the FACTS, ma'am.
  */
 static int
 mpr_get_iocfacts(struct mpr_softc *sc, MPI2_IOC_FACTS_REPLY *facts)
 {
 	MPI2_DEFAULT_REPLY *reply;
 	MPI2_IOC_FACTS_REQUEST request;
 	int error, req_sz, reply_sz;
 
 	MPR_FUNCTRACE(sc);
 	mpr_dprint(sc, MPR_INIT, "%s entered\n", __func__);
 
 	req_sz = sizeof(MPI2_IOC_FACTS_REQUEST);
 	reply_sz = sizeof(MPI2_IOC_FACTS_REPLY);
 	reply = (MPI2_DEFAULT_REPLY *)facts;
 
 	bzero(&request, req_sz);
 	request.Function = MPI2_FUNCTION_IOC_FACTS;
 	error = mpr_request_sync(sc, &request, reply, req_sz, reply_sz, 5);
 
 	mpr_dprint(sc, MPR_INIT, "%s exit, error= %d\n", __func__, error);
 	return (error);
 }
 
 static int
 mpr_send_iocinit(struct mpr_softc *sc)
 {
 	MPI2_IOC_INIT_REQUEST	init;
 	MPI2_DEFAULT_REPLY	reply;
 	int req_sz, reply_sz, error;
 	struct timeval now;
 	uint64_t time_in_msec;
 
 	MPR_FUNCTRACE(sc);
 	mpr_dprint(sc, MPR_INIT, "%s entered\n", __func__);
 
 	/* Do a quick sanity check on proper initialization */
 	if ((sc->pqdepth == 0) || (sc->fqdepth == 0) || (sc->reqframesz == 0)
 	    || (sc->replyframesz == 0)) {
 		mpr_dprint(sc, MPR_INIT|MPR_ERROR,
 		    "Driver not fully initialized for IOCInit\n");
 		return (EINVAL);
 	}
 
 	req_sz = sizeof(MPI2_IOC_INIT_REQUEST);
 	reply_sz = sizeof(MPI2_IOC_INIT_REPLY);
 	bzero(&init, req_sz);
 	bzero(&reply, reply_sz);
 
 	/*
 	 * Fill in the init block.  Note that most addresses are
 	 * deliberately in the lower 32bits of memory.  This is a micro-
 	 * optimzation for PCI/PCIX, though it's not clear if it helps PCIe.
 	 */
 	init.Function = MPI2_FUNCTION_IOC_INIT;
 	init.WhoInit = MPI2_WHOINIT_HOST_DRIVER;
 	init.MsgVersion = htole16(MPI2_VERSION);
 	init.HeaderVersion = htole16(MPI2_HEADER_VERSION);
 	init.SystemRequestFrameSize = htole16((uint16_t)(sc->reqframesz / 4));
 	init.ReplyDescriptorPostQueueDepth = htole16(sc->pqdepth);
 	init.ReplyFreeQueueDepth = htole16(sc->fqdepth);
 	init.SenseBufferAddressHigh = 0;
 	init.SystemReplyAddressHigh = 0;
 	init.SystemRequestFrameBaseAddress.High = 0;
 	init.SystemRequestFrameBaseAddress.Low =
 	    htole32((uint32_t)sc->req_busaddr);
 	init.ReplyDescriptorPostQueueAddress.High = 0;
 	init.ReplyDescriptorPostQueueAddress.Low =
 	    htole32((uint32_t)sc->post_busaddr);
 	init.ReplyFreeQueueAddress.High = 0;
 	init.ReplyFreeQueueAddress.Low = htole32((uint32_t)sc->free_busaddr);
 	getmicrotime(&now);
 	time_in_msec = (now.tv_sec * 1000 + now.tv_usec/1000);
 	init.TimeStamp.High = htole32((time_in_msec >> 32) & 0xFFFFFFFF);
 	init.TimeStamp.Low = htole32(time_in_msec & 0xFFFFFFFF);
 	init.HostPageSize = HOST_PAGE_SIZE_4K;
 
 	error = mpr_request_sync(sc, &init, &reply, req_sz, reply_sz, 5);
 	if ((reply.IOCStatus & MPI2_IOCSTATUS_MASK) != MPI2_IOCSTATUS_SUCCESS)
 		error = ENXIO;
 
 	mpr_dprint(sc, MPR_INIT, "IOCInit status= 0x%x\n", reply.IOCStatus);
 	mpr_dprint(sc, MPR_INIT, "%s exit\n", __func__);
 	return (error);
 }
 
 void
 mpr_memaddr_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	bus_addr_t *addr;
 
 	addr = arg;
 	*addr = segs[0].ds_addr;
 }
 
 void
 mpr_memaddr_wait_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	struct mpr_busdma_context *ctx;
 	int need_unload, need_free;
 
 	ctx = (struct mpr_busdma_context *)arg;
 	need_unload = 0;
 	need_free = 0;
 
 	mpr_lock(ctx->softc);
 	ctx->error = error;
 	ctx->completed = 1;
 	if ((error == 0) && (ctx->abandoned == 0)) {
 		*ctx->addr = segs[0].ds_addr;
 	} else {
 		if (nsegs != 0)
 			need_unload = 1;
 		if (ctx->abandoned != 0)
 			need_free = 1;
 	}
 	if (need_free == 0)
 		wakeup(ctx);
 
 	mpr_unlock(ctx->softc);
 
 	if (need_unload != 0) {
 		bus_dmamap_unload(ctx->buffer_dmat,
 				  ctx->buffer_dmamap);
 		*ctx->addr = 0;
 	}
 
 	if (need_free != 0)
 		free(ctx, M_MPR);
 }
 
 static int
 mpr_alloc_queues(struct mpr_softc *sc)
 {
 	struct mpr_queue *q;
 	int nq, i;
 
 	nq = sc->msi_msgs;
 	mpr_dprint(sc, MPR_INIT|MPR_XINFO, "Allocating %d I/O queues\n", nq);
 
 	sc->queues = malloc(sizeof(struct mpr_queue) * nq, M_MPR,
 	     M_NOWAIT|M_ZERO);
 	if (sc->queues == NULL)
 		return (ENOMEM);
 
 	for (i = 0; i < nq; i++) {
 		q = &sc->queues[i];
 		mpr_dprint(sc, MPR_INIT, "Configuring queue %d %p\n", i, q);
 		q->sc = sc;
 		q->qnum = i;
 	}
 	return (0);
 }
 
 static int
 mpr_alloc_hw_queues(struct mpr_softc *sc)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	bus_addr_t queues_busaddr;
 	uint8_t *queues;
 	int qsize, fqsize, pqsize;
 
 	/*
 	 * The reply free queue contains 4 byte entries in multiples of 16 and
 	 * aligned on a 16 byte boundary. There must always be an unused entry.
 	 * This queue supplies fresh reply frames for the firmware to use.
 	 *
 	 * The reply descriptor post queue contains 8 byte entries in
 	 * multiples of 16 and aligned on a 16 byte boundary.  This queue
 	 * contains filled-in reply frames sent from the firmware to the host.
 	 *
 	 * These two queues are allocated together for simplicity.
 	 */
 	sc->fqdepth = roundup2(sc->num_replies + 1, 16);
 	sc->pqdepth = roundup2(sc->num_replies + 1, 16);
 	fqsize= sc->fqdepth * 4;
 	pqsize = sc->pqdepth * 8;
 	qsize = fqsize + pqsize;
 
 	bus_dma_template_init(&t, sc->mpr_parent_dmat);
-	t.alignment = 16;
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = qsize;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(16), BD_MAXSIZE(qsize),
+	    BD_MAXSEGSIZE(qsize), BD_NSEGMENTS(1),
+	    BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
 	if (bus_dma_template_tag(&t, &sc->queues_dmat)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate queues DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->queues_dmat, (void **)&queues, BUS_DMA_NOWAIT,
 	    &sc->queues_map)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate queues memory\n");
 		return (ENOMEM);
         }
         bzero(queues, qsize);
         bus_dmamap_load(sc->queues_dmat, sc->queues_map, queues, qsize,
 	    mpr_memaddr_cb, &queues_busaddr, 0);
 
 	sc->free_queue = (uint32_t *)queues;
 	sc->free_busaddr = queues_busaddr;
 	sc->post_queue = (MPI2_REPLY_DESCRIPTORS_UNION *)(queues + fqsize);
 	sc->post_busaddr = queues_busaddr + fqsize;
 	mpr_dprint(sc, MPR_INIT, "free queue busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->free_busaddr, fqsize);
 	mpr_dprint(sc, MPR_INIT, "reply queue busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->post_busaddr, pqsize);
 
 	return (0);
 }
 
 static int
 mpr_alloc_replies(struct mpr_softc *sc)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	int rsize, num_replies;
 
 	/* Store the reply frame size in bytes rather than as 32bit words */
 	sc->replyframesz = sc->facts->ReplyFrameSize * 4;
 
 	/*
 	 * sc->num_replies should be one less than sc->fqdepth.  We need to
 	 * allocate space for sc->fqdepth replies, but only sc->num_replies
 	 * replies can be used at once.
 	 */
 	num_replies = max(sc->fqdepth, sc->num_replies);
 
 	rsize = sc->replyframesz * num_replies; 
 	bus_dma_template_init(&t, sc->mpr_parent_dmat);
-	t.alignment = 4;
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = rsize;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(4), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize), BD_NSEGMENTS(1),
+	    BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
 	if (bus_dma_template_tag(&t, &sc->reply_dmat)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate replies DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->reply_dmat, (void **)&sc->reply_frames,
 	    BUS_DMA_NOWAIT, &sc->reply_map)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate replies memory\n");
 		return (ENOMEM);
         }
         bzero(sc->reply_frames, rsize);
         bus_dmamap_load(sc->reply_dmat, sc->reply_map, sc->reply_frames, rsize,
 	    mpr_memaddr_cb, &sc->reply_busaddr, 0);
 	mpr_dprint(sc, MPR_INIT, "reply frames busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->reply_busaddr, rsize);
 
 	return (0);
 }
 
 static void
 mpr_load_chains_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	struct mpr_softc *sc = arg;
 	struct mpr_chain *chain;
 	bus_size_t bo;
 	int i, o, s;
 
 	if (error != 0)
 		return;
 
 	for (i = 0, o = 0, s = 0; s < nsegs; s++) {
 		for (bo = 0; bo + sc->chain_frame_size <= segs[s].ds_len;
 		    bo += sc->chain_frame_size) {
 			chain = &sc->chains[i++];
 			chain->chain =(MPI2_SGE_IO_UNION *)(sc->chain_frames+o);
 			chain->chain_busaddr = segs[s].ds_addr + bo;
 			o += sc->chain_frame_size;
 			mpr_free_chain(sc, chain);
 		}
 		if (bo != segs[s].ds_len)
 			o += segs[s].ds_len - bo;
 	}
 	sc->chain_free_lowwater = i;
 }
 
 static int
 mpr_alloc_requests(struct mpr_softc *sc)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	struct mpr_command *cm;
 	int i, rsize, nsegs;
 
 	rsize = sc->reqframesz * sc->num_reqs;
 	bus_dma_template_init(&t, sc->mpr_parent_dmat);
-	t.alignment = 16;
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = rsize;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(16), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize), BD_NSEGMENTS(1),
+	    BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
 	if (bus_dma_template_tag(&t, &sc->req_dmat)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate request DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->req_dmat, (void **)&sc->req_frames,
 	    BUS_DMA_NOWAIT, &sc->req_map)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate request memory\n");
 		return (ENOMEM);
         }
         bzero(sc->req_frames, rsize);
         bus_dmamap_load(sc->req_dmat, sc->req_map, sc->req_frames, rsize,
 	    mpr_memaddr_cb, &sc->req_busaddr, 0);
 	mpr_dprint(sc, MPR_INIT, "request frames busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->req_busaddr, rsize);
 
 	sc->chains = malloc(sizeof(struct mpr_chain) * sc->num_chains, M_MPR,
 	    M_NOWAIT | M_ZERO);
 	if (!sc->chains) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate chain memory\n");
 		return (ENOMEM);
 	}
 	rsize = sc->chain_frame_size * sc->num_chains;
 	bus_dma_template_init(&t, sc->mpr_parent_dmat);
-	t.alignment = 16;
-	t.maxsize = t.maxsegsize = rsize;
-	t.nsegments = howmany(rsize, PAGE_SIZE);
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(16), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize), BD_NSEGMENTS((howmany(rsize, PAGE_SIZE))));
 	if (bus_dma_template_tag(&t, &sc->chain_dmat)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate chain DMA tag\n");
 		return (ENOMEM);
 	}
 	if (bus_dmamem_alloc(sc->chain_dmat, (void **)&sc->chain_frames,
 	    BUS_DMA_NOWAIT | BUS_DMA_ZERO, &sc->chain_map)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate chain memory\n");
 		return (ENOMEM);
 	}
 	if (bus_dmamap_load(sc->chain_dmat, sc->chain_map, sc->chain_frames,
 	    rsize, mpr_load_chains_cb, sc, BUS_DMA_NOWAIT)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot load chain memory\n");
 		bus_dmamem_free(sc->chain_dmat, sc->chain_frames,
 		    sc->chain_map);
 		return (ENOMEM);
 	}
 
 	rsize = MPR_SENSE_LEN * sc->num_reqs;
 	bus_dma_template_clone(&t, sc->req_dmat);
-	t.maxsize = t.maxsegsize = rsize;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(1), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize));
 	if (bus_dma_template_tag(&t, &sc->sense_dmat)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate sense DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->sense_dmat, (void **)&sc->sense_frames,
 	    BUS_DMA_NOWAIT, &sc->sense_map)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate sense memory\n");
 		return (ENOMEM);
         }
         bzero(sc->sense_frames, rsize);
         bus_dmamap_load(sc->sense_dmat, sc->sense_map, sc->sense_frames, rsize,
 	    mpr_memaddr_cb, &sc->sense_busaddr, 0);
 	mpr_dprint(sc, MPR_INIT, "sense frames busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->sense_busaddr, rsize);
 
 	/*
 	 * Allocate NVMe PRP Pages for NVMe SGL support only if the FW supports
 	 * these devices.
 	 */
 	if ((sc->facts->MsgVersion >= MPI2_VERSION_02_06) &&
 	    (sc->facts->ProtocolFlags & MPI2_IOCFACTS_PROTOCOL_NVME_DEVICES)) {
 		if (mpr_alloc_nvme_prp_pages(sc) == ENOMEM)
 			return (ENOMEM);
 	}
 
 	nsegs = (sc->maxio / PAGE_SIZE) + 1;
 	bus_dma_template_init(&t, sc->mpr_parent_dmat);
-	t.nsegments = nsegs;
-	t.flags = BUS_DMA_ALLOCNOW;
-	t.lockfunc = busdma_lock_mutex;
-	t.lockfuncarg = &sc->mpr_mtx;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_MAXSIZE(BUS_SPACE_MAXSIZE_32BIT),
+	    BD_NSEGMENTS(nsegs), BD_MAXSEGSIZE(BUS_SPACE_MAXSIZE_32BIT),
+	    BD_FLAGS(BUS_DMA_ALLOCNOW), BD_LOCKFUNC(busdma_lock_mutex),
+	    BD_LOCKFUNCARG(&sc->mpr_mtx));
 	if (bus_dma_template_tag(&t, &sc->buffer_dmat)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate buffer DMA tag\n");
 		return (ENOMEM);
         }
 
 	/*
 	 * SMID 0 cannot be used as a free command per the firmware spec.
 	 * Just drop that command instead of risking accounting bugs.
 	 */
 	sc->commands = malloc(sizeof(struct mpr_command) * sc->num_reqs,
 	    M_MPR, M_WAITOK | M_ZERO);
 	for (i = 1; i < sc->num_reqs; i++) {
 		cm = &sc->commands[i];
 		cm->cm_req = sc->req_frames + i * sc->reqframesz;
 		cm->cm_req_busaddr = sc->req_busaddr + i * sc->reqframesz;
 		cm->cm_sense = &sc->sense_frames[i];
 		cm->cm_sense_busaddr = sc->sense_busaddr + i * MPR_SENSE_LEN;
 		cm->cm_desc.Default.SMID = i;
 		cm->cm_sc = sc;
 		cm->cm_state = MPR_CM_STATE_BUSY;
 		TAILQ_INIT(&cm->cm_chain_list);
 		TAILQ_INIT(&cm->cm_prp_page_list);
 		callout_init_mtx(&cm->cm_callout, &sc->mpr_mtx, 0);
 
 		/* XXX Is a failure here a critical problem? */
 		if (bus_dmamap_create(sc->buffer_dmat, 0, &cm->cm_dmamap)
 		    == 0) {
 			if (i <= sc->num_prireqs)
 				mpr_free_high_priority_command(sc, cm);
 			else
 				mpr_free_command(sc, cm);
 		} else {
 			panic("failed to allocate command %d\n", i);
 			sc->num_reqs = i;
 			break;
 		}
 	}
 
 	return (0);
 }
 
 /*
  * Allocate contiguous buffers for PCIe NVMe devices for building native PRPs,
  * which are scatter/gather lists for NVMe devices. 
  *
  * This buffer must be contiguous due to the nature of how NVMe PRPs are built
  * and translated by FW.
  *
  * returns ENOMEM if memory could not be allocated, otherwise returns 0.
  */
 static int
 mpr_alloc_nvme_prp_pages(struct mpr_softc *sc)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	struct mpr_prp_page *prp_page;
 	int PRPs_per_page, PRPs_required, pages_required;
 	int rsize, i;
 
 	/*
 	 * Assuming a MAX_IO_SIZE of 1MB and a PAGE_SIZE of 4k, the max number
 	 * of PRPs (NVMe's Scatter/Gather Element) needed per I/O is:
 	 * MAX_IO_SIZE / PAGE_SIZE = 256
 	 * 
 	 * 1 PRP entry in main frame for PRP list pointer still leaves 255 PRPs
 	 * required for the remainder of the 1MB I/O. 512 PRPs can fit into one
 	 * page (4096 / 8 = 512), so only one page is required for each I/O.
 	 *
 	 * Each of these buffers will need to be contiguous. For simplicity,
 	 * only one buffer is allocated here, which has all of the space
 	 * required for the NVMe Queue Depth. If there are problems allocating
 	 * this one buffer, this function will need to change to allocate
 	 * individual, contiguous NVME_QDEPTH buffers.
 	 *
 	 * The real calculation will use the real max io size. Above is just an
 	 * example.
 	 *
 	 */
 	PRPs_required = sc->maxio / PAGE_SIZE;
 	PRPs_per_page = (PAGE_SIZE / PRP_ENTRY_SIZE) - 1;
 	pages_required = (PRPs_required / PRPs_per_page) + 1;
 
 	sc->prp_buffer_size = PAGE_SIZE * pages_required; 
 	rsize = sc->prp_buffer_size * NVME_QDEPTH; 
 	bus_dma_template_init(&t, sc->mpr_parent_dmat);
-	t.alignment = 4;
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = rsize;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(4), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize), BD_NSEGMENTS(1),
+	    BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
 	if (bus_dma_template_tag(&t, &sc->prp_page_dmat)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate NVMe PRP DMA "
 		    "tag\n");
 		return (ENOMEM);
 	}
 	if (bus_dmamem_alloc(sc->prp_page_dmat, (void **)&sc->prp_pages,
 	    BUS_DMA_NOWAIT, &sc->prp_page_map)) {
 		mpr_dprint(sc, MPR_ERROR, "Cannot allocate NVMe PRP memory\n");
 		return (ENOMEM);
 	}
 	bzero(sc->prp_pages, rsize);
 	bus_dmamap_load(sc->prp_page_dmat, sc->prp_page_map, sc->prp_pages,
 	    rsize, mpr_memaddr_cb, &sc->prp_page_busaddr, 0);
 
 	sc->prps = malloc(sizeof(struct mpr_prp_page) * NVME_QDEPTH, M_MPR,
 	    M_WAITOK | M_ZERO);
 	for (i = 0; i < NVME_QDEPTH; i++) {
 		prp_page = &sc->prps[i];
 		prp_page->prp_page = (uint64_t *)(sc->prp_pages +
 		    i * sc->prp_buffer_size);
 		prp_page->prp_page_busaddr = (uint64_t)(sc->prp_page_busaddr +
 		    i * sc->prp_buffer_size);
 		mpr_free_prp_page(sc, prp_page);
 		sc->prp_pages_free_lowwater++;
 	}
 
 	return (0);
 }
 
 static int
 mpr_init_queues(struct mpr_softc *sc)
 {
 	int i;
 
 	memset((uint8_t *)sc->post_queue, 0xff, sc->pqdepth * 8);
 
 	/*
 	 * According to the spec, we need to use one less reply than we
 	 * have space for on the queue.  So sc->num_replies (the number we
 	 * use) should be less than sc->fqdepth (allocated size).
 	 */
 	if (sc->num_replies >= sc->fqdepth)
 		return (EINVAL);
 
 	/*
 	 * Initialize all of the free queue entries.
 	 */
 	for (i = 0; i < sc->fqdepth; i++) {
 		sc->free_queue[i] = sc->reply_busaddr + (i * sc->replyframesz);
 	}
 	sc->replyfreeindex = sc->num_replies;
 
 	return (0);
 }
 
 /* Get the driver parameter tunables.  Lowest priority are the driver defaults.
  * Next are the global settings, if they exist.  Highest are the per-unit
  * settings, if they exist.
  */
 void
 mpr_get_tunables(struct mpr_softc *sc)
 {
 	char tmpstr[80], mpr_debug[80];
 
 	/* XXX default to some debugging for now */
 	sc->mpr_debug = MPR_INFO | MPR_FAULT;
 	sc->disable_msix = 0;
 	sc->disable_msi = 0;
 	sc->max_msix = MPR_MSIX_MAX;
 	sc->max_chains = MPR_CHAIN_FRAMES;
 	sc->max_io_pages = MPR_MAXIO_PAGES;
 	sc->enable_ssu = MPR_SSU_ENABLE_SSD_DISABLE_HDD;
 	sc->spinup_wait_time = DEFAULT_SPINUP_WAIT;
 	sc->use_phynum = 1;
 	sc->max_reqframes = MPR_REQ_FRAMES;
 	sc->max_prireqframes = MPR_PRI_REQ_FRAMES;
 	sc->max_replyframes = MPR_REPLY_FRAMES;
 	sc->max_evtframes = MPR_EVT_REPLY_FRAMES;
 
 	/*
 	 * Grab the global variables.
 	 */
 	bzero(mpr_debug, 80);
 	if (TUNABLE_STR_FETCH("hw.mpr.debug_level", mpr_debug, 80) != 0)
 		mpr_parse_debug(sc, mpr_debug);
 	TUNABLE_INT_FETCH("hw.mpr.disable_msix", &sc->disable_msix);
 	TUNABLE_INT_FETCH("hw.mpr.disable_msi", &sc->disable_msi);
 	TUNABLE_INT_FETCH("hw.mpr.max_msix", &sc->max_msix);
 	TUNABLE_INT_FETCH("hw.mpr.max_chains", &sc->max_chains);
 	TUNABLE_INT_FETCH("hw.mpr.max_io_pages", &sc->max_io_pages);
 	TUNABLE_INT_FETCH("hw.mpr.enable_ssu", &sc->enable_ssu);
 	TUNABLE_INT_FETCH("hw.mpr.spinup_wait_time", &sc->spinup_wait_time);
 	TUNABLE_INT_FETCH("hw.mpr.use_phy_num", &sc->use_phynum);
 	TUNABLE_INT_FETCH("hw.mpr.max_reqframes", &sc->max_reqframes);
 	TUNABLE_INT_FETCH("hw.mpr.max_prireqframes", &sc->max_prireqframes);
 	TUNABLE_INT_FETCH("hw.mpr.max_replyframes", &sc->max_replyframes);
 	TUNABLE_INT_FETCH("hw.mpr.max_evtframes", &sc->max_evtframes);
 
 	/* Grab the unit-instance variables */
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.debug_level",
 	    device_get_unit(sc->mpr_dev));
 	bzero(mpr_debug, 80);
 	if (TUNABLE_STR_FETCH(tmpstr, mpr_debug, 80) != 0)
 		mpr_parse_debug(sc, mpr_debug);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.disable_msix",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->disable_msix);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.disable_msi",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->disable_msi);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.max_msix",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_msix);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.max_chains",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_chains);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.max_io_pages",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_io_pages);
 
 	bzero(sc->exclude_ids, sizeof(sc->exclude_ids));
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.exclude_ids",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_STR_FETCH(tmpstr, sc->exclude_ids, sizeof(sc->exclude_ids));
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.enable_ssu",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->enable_ssu);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.spinup_wait_time",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->spinup_wait_time);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.use_phy_num",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->use_phynum);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.max_reqframes",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_reqframes);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.max_prireqframes",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_prireqframes);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.max_replyframes",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_replyframes);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mpr.%d.max_evtframes",
 	    device_get_unit(sc->mpr_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_evtframes);
 }
 
 static void
 mpr_setup_sysctl(struct mpr_softc *sc)
 {
 	struct sysctl_ctx_list	*sysctl_ctx = NULL;
 	struct sysctl_oid	*sysctl_tree = NULL;
 	char tmpstr[80], tmpstr2[80];
 
 	/*
 	 * Setup the sysctl variable so the user can change the debug level
 	 * on the fly.
 	 */
 	snprintf(tmpstr, sizeof(tmpstr), "MPR controller %d",
 	    device_get_unit(sc->mpr_dev));
 	snprintf(tmpstr2, sizeof(tmpstr2), "%d", device_get_unit(sc->mpr_dev));
 
 	sysctl_ctx = device_get_sysctl_ctx(sc->mpr_dev);
 	if (sysctl_ctx != NULL)
 		sysctl_tree = device_get_sysctl_tree(sc->mpr_dev);
 
 	if (sysctl_tree == NULL) {
 		sysctl_ctx_init(&sc->sysctl_ctx);
 		sc->sysctl_tree = SYSCTL_ADD_NODE(&sc->sysctl_ctx,
 		    SYSCTL_STATIC_CHILDREN(_hw_mpr), OID_AUTO, tmpstr2,
 		    CTLFLAG_RD | CTLFLAG_MPSAFE, 0, tmpstr);
 		if (sc->sysctl_tree == NULL)
 			return;
 		sysctl_ctx = &sc->sysctl_ctx;
 		sysctl_tree = sc->sysctl_tree;
 	}
 
 	SYSCTL_ADD_PROC(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "debug_level", CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_MPSAFE,
 	    sc, 0, mpr_debug_sysctl, "A", "mpr debug level");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "disable_msix", CTLFLAG_RD, &sc->disable_msix, 0,
 	    "Disable the use of MSI-X interrupts");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_msix", CTLFLAG_RD, &sc->max_msix, 0,
 	    "User-defined maximum number of MSIX queues");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "msix_msgs", CTLFLAG_RD, &sc->msi_msgs, 0,
 	    "Negotiated number of MSIX queues");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_reqframes", CTLFLAG_RD, &sc->max_reqframes, 0,
 	    "Total number of allocated request frames");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_prireqframes", CTLFLAG_RD, &sc->max_prireqframes, 0,
 	    "Total number of allocated high priority request frames");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_replyframes", CTLFLAG_RD, &sc->max_replyframes, 0,
 	    "Total number of allocated reply frames");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_evtframes", CTLFLAG_RD, &sc->max_evtframes, 0,
 	    "Total number of event frames allocated");
 
 	SYSCTL_ADD_STRING(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "firmware_version", CTLFLAG_RD, sc->fw_version,
 	    strlen(sc->fw_version), "firmware version");
 
 	SYSCTL_ADD_STRING(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "driver_version", CTLFLAG_RD, MPR_DRIVER_VERSION,
 	    strlen(MPR_DRIVER_VERSION), "driver version");
 
 	SYSCTL_ADD_STRING(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "msg_version", CTLFLAG_RD, sc->msg_version,
 	    strlen(sc->msg_version), "message interface version");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "io_cmds_active", CTLFLAG_RD,
 	    &sc->io_cmds_active, 0, "number of currently active commands");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "io_cmds_highwater", CTLFLAG_RD,
 	    &sc->io_cmds_highwater, 0, "maximum active commands seen");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "chain_free", CTLFLAG_RD,
 	    &sc->chain_free, 0, "number of free chain elements");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "chain_free_lowwater", CTLFLAG_RD,
 	    &sc->chain_free_lowwater, 0,"lowest number of free chain elements");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_chains", CTLFLAG_RD,
 	    &sc->max_chains, 0,"maximum chain frames that will be allocated");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_io_pages", CTLFLAG_RD,
 	    &sc->max_io_pages, 0,"maximum pages to allow per I/O (if <1 use "
 	    "IOCFacts)");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "enable_ssu", CTLFLAG_RW, &sc->enable_ssu, 0,
 	    "enable SSU to SATA SSD/HDD at shutdown");
 
 	SYSCTL_ADD_UQUAD(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "chain_alloc_fail", CTLFLAG_RD,
 	    &sc->chain_alloc_fail, "chain allocation failures");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "spinup_wait_time", CTLFLAG_RD,
 	    &sc->spinup_wait_time, DEFAULT_SPINUP_WAIT, "seconds to wait for "
 	    "spinup after SATA ID error");
 
 	SYSCTL_ADD_PROC(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "dump_reqs",
 	    CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_SKIP | CTLFLAG_NEEDGIANT,
 	    sc, 0, mpr_dump_reqs, "I", "Dump Active Requests");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "use_phy_num", CTLFLAG_RD, &sc->use_phynum, 0,
 	    "Use the phy number for enumeration");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "prp_pages_free", CTLFLAG_RD,
 	    &sc->prp_pages_free, 0, "number of free PRP pages");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "prp_pages_free_lowwater", CTLFLAG_RD,
 	    &sc->prp_pages_free_lowwater, 0,"lowest number of free PRP pages");
 
 	SYSCTL_ADD_UQUAD(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "prp_page_alloc_fail", CTLFLAG_RD,
 	    &sc->prp_page_alloc_fail, "PRP page allocation failures");
 }
 
 static struct mpr_debug_string {
 	char *name;
 	int flag;
 } mpr_debug_strings[] = {
 	{"info", MPR_INFO},
 	{"fault", MPR_FAULT},
 	{"event", MPR_EVENT},
 	{"log", MPR_LOG},
 	{"recovery", MPR_RECOVERY},
 	{"error", MPR_ERROR},
 	{"init", MPR_INIT},
 	{"xinfo", MPR_XINFO},
 	{"user", MPR_USER},
 	{"mapping", MPR_MAPPING},
 	{"trace", MPR_TRACE}
 };
 
 enum mpr_debug_level_combiner {
 	COMB_NONE,
 	COMB_ADD,
 	COMB_SUB
 };
 
 static int
 mpr_debug_sysctl(SYSCTL_HANDLER_ARGS)
 {
 	struct mpr_softc *sc;
 	struct mpr_debug_string *string;
 	struct sbuf *sbuf;
 	char *buffer;
 	size_t sz;
 	int i, len, debug, error;
 
 	sc = (struct mpr_softc *)arg1;
 
 	error = sysctl_wire_old_buffer(req, 0);
 	if (error != 0)
 		return (error);
 
 	sbuf = sbuf_new_for_sysctl(NULL, NULL, 128, req);
 	debug = sc->mpr_debug;
 
 	sbuf_printf(sbuf, "%#x", debug);
 
 	sz = sizeof(mpr_debug_strings) / sizeof(mpr_debug_strings[0]);
 	for (i = 0; i < sz; i++) {
 		string = &mpr_debug_strings[i];
 		if (debug & string->flag) 
 			sbuf_printf(sbuf, ",%s", string->name);
 	}
 
 	error = sbuf_finish(sbuf);
 	sbuf_delete(sbuf);
 
 	if (error || req->newptr == NULL)
 		return (error);
 
 	len = req->newlen - req->newidx;
 	if (len == 0)
 		return (0);
 
 	buffer = malloc(len, M_MPR, M_ZERO|M_WAITOK);
 	error = SYSCTL_IN(req, buffer, len);
 
 	mpr_parse_debug(sc, buffer);
 
 	free(buffer, M_MPR);
 	return (error);
 }
 
 static void
 mpr_parse_debug(struct mpr_softc *sc, char *list)
 {
 	struct mpr_debug_string *string;
 	enum mpr_debug_level_combiner op;
 	char *token, *endtoken;
 	size_t sz;
 	int flags, i;
 
 	if (list == NULL || *list == '\0')
 		return;
 
 	if (*list == '+') {
 		op = COMB_ADD;
 		list++;
 	} else if (*list == '-') {
 		op = COMB_SUB;
 		list++;
 	} else
 		op = COMB_NONE;
 	if (*list == '\0')
 		return;
 
 	flags = 0;
 	sz = sizeof(mpr_debug_strings) / sizeof(mpr_debug_strings[0]);
 	while ((token = strsep(&list, ":,")) != NULL) {
 		/* Handle integer flags */
 		flags |= strtol(token, &endtoken, 0);
 		if (token != endtoken)
 			continue;
 
 		/* Handle text flags */
 		for (i = 0; i < sz; i++) {
 			string = &mpr_debug_strings[i];
 			if (strcasecmp(token, string->name) == 0) {
 				flags |= string->flag;
 				break;
 			}
 		}
 	}
 
 	switch (op) {
 	case COMB_NONE:
 		sc->mpr_debug = flags;
 		break;
 	case COMB_ADD:
 		sc->mpr_debug |= flags;
 		break;
 	case COMB_SUB:
 		sc->mpr_debug &= (~flags);
 		break;
 	}
 	return;
 }
 
 struct mpr_dumpreq_hdr {
 	uint32_t	smid;
 	uint32_t	state;
 	uint32_t	numframes;
 	uint32_t	deschi;
 	uint32_t	desclo;
 };
 
 static int
 mpr_dump_reqs(SYSCTL_HANDLER_ARGS)
 {
 	struct mpr_softc *sc;
 	struct mpr_chain *chain, *chain1;
 	struct mpr_command *cm;
 	struct mpr_dumpreq_hdr hdr;
 	struct sbuf *sb;
 	uint32_t smid, state;
 	int i, numreqs, error = 0;
 
 	sc = (struct mpr_softc *)arg1;
 
 	if ((error = priv_check(curthread, PRIV_DRIVER)) != 0) {
 		printf("priv check error %d\n", error);
 		return (error);
 	}
 
 	state = MPR_CM_STATE_INQUEUE;
 	smid = 1;
 	numreqs = sc->num_reqs;
 
 	if (req->newptr != NULL)
 		return (EINVAL);
 
 	if (smid == 0 || smid > sc->num_reqs)
 		return (EINVAL);
 	if (numreqs <= 0 || (numreqs + smid > sc->num_reqs))
 		numreqs = sc->num_reqs;
 	sb = sbuf_new_for_sysctl(NULL, NULL, 4096, req);
 
 	/* Best effort, no locking */
 	for (i = smid; i < numreqs; i++) {
 		cm = &sc->commands[i];
 		if (cm->cm_state != state)
 			continue;
 		hdr.smid = i;
 		hdr.state = cm->cm_state;
 		hdr.numframes = 1;
 		hdr.deschi = cm->cm_desc.Words.High;
 		hdr.desclo = cm->cm_desc.Words.Low;
 		TAILQ_FOREACH_SAFE(chain, &cm->cm_chain_list, chain_link,
 		   chain1)
 			hdr.numframes++;
 		sbuf_bcat(sb, &hdr, sizeof(hdr));
 		sbuf_bcat(sb, cm->cm_req, 128);
 		TAILQ_FOREACH_SAFE(chain, &cm->cm_chain_list, chain_link,
 		    chain1)
 			sbuf_bcat(sb, chain->chain, 128);
 	}
 
 	error = sbuf_finish(sb);
 	sbuf_delete(sb);
 	return (error);
 }
 
 int
 mpr_attach(struct mpr_softc *sc)
 {
 	int error;
 
 	MPR_FUNCTRACE(sc);
 	mpr_dprint(sc, MPR_INIT, "%s entered\n", __func__);
 
 	mtx_init(&sc->mpr_mtx, "MPR lock", NULL, MTX_DEF);
 	callout_init_mtx(&sc->periodic, &sc->mpr_mtx, 0);
 	callout_init_mtx(&sc->device_check_callout, &sc->mpr_mtx, 0);
 	TAILQ_INIT(&sc->event_list);
 	timevalclear(&sc->lastfail);
 
 	if ((error = mpr_transition_ready(sc)) != 0) {
 		mpr_dprint(sc, MPR_INIT|MPR_FAULT,
 		    "Failed to transition ready\n");
 		return (error);
 	}
 
 	sc->facts = malloc(sizeof(MPI2_IOC_FACTS_REPLY), M_MPR,
 	    M_ZERO|M_NOWAIT);
 	if (!sc->facts) {
 		mpr_dprint(sc, MPR_INIT|MPR_FAULT,
 		    "Cannot allocate memory, exit\n");
 		return (ENOMEM);
 	}
 
 	/*
 	 * Get IOC Facts and allocate all structures based on this information.
 	 * A Diag Reset will also call mpr_iocfacts_allocate and re-read the IOC
 	 * Facts. If relevant values have changed in IOC Facts, this function
 	 * will free all of the memory based on IOC Facts and reallocate that
 	 * memory.  If this fails, any allocated memory should already be freed.
 	 */
 	if ((error = mpr_iocfacts_allocate(sc, TRUE)) != 0) {
 		mpr_dprint(sc, MPR_INIT|MPR_FAULT, "IOC Facts allocation "
 		    "failed with error %d\n", error);
 		return (error);
 	}
 
 	/* Start the periodic watchdog check on the IOC Doorbell */
 	mpr_periodic(sc);
 
 	/*
 	 * The portenable will kick off discovery events that will drive the
 	 * rest of the initialization process.  The CAM/SAS module will
 	 * hold up the boot sequence until discovery is complete.
 	 */
 	sc->mpr_ich.ich_func = mpr_startup;
 	sc->mpr_ich.ich_arg = sc;
 	if (config_intrhook_establish(&sc->mpr_ich) != 0) {
 		mpr_dprint(sc, MPR_INIT|MPR_ERROR,
 		    "Cannot establish MPR config hook\n");
 		error = EINVAL;
 	}
 
 	/*
 	 * Allow IR to shutdown gracefully when shutdown occurs.
 	 */
 	sc->shutdown_eh = EVENTHANDLER_REGISTER(shutdown_final,
 	    mprsas_ir_shutdown, sc, SHUTDOWN_PRI_DEFAULT);
 
 	if (sc->shutdown_eh == NULL)
 		mpr_dprint(sc, MPR_INIT|MPR_ERROR,
 		    "shutdown event registration failed\n");
 
 	mpr_setup_sysctl(sc);
 
 	sc->mpr_flags |= MPR_FLAGS_ATTACH_DONE;
 	mpr_dprint(sc, MPR_INIT, "%s exit error= %d\n", __func__, error);
 
 	return (error);
 }
 
 /* Run through any late-start handlers. */
 static void
 mpr_startup(void *arg)
 {
 	struct mpr_softc *sc;
 
 	sc = (struct mpr_softc *)arg;
 	mpr_dprint(sc, MPR_INIT, "%s entered\n", __func__);
 
 	mpr_lock(sc);
 	mpr_unmask_intr(sc);
 
 	/* initialize device mapping tables */
 	mpr_base_static_config_pages(sc);
 	mpr_mapping_initialize(sc);
 	mprsas_startup(sc);
 	mpr_unlock(sc);
 
 	mpr_dprint(sc, MPR_INIT, "disestablish config intrhook\n");
 	config_intrhook_disestablish(&sc->mpr_ich);
 	sc->mpr_ich.ich_arg = NULL;
 
 	mpr_dprint(sc, MPR_INIT, "%s exit\n", __func__);
 }
 
 /* Periodic watchdog.  Is called with the driver lock already held. */
 static void
 mpr_periodic(void *arg)
 {
 	struct mpr_softc *sc;
 	uint32_t db;
 
 	sc = (struct mpr_softc *)arg;
 	if (sc->mpr_flags & MPR_FLAGS_SHUTDOWN)
 		return;
 
 	db = mpr_regread(sc, MPI2_DOORBELL_OFFSET);
 	if ((db & MPI2_IOC_STATE_MASK) == MPI2_IOC_STATE_FAULT) {
 		if ((db & MPI2_DOORBELL_FAULT_CODE_MASK) ==
 		    IFAULT_IOP_OVER_TEMP_THRESHOLD_EXCEEDED) {
 			panic("TEMPERATURE FAULT: STOPPING.");
 		}
 		mpr_dprint(sc, MPR_FAULT, "IOC Fault 0x%08x, Resetting\n", db);
 		mpr_reinit(sc);
 	}
 
 	callout_reset(&sc->periodic, MPR_PERIODIC_DELAY * hz, mpr_periodic, sc);
 }
 
 static void
 mpr_log_evt_handler(struct mpr_softc *sc, uintptr_t data,
     MPI2_EVENT_NOTIFICATION_REPLY *event)
 {
 	MPI2_EVENT_DATA_LOG_ENTRY_ADDED *entry;
 
 	MPR_DPRINT_EVENT(sc, generic, event);
 
 	switch (event->Event) {
 	case MPI2_EVENT_LOG_DATA:
 		mpr_dprint(sc, MPR_EVENT, "MPI2_EVENT_LOG_DATA:\n");
 		if (sc->mpr_debug & MPR_EVENT)
 			hexdump(event->EventData, event->EventDataLength, NULL,
 			    0);
 		break;
 	case MPI2_EVENT_LOG_ENTRY_ADDED:
 		entry = (MPI2_EVENT_DATA_LOG_ENTRY_ADDED *)event->EventData;
 		mpr_dprint(sc, MPR_EVENT, "MPI2_EVENT_LOG_ENTRY_ADDED event "
 		    "0x%x Sequence %d:\n", entry->LogEntryQualifier,
 		     entry->LogSequence);
 		break;
 	default:
 		break;
 	}
 	return;
 }
 
 static int
 mpr_attach_log(struct mpr_softc *sc)
 {
 	uint8_t events[16];
 
 	bzero(events, 16);
 	setbit(events, MPI2_EVENT_LOG_DATA);
 	setbit(events, MPI2_EVENT_LOG_ENTRY_ADDED);
 
 	mpr_register_events(sc, events, mpr_log_evt_handler, NULL,
 	    &sc->mpr_log_eh);
 
 	return (0);
 }
 
 static int
 mpr_detach_log(struct mpr_softc *sc)
 {
 
 	if (sc->mpr_log_eh != NULL)
 		mpr_deregister_events(sc, sc->mpr_log_eh);
 	return (0);
 }
 
 /*
  * Free all of the driver resources and detach submodules.  Should be called
  * without the lock held.
  */
 int
 mpr_free(struct mpr_softc *sc)
 {
 	int error;
 
 	mpr_dprint(sc, MPR_INIT, "%s entered\n", __func__);
 	/* Turn off the watchdog */
 	mpr_lock(sc);
 	sc->mpr_flags |= MPR_FLAGS_SHUTDOWN;
 	mpr_unlock(sc);
 	/* Lock must not be held for this */
 	callout_drain(&sc->periodic);
 	callout_drain(&sc->device_check_callout);
 
 	if (((error = mpr_detach_log(sc)) != 0) ||
 	    ((error = mpr_detach_sas(sc)) != 0)) {
 		mpr_dprint(sc, MPR_INIT|MPR_FAULT, "failed to detach "
 		    "subsystems, error= %d, exit\n", error);
 		return (error);
 	}
 
 	mpr_detach_user(sc);
 
 	/* Put the IOC back in the READY state. */
 	mpr_lock(sc);
 	if ((error = mpr_transition_ready(sc)) != 0) {
 		mpr_unlock(sc);
 		return (error);
 	}
 	mpr_unlock(sc);
 
 	if (sc->facts != NULL)
 		free(sc->facts, M_MPR);
 
 	/*
 	 * Free all buffers that are based on IOC Facts.  A Diag Reset may need
 	 * to free these buffers too.
 	 */
 	mpr_iocfacts_free(sc);
 
 	if (sc->sysctl_tree != NULL)
 		sysctl_ctx_free(&sc->sysctl_ctx);
 
 	/* Deregister the shutdown function */
 	if (sc->shutdown_eh != NULL)
 		EVENTHANDLER_DEREGISTER(shutdown_final, sc->shutdown_eh);
 
 	mtx_destroy(&sc->mpr_mtx);
 	mpr_dprint(sc, MPR_INIT, "%s exit\n", __func__);
 
 	return (0);
 }
 
 static __inline void
 mpr_complete_command(struct mpr_softc *sc, struct mpr_command *cm)
 {
 	MPR_FUNCTRACE(sc);
 
 	if (cm == NULL) {
 		mpr_dprint(sc, MPR_ERROR, "Completing NULL command\n");
 		return;
 	}
 
 	cm->cm_state = MPR_CM_STATE_BUSY;
 	if (cm->cm_flags & MPR_CM_FLAGS_POLLED)
 		cm->cm_flags |= MPR_CM_FLAGS_COMPLETE;
 
 	if (cm->cm_complete != NULL) {
 		mpr_dprint(sc, MPR_TRACE,
 		    "%s cm %p calling cm_complete %p data %p reply %p\n",
 		    __func__, cm, cm->cm_complete, cm->cm_complete_data,
 		    cm->cm_reply);
 		cm->cm_complete(sc, cm);
 	}
 
 	if (cm->cm_flags & MPR_CM_FLAGS_WAKEUP) {
 		mpr_dprint(sc, MPR_TRACE, "waking up %p\n", cm);
 		wakeup(cm);
 	}
 
 	if (sc->io_cmds_active != 0) {
 		sc->io_cmds_active--;
 	} else {
 		mpr_dprint(sc, MPR_ERROR, "Warning: io_cmds_active is "
 		    "out of sync - resynching to 0\n");
 	}
 }
 
 static void
 mpr_sas_log_info(struct mpr_softc *sc , u32 log_info)
 {
 	union loginfo_type {
 		u32	loginfo;
 		struct {
 			u32	subcode:16;
 			u32	code:8;
 			u32	originator:4;
 			u32	bus_type:4;
 		} dw;
 	};
 	union loginfo_type sas_loginfo;
 	char *originator_str = NULL;
 
 	sas_loginfo.loginfo = log_info;
 	if (sas_loginfo.dw.bus_type != 3 /*SAS*/)
 		return;
 
 	/* each nexus loss loginfo */
 	if (log_info == 0x31170000)
 		return;
 
 	/* eat the loginfos associated with task aborts */
 	if ((log_info == 30050000) || (log_info == 0x31140000) ||
 	    (log_info == 0x31130000))
 		return;
 
 	switch (sas_loginfo.dw.originator) {
 	case 0:
 		originator_str = "IOP";
 		break;
 	case 1:
 		originator_str = "PL";
 		break;
 	case 2:
 		originator_str = "IR";
 		break;
 	}
 
 	mpr_dprint(sc, MPR_LOG, "log_info(0x%08x): originator(%s), "
 	    "code(0x%02x), sub_code(0x%04x)\n", log_info, originator_str,
 	    sas_loginfo.dw.code, sas_loginfo.dw.subcode);
 }
 
 static void
 mpr_display_reply_info(struct mpr_softc *sc, uint8_t *reply)
 {
 	MPI2DefaultReply_t *mpi_reply;
 	u16 sc_status;
 
 	mpi_reply = (MPI2DefaultReply_t*)reply;
 	sc_status = le16toh(mpi_reply->IOCStatus);
 	if (sc_status & MPI2_IOCSTATUS_FLAG_LOG_INFO_AVAILABLE)
 		mpr_sas_log_info(sc, le32toh(mpi_reply->IOCLogInfo));
 }
 
 void
 mpr_intr(void *data)
 {
 	struct mpr_softc *sc;
 	uint32_t status;
 
 	sc = (struct mpr_softc *)data;
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 
 	/*
 	 * Check interrupt status register to flush the bus.  This is
 	 * needed for both INTx interrupts and driver-driven polling
 	 */
 	status = mpr_regread(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET);
 	if ((status & MPI2_HIS_REPLY_DESCRIPTOR_INTERRUPT) == 0)
 		return;
 
 	mpr_lock(sc);
 	mpr_intr_locked(data);
 	mpr_unlock(sc);
 	return;
 }
 
 /*
  * In theory, MSI/MSIX interrupts shouldn't need to read any registers on the
  * chip.  Hopefully this theory is correct.
  */
 void
 mpr_intr_msi(void *data)
 {
 	struct mpr_softc *sc;
 
 	sc = (struct mpr_softc *)data;
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 	mpr_lock(sc);
 	mpr_intr_locked(data);
 	mpr_unlock(sc);
 	return;
 }
 
 /*
  * The locking is overly broad and simplistic, but easy to deal with for now.
  */
 void
 mpr_intr_locked(void *data)
 {
 	MPI2_REPLY_DESCRIPTORS_UNION *desc;
 	MPI2_DIAG_RELEASE_REPLY *rel_rep;
 	mpr_fw_diagnostic_buffer_t *pBuffer;
 	struct mpr_softc *sc;
 	uint64_t tdesc;
 	struct mpr_command *cm = NULL;
 	uint8_t flags;
 	u_int pq;
 
 	sc = (struct mpr_softc *)data;
 
 	pq = sc->replypostindex;
 	mpr_dprint(sc, MPR_TRACE,
 	    "%s sc %p starting with replypostindex %u\n", 
 	    __func__, sc, sc->replypostindex);
 
 	for ( ;; ) {
 		cm = NULL;
 		desc = &sc->post_queue[sc->replypostindex];
 
 		/*
 		 * Copy and clear out the descriptor so that any reentry will
 		 * immediately know that this descriptor has already been
 		 * looked at.  There is unfortunate casting magic because the
 		 * MPI API doesn't have a cardinal 64bit type.
 		 */
 		tdesc = 0xffffffffffffffff;
 		tdesc = atomic_swap_64((uint64_t *)desc, tdesc);
 		desc = (MPI2_REPLY_DESCRIPTORS_UNION *)&tdesc;
 
 		flags = desc->Default.ReplyFlags &
 		    MPI2_RPY_DESCRIPT_FLAGS_TYPE_MASK;
 		if ((flags == MPI2_RPY_DESCRIPT_FLAGS_UNUSED) ||
 		    (le32toh(desc->Words.High) == 0xffffffff))
 			break;
 
 		/* increment the replypostindex now, so that event handlers
 		 * and cm completion handlers which decide to do a diag
 		 * reset can zero it without it getting incremented again
 		 * afterwards, and we break out of this loop on the next
 		 * iteration since the reply post queue has been cleared to
 		 * 0xFF and all descriptors look unused (which they are).
 		 */
 		if (++sc->replypostindex >= sc->pqdepth)
 			sc->replypostindex = 0;
 
 		switch (flags) {
 		case MPI2_RPY_DESCRIPT_FLAGS_SCSI_IO_SUCCESS:
 		case MPI25_RPY_DESCRIPT_FLAGS_FAST_PATH_SCSI_IO_SUCCESS:
 		case MPI26_RPY_DESCRIPT_FLAGS_PCIE_ENCAPSULATED_SUCCESS:
 			cm = &sc->commands[le16toh(desc->SCSIIOSuccess.SMID)];
 			KASSERT(cm->cm_state == MPR_CM_STATE_INQUEUE,
 			    ("command not inqueue\n"));
 			cm->cm_state = MPR_CM_STATE_BUSY;
 			cm->cm_reply = NULL;
 			break;
 		case MPI2_RPY_DESCRIPT_FLAGS_ADDRESS_REPLY:
 		{
 			uint32_t baddr;
 			uint8_t *reply;
 
 			/*
 			 * Re-compose the reply address from the address
 			 * sent back from the chip.  The ReplyFrameAddress
 			 * is the lower 32 bits of the physical address of
 			 * particular reply frame.  Convert that address to
 			 * host format, and then use that to provide the
 			 * offset against the virtual address base
 			 * (sc->reply_frames).
 			 */
 			baddr = le32toh(desc->AddressReply.ReplyFrameAddress);
 			reply = sc->reply_frames +
 				(baddr - ((uint32_t)sc->reply_busaddr));
 			/*
 			 * Make sure the reply we got back is in a valid
 			 * range.  If not, go ahead and panic here, since
 			 * we'll probably panic as soon as we deference the
 			 * reply pointer anyway.
 			 */
 			if ((reply < sc->reply_frames)
 			 || (reply > (sc->reply_frames +
 			     (sc->fqdepth * sc->replyframesz)))) {
 				printf("%s: WARNING: reply %p out of range!\n",
 				       __func__, reply);
 				printf("%s: reply_frames %p, fqdepth %d, "
 				       "frame size %d\n", __func__,
 				       sc->reply_frames, sc->fqdepth,
 				       sc->replyframesz);
 				printf("%s: baddr %#x,\n", __func__, baddr);
 				/* LSI-TODO. See Linux Code for Graceful exit */
 				panic("Reply address out of range");
 			}
 			if (le16toh(desc->AddressReply.SMID) == 0) {
 				if (((MPI2_DEFAULT_REPLY *)reply)->Function ==
 				    MPI2_FUNCTION_DIAG_BUFFER_POST) {
 					/*
 					 * If SMID is 0 for Diag Buffer Post,
 					 * this implies that the reply is due to
 					 * a release function with a status that
 					 * the buffer has been released.  Set
 					 * the buffer flags accordingly.
 					 */
 					rel_rep =
 					    (MPI2_DIAG_RELEASE_REPLY *)reply;
 					if ((le16toh(rel_rep->IOCStatus) &
 					    MPI2_IOCSTATUS_MASK) ==
 					    MPI2_IOCSTATUS_DIAGNOSTIC_RELEASED)
 					{
 						pBuffer =
 						    &sc->fw_diag_buffer_list[
 						    rel_rep->BufferType];
 						pBuffer->valid_data = TRUE;
 						pBuffer->owned_by_firmware =
 						    FALSE;
 						pBuffer->immediate = FALSE;
 					}
 				} else
 					mpr_dispatch_event(sc, baddr,
 					    (MPI2_EVENT_NOTIFICATION_REPLY *)
 					    reply);
 			} else {
 				cm = &sc->commands[
 				    le16toh(desc->AddressReply.SMID)];
 				if (cm->cm_state == MPR_CM_STATE_INQUEUE) {
 					cm->cm_reply = reply;
 					cm->cm_reply_data =
 					    le32toh(desc->AddressReply.
 						ReplyFrameAddress);
 				} else {
 					mpr_dprint(sc, MPR_RECOVERY,
 					    "Bad state for ADDRESS_REPLY status,"
 					    " ignoring state %d cm %p\n",
 					    cm->cm_state, cm);
 				}
 			}
 			break;
 		}
 		case MPI2_RPY_DESCRIPT_FLAGS_TARGETASSIST_SUCCESS:
 		case MPI2_RPY_DESCRIPT_FLAGS_TARGET_COMMAND_BUFFER:
 		case MPI2_RPY_DESCRIPT_FLAGS_RAID_ACCELERATOR_SUCCESS:
 		default:
 			/* Unhandled */
 			mpr_dprint(sc, MPR_ERROR, "Unhandled reply 0x%x\n",
 			    desc->Default.ReplyFlags);
 			cm = NULL;
 			break;
 		}
 
 		if (cm != NULL) {
 			// Print Error reply frame
 			if (cm->cm_reply)
 				mpr_display_reply_info(sc,cm->cm_reply);
 			mpr_complete_command(sc, cm);
 		}
 	}
 
 	if (pq != sc->replypostindex) {
 		mpr_dprint(sc, MPR_TRACE, "%s sc %p writing postindex %d\n",
 		    __func__, sc, sc->replypostindex);
 		mpr_regwrite(sc, MPI2_REPLY_POST_HOST_INDEX_OFFSET,
 		    sc->replypostindex);
 	}
 
 	return;
 }
 
 static void
 mpr_dispatch_event(struct mpr_softc *sc, uintptr_t data,
     MPI2_EVENT_NOTIFICATION_REPLY *reply)
 {
 	struct mpr_event_handle *eh;
 	int event, handled = 0;
 
 	event = le16toh(reply->Event);
 	TAILQ_FOREACH(eh, &sc->event_list, eh_list) {
 		if (isset(eh->mask, event)) {
 			eh->callback(sc, data, reply);
 			handled++;
 		}
 	}
 
 	if (handled == 0)
 		mpr_dprint(sc, MPR_EVENT, "Unhandled event 0x%x\n",
 		    le16toh(event));
 
 	/*
 	 * This is the only place that the event/reply should be freed.
 	 * Anything wanting to hold onto the event data should have
 	 * already copied it into their own storage.
 	 */
 	mpr_free_reply(sc, data);
 }
 
 static void
 mpr_reregister_events_complete(struct mpr_softc *sc, struct mpr_command *cm)
 {
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 
 	if (cm->cm_reply)
 		MPR_DPRINT_EVENT(sc, generic,
 			(MPI2_EVENT_NOTIFICATION_REPLY *)cm->cm_reply);
 
 	mpr_free_command(sc, cm);
 
 	/* next, send a port enable */
 	mprsas_startup(sc);
 }
 
 /*
  * For both register_events and update_events, the caller supplies a bitmap
  * of events that it _wants_.  These functions then turn that into a bitmask
  * suitable for the controller.
  */
 int
 mpr_register_events(struct mpr_softc *sc, uint8_t *mask,
     mpr_evt_callback_t *cb, void *data, struct mpr_event_handle **handle)
 {
 	struct mpr_event_handle *eh;
 	int error = 0;
 
 	eh = malloc(sizeof(struct mpr_event_handle), M_MPR, M_WAITOK|M_ZERO);
 	eh->callback = cb;
 	eh->data = data;
 	TAILQ_INSERT_TAIL(&sc->event_list, eh, eh_list);
 	if (mask != NULL)
 		error = mpr_update_events(sc, eh, mask);
 	*handle = eh;
 
 	return (error);
 }
 
 int
 mpr_update_events(struct mpr_softc *sc, struct mpr_event_handle *handle,
     uint8_t *mask)
 {
 	MPI2_EVENT_NOTIFICATION_REQUEST *evtreq;
 	MPI2_EVENT_NOTIFICATION_REPLY *reply = NULL;
 	struct mpr_command *cm = NULL;
 	struct mpr_event_handle *eh;
 	int error, i;
 
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 
 	if ((mask != NULL) && (handle != NULL))
 		bcopy(mask, &handle->mask[0], 16);
 	memset(sc->event_mask, 0xff, 16);
 
 	TAILQ_FOREACH(eh, &sc->event_list, eh_list) {
 		for (i = 0; i < 16; i++)
 			sc->event_mask[i] &= ~eh->mask[i];
 	}
 
 	if ((cm = mpr_alloc_command(sc)) == NULL)
 		return (EBUSY);
 	evtreq = (MPI2_EVENT_NOTIFICATION_REQUEST *)cm->cm_req;
 	evtreq->Function = MPI2_FUNCTION_EVENT_NOTIFICATION;
 	evtreq->MsgFlags = 0;
 	evtreq->SASBroadcastPrimitiveMasks = 0;
 #ifdef MPR_DEBUG_ALL_EVENTS
 	{
 		u_char fullmask[16];
 		memset(fullmask, 0x00, 16);
 		bcopy(fullmask, (uint8_t *)&evtreq->EventMasks, 16);
 	}
 #else
 		bcopy(sc->event_mask, (uint8_t *)&evtreq->EventMasks, 16);
 #endif
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_data = NULL;
 
 	error = mpr_request_polled(sc, &cm);
 	if (cm != NULL)
 		reply = (MPI2_EVENT_NOTIFICATION_REPLY *)cm->cm_reply;
 	if ((reply == NULL) ||
 	    (reply->IOCStatus & MPI2_IOCSTATUS_MASK) != MPI2_IOCSTATUS_SUCCESS)
 		error = ENXIO;
 
 	if (reply)
 		MPR_DPRINT_EVENT(sc, generic, reply);
 
 	mpr_dprint(sc, MPR_TRACE, "%s finished error %d\n", __func__, error);
 
 	if (cm != NULL)
 		mpr_free_command(sc, cm);
 	return (error);
 }
 
 static int
 mpr_reregister_events(struct mpr_softc *sc)
 {
 	MPI2_EVENT_NOTIFICATION_REQUEST *evtreq;
 	struct mpr_command *cm;
 	struct mpr_event_handle *eh;
 	int error, i;
 
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 
 	/* first, reregister events */
 
 	memset(sc->event_mask, 0xff, 16);
 
 	TAILQ_FOREACH(eh, &sc->event_list, eh_list) {
 		for (i = 0; i < 16; i++)
 			sc->event_mask[i] &= ~eh->mask[i];
 	}
 
 	if ((cm = mpr_alloc_command(sc)) == NULL)
 		return (EBUSY);
 	evtreq = (MPI2_EVENT_NOTIFICATION_REQUEST *)cm->cm_req;
 	evtreq->Function = MPI2_FUNCTION_EVENT_NOTIFICATION;
 	evtreq->MsgFlags = 0;
 	evtreq->SASBroadcastPrimitiveMasks = 0;
 #ifdef MPR_DEBUG_ALL_EVENTS
 	{
 		u_char fullmask[16];
 		memset(fullmask, 0x00, 16);
 		bcopy(fullmask, (uint8_t *)&evtreq->EventMasks, 16);
 	}
 #else
 		bcopy(sc->event_mask, (uint8_t *)&evtreq->EventMasks, 16);
 #endif
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_data = NULL;
 	cm->cm_complete = mpr_reregister_events_complete;
 
 	error = mpr_map_command(sc, cm);
 
 	mpr_dprint(sc, MPR_TRACE, "%s finished with error %d\n", __func__,
 	    error);
 	return (error);
 }
 
 int
 mpr_deregister_events(struct mpr_softc *sc, struct mpr_event_handle *handle)
 {
 
 	TAILQ_REMOVE(&sc->event_list, handle, eh_list);
 	free(handle, M_MPR);
 	return (mpr_update_events(sc, NULL, NULL));
 }
 
 /**
 * mpr_build_nvme_prp - This function is called for NVMe end devices to build a
 * native SGL (NVMe PRP). The native SGL is built starting in the first PRP entry
 * of the NVMe message (PRP1). If the data buffer is small enough to be described
 * entirely using PRP1, then PRP2 is not used. If needed, PRP2 is used to
 * describe a larger data buffer. If the data buffer is too large to describe
 * using the two PRP entriess inside the NVMe message, then PRP1 describes the
 * first data memory segment, and PRP2 contains a pointer to a PRP list located
 * elsewhere in memory to describe the remaining data memory segments. The PRP
 * list will be contiguous.
 
 * The native SGL for NVMe devices is a Physical Region Page (PRP). A PRP
 * consists of a list of PRP entries to describe a number of noncontigous
 * physical memory segments as a single memory buffer, just as a SGL does. Note
 * however, that this function is only used by the IOCTL call, so the memory
 * given will be guaranteed to be contiguous. There is no need to translate
 * non-contiguous SGL into a PRP in this case. All PRPs will describe contiguous
 * space that is one page size each.
 *
 * Each NVMe message contains two PRP entries. The first (PRP1) either contains
 * a PRP list pointer or a PRP element, depending upon the command. PRP2 contains
 * the second PRP element if the memory being described fits within 2 PRP
 * entries, or a PRP list pointer if the PRP spans more than two entries.
 *
 * A PRP list pointer contains the address of a PRP list, structured as a linear
 * array of PRP entries. Each PRP entry in this list describes a segment of
 * physical memory.
 *
 * Each 64-bit PRP entry comprises an address and an offset field. The address
 * always points to the beginning of a PAGE_SIZE physical memory page, and the
 * offset describes where within that page the memory segment begins. Only the
 * first element in a PRP list may contain a non-zero offest, implying that all
 * memory segments following the first begin at the start of a PAGE_SIZE page.
 *
 * Each PRP element normally describes a chunck of PAGE_SIZE physical memory,
 * with exceptions for the first and last elements in the list. If the memory
 * being described by the list begins at a non-zero offset within the first page,
 * then the first PRP element will contain a non-zero offset indicating where the
 * region begins within the page. The last memory segment may end before the end
 * of the PAGE_SIZE segment, depending upon the overall size of the memory being
 * described by the PRP list. 
 *
 * Since PRP entries lack any indication of size, the overall data buffer length
 * is used to determine where the end of the data memory buffer is located, and
 * how many PRP entries are required to describe it.
 *
 * Returns nothing.
 */
 void 
 mpr_build_nvme_prp(struct mpr_softc *sc, struct mpr_command *cm,
     Mpi26NVMeEncapsulatedRequest_t *nvme_encap_request, void *data,
     uint32_t data_in_sz, uint32_t data_out_sz)
 {
 	int			prp_size = PRP_ENTRY_SIZE;
 	uint64_t		*prp_entry, *prp1_entry, *prp2_entry;
 	uint64_t		*prp_entry_phys, *prp_page, *prp_page_phys;
 	uint32_t		offset, entry_len, page_mask_result, page_mask;
 	bus_addr_t		paddr;
 	size_t			length;
 	struct mpr_prp_page	*prp_page_info = NULL;
 
 	/*
 	 * Not all commands require a data transfer. If no data, just return
 	 * without constructing any PRP.
 	 */
 	if (!data_in_sz && !data_out_sz)
 		return;
 
 	/*
 	 * Set pointers to PRP1 and PRP2, which are in the NVMe command. PRP1 is
 	 * located at a 24 byte offset from the start of the NVMe command. Then
 	 * set the current PRP entry pointer to PRP1.
 	 */
 	prp1_entry = (uint64_t *)(nvme_encap_request->NVMe_Command +
 	    NVME_CMD_PRP1_OFFSET);
 	prp2_entry = (uint64_t *)(nvme_encap_request->NVMe_Command +
 	    NVME_CMD_PRP2_OFFSET);
 	prp_entry = prp1_entry;
 
 	/*
 	 * For the PRP entries, use the specially allocated buffer of
 	 * contiguous memory. PRP Page allocation failures should not happen
 	 * because there should be enough PRP page buffers to account for the
 	 * possible NVMe QDepth.
 	 */
 	prp_page_info = mpr_alloc_prp_page(sc);
 	KASSERT(prp_page_info != NULL, ("%s: There are no PRP Pages left to be "
 	    "used for building a native NVMe SGL.\n", __func__));
 	prp_page = (uint64_t *)prp_page_info->prp_page;
 	prp_page_phys = (uint64_t *)(uintptr_t)prp_page_info->prp_page_busaddr;
 
 	/*
 	 * Insert the allocated PRP page into the command's PRP page list. This
 	 * will be freed when the command is freed.
 	 */
 	TAILQ_INSERT_TAIL(&cm->cm_prp_page_list, prp_page_info, prp_page_link);
 
 	/*
 	 * Check if we are within 1 entry of a page boundary we don't want our
 	 * first entry to be a PRP List entry.
 	 */
 	page_mask = PAGE_SIZE - 1;
 	page_mask_result = (uintptr_t)((uint8_t *)prp_page + prp_size) &
 	    page_mask;
 	if (!page_mask_result)
 	{
 		/* Bump up to next page boundary. */
 		prp_page = (uint64_t *)((uint8_t *)prp_page + prp_size);
 		prp_page_phys = (uint64_t *)((uint8_t *)prp_page_phys +
 		    prp_size);
 	}
 
 	/*
 	 * Set PRP physical pointer, which initially points to the current PRP
 	 * DMA memory page.
 	 */
 	prp_entry_phys = prp_page_phys;
 
 	/* Get physical address and length of the data buffer. */
 	paddr = (bus_addr_t)(uintptr_t)data;
 	if (data_in_sz)
 		length = data_in_sz;
 	else
 		length = data_out_sz;
 
 	/* Loop while the length is not zero. */
 	while (length)
 	{
 		/*
 		 * Check if we need to put a list pointer here if we are at page
 		 * boundary - prp_size (8 bytes).
 		 */
 		page_mask_result = (uintptr_t)((uint8_t *)prp_entry_phys +
 		    prp_size) & page_mask;
 		if (!page_mask_result)
 		{
 			/*
 			 * This is the last entry in a PRP List, so we need to
 			 * put a PRP list pointer here. What this does is:
 			 *   - bump the current memory pointer to the next
 			 *     address, which will be the next full page.
 			 *   - set the PRP Entry to point to that page. This is
 			 *     now the PRP List pointer.
 			 *   - bump the PRP Entry pointer the start of the next
 			 *     page. Since all of this PRP memory is contiguous,
 			 *     no need to get a new page - it's just the next
 			 *     address.
 			 */
 			prp_entry_phys++;
 			*prp_entry =
 			    htole64((uint64_t)(uintptr_t)prp_entry_phys);
 			prp_entry++;
 		}
 
 		/* Need to handle if entry will be part of a page. */
 		offset = (uint32_t)paddr & page_mask;
 		entry_len = PAGE_SIZE - offset;
 
 		if (prp_entry == prp1_entry)
 		{
 			/*
 			 * Must fill in the first PRP pointer (PRP1) before
 			 * moving on.
 			 */
 			*prp1_entry = htole64((uint64_t)paddr);
 
 			/*
 			 * Now point to the second PRP entry within the
 			 * command (PRP2).
 			 */
 			prp_entry = prp2_entry;
 		}
 		else if (prp_entry == prp2_entry)
 		{
 			/*
 			 * Should the PRP2 entry be a PRP List pointer or just a
 			 * regular PRP pointer? If there is more than one more
 			 * page of data, must use a PRP List pointer.
 			 */
 			if (length > PAGE_SIZE)
 			{
 				/*
 				 * PRP2 will contain a PRP List pointer because
 				 * more PRP's are needed with this command. The
 				 * list will start at the beginning of the
 				 * contiguous buffer.
 				 */
 				*prp2_entry =
 				    htole64(
 				    (uint64_t)(uintptr_t)prp_entry_phys);
 
 				/*
 				 * The next PRP Entry will be the start of the
 				 * first PRP List.
 				 */
 				prp_entry = prp_page;
 			}
 			else
 			{
 				/*
 				 * After this, the PRP Entries are complete.
 				 * This command uses 2 PRP's and no PRP list.
 				 */
 				*prp2_entry = htole64((uint64_t)paddr);
 			}
 		}
 		else
 		{
 			/*
 			 * Put entry in list and bump the addresses.
 			 *
 			 * After PRP1 and PRP2 are filled in, this will fill in
 			 * all remaining PRP entries in a PRP List, one per each
 			 * time through the loop.
 			 */
 			*prp_entry = htole64((uint64_t)paddr);
 			prp_entry++;
 			prp_entry_phys++;
 		}
 
 		/*
 		 * Bump the phys address of the command's data buffer by the
 		 * entry_len.
 		 */
 		paddr += entry_len;
 
 		/* Decrement length accounting for last partial page. */
 		if (entry_len > length)
 			length = 0;
 		else
 			length -= entry_len;
 	}
 }
 
 /*
  * mpr_check_pcie_native_sgl - This function is called for PCIe end devices to
  * determine if the driver needs to build a native SGL. If so, that native SGL
  * is built in the contiguous buffers allocated especially for PCIe SGL
  * creation. If the driver will not build a native SGL, return TRUE and a
  * normal IEEE SGL will be built. Currently this routine supports NVMe devices
  * only.
  *
  * Returns FALSE (0) if native SGL was built, TRUE (1) if no SGL was built.
  */
 static int
 mpr_check_pcie_native_sgl(struct mpr_softc *sc, struct mpr_command *cm,
     bus_dma_segment_t *segs, int segs_left)
 {
 	uint32_t		i, sge_dwords, length, offset, entry_len;
 	uint32_t		num_entries, buff_len = 0, sges_in_segment;
 	uint32_t		page_mask, page_mask_result, *curr_buff;
 	uint32_t		*ptr_sgl, *ptr_first_sgl, first_page_offset;
 	uint32_t		first_page_data_size, end_residual;
 	uint64_t		*msg_phys;
 	bus_addr_t		paddr;
 	int			build_native_sgl = 0, first_prp_entry;
 	int			prp_size = PRP_ENTRY_SIZE;
 	Mpi25IeeeSgeChain64_t	*main_chain_element = NULL;
 	struct mpr_prp_page	*prp_page_info = NULL;
 
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 
 	/*
 	 * Add up the sizes of each segment length to get the total transfer
 	 * size, which will be checked against the Maximum Data Transfer Size.
 	 * If the data transfer length exceeds the MDTS for this device, just
 	 * return 1 so a normal IEEE SGL will be built. F/W will break the I/O
 	 * up into multiple I/O's. [nvme_mdts = 0 means unlimited]
 	 */
 	for (i = 0; i < segs_left; i++)
 		buff_len += htole32(segs[i].ds_len);
 	if ((cm->cm_targ->MDTS > 0) && (buff_len > cm->cm_targ->MDTS))
 		return 1;
 
 	/* Create page_mask (to get offset within page) */
 	page_mask = PAGE_SIZE - 1;
 
 	/*
 	 * Check if the number of elements exceeds the max number that can be
 	 * put in the main message frame (H/W can only translate an SGL that
 	 * is contained entirely in the main message frame).
 	 */
 	sges_in_segment = (sc->reqframesz -
 	    offsetof(Mpi25SCSIIORequest_t, SGL)) / sizeof(MPI25_SGE_IO_UNION);
 	if (segs_left > sges_in_segment)
 		build_native_sgl = 1;
 	else
 	{
 		/*
 		 * NVMe uses one PRP for each physical page (or part of physical
 		 * page).
 		 *    if 4 pages or less then IEEE is OK
 		 *    if > 5 pages then we need to build a native SGL
 		 *    if > 4 and <= 5 pages, then check the physical address of
 		 *      the first SG entry, then if this first size in the page
 		 *      is >= the residual beyond 4 pages then use IEEE,
 		 *      otherwise use native SGL
 		 */
 		if (buff_len > (PAGE_SIZE * 5))
 			build_native_sgl = 1;
 		else if ((buff_len > (PAGE_SIZE * 4)) &&
 		    (buff_len <= (PAGE_SIZE * 5)) )
 		{
 			msg_phys = (uint64_t *)(uintptr_t)segs[0].ds_addr;
 			first_page_offset =
 			    ((uint32_t)(uint64_t)(uintptr_t)msg_phys &
 			    page_mask);
 			first_page_data_size = PAGE_SIZE - first_page_offset;
 			end_residual = buff_len % PAGE_SIZE;
 
 			/*
 			 * If offset into first page pushes the end of the data
 			 * beyond end of the 5th page, we need the extra PRP
 			 * list.
 			 */
 			if (first_page_data_size < end_residual)
 				build_native_sgl = 1;
 
 			/*
 			 * Check if first SG entry size is < residual beyond 4
 			 * pages.
 			 */
 			if (htole32(segs[0].ds_len) <
 			    (buff_len - (PAGE_SIZE * 4)))
 				build_native_sgl = 1;
 		}
 	}
 
 	/* check if native SGL is needed */
 	if (!build_native_sgl)
 		return 1;
 
 	/*
 	 * Native SGL is needed.
 	 * Put a chain element in main message frame that points to the first
 	 * chain buffer.
 	 *
 	 * NOTE:  The ChainOffset field must be 0 when using a chain pointer to
 	 *        a native SGL.
 	 */
 
 	/* Set main message chain element pointer */
 	main_chain_element = (pMpi25IeeeSgeChain64_t)cm->cm_sge;
 
 	/*
 	 * For NVMe the chain element needs to be the 2nd SGL entry in the main
 	 * message.
 	 */
 	main_chain_element = (Mpi25IeeeSgeChain64_t *)
 	    ((uint8_t *)main_chain_element + sizeof(MPI25_IEEE_SGE_CHAIN64));
 
 	/*
 	 * For the PRP entries, use the specially allocated buffer of
 	 * contiguous memory. PRP Page allocation failures should not happen
 	 * because there should be enough PRP page buffers to account for the
 	 * possible NVMe QDepth.
 	 */
 	prp_page_info = mpr_alloc_prp_page(sc);
 	KASSERT(prp_page_info != NULL, ("%s: There are no PRP Pages left to be "
 	    "used for building a native NVMe SGL.\n", __func__));
 	curr_buff = (uint32_t *)prp_page_info->prp_page;
 	msg_phys = (uint64_t *)(uintptr_t)prp_page_info->prp_page_busaddr;
 
 	/*
 	 * Insert the allocated PRP page into the command's PRP page list. This
 	 * will be freed when the command is freed.
 	 */
 	TAILQ_INSERT_TAIL(&cm->cm_prp_page_list, prp_page_info, prp_page_link);
 
 	/*
 	 * Check if we are within 1 entry of a page boundary we don't want our
 	 * first entry to be a PRP List entry.
 	 */
 	page_mask_result = (uintptr_t)((uint8_t *)curr_buff + prp_size) &
 	    page_mask;
 	if (!page_mask_result) {
 		/* Bump up to next page boundary. */
 		curr_buff = (uint32_t *)((uint8_t *)curr_buff + prp_size);
 		msg_phys = (uint64_t *)((uint8_t *)msg_phys + prp_size);
 	}
 
 	/* Fill in the chain element and make it an NVMe segment type. */
 	main_chain_element->Address.High =
 	    htole32((uint32_t)((uint64_t)(uintptr_t)msg_phys >> 32));
 	main_chain_element->Address.Low =
 	    htole32((uint32_t)(uintptr_t)msg_phys);
 	main_chain_element->NextChainOffset = 0;
 	main_chain_element->Flags = MPI2_IEEE_SGE_FLAGS_CHAIN_ELEMENT |
 	    MPI2_IEEE_SGE_FLAGS_SYSTEM_ADDR |
 	    MPI26_IEEE_SGE_FLAGS_NSF_NVME_PRP;
 
 	/* Set SGL pointer to start of contiguous PCIe buffer. */
 	ptr_sgl = curr_buff;
 	sge_dwords = 2;
 	num_entries = 0;
 
 	/*
 	 * NVMe has a very convoluted PRP format. One PRP is required for each
 	 * page or partial page. We need to split up OS SG entries if they are
 	 * longer than one page or cross a page boundary. We also have to insert
 	 * a PRP list pointer entry as the last entry in each physical page of
 	 * the PRP list.
 	 *
 	 * NOTE: The first PRP "entry" is actually placed in the first SGL entry
 	 * in the main message in IEEE 64 format. The 2nd entry in the main
 	 * message is the chain element, and the rest of the PRP entries are
 	 * built in the contiguous PCIe buffer.
 	 */
 	first_prp_entry = 1;
 	ptr_first_sgl = (uint32_t *)cm->cm_sge;
 
 	for (i = 0; i < segs_left; i++) {
 		/* Get physical address and length of this SG entry. */
 		paddr = segs[i].ds_addr;
 		length = segs[i].ds_len;
 
 		/*
 		 * Check whether a given SGE buffer lies on a non-PAGED
 		 * boundary if this is not the first page. If so, this is not
 		 * expected so have FW build the SGL.
 		 */
 		if ((i != 0) && (((uint32_t)paddr & page_mask) != 0)) {
 			mpr_dprint(sc, MPR_ERROR, "Unaligned SGE while "
 			    "building NVMe PRPs, low address is 0x%x\n",
 			    (uint32_t)paddr);
 			return 1;
 		}
 
 		/* Apart from last SGE, if any other SGE boundary is not page
 		 * aligned then it means that hole exists. Existence of hole
 		 * leads to data corruption. So fallback to IEEE SGEs.
 		 */
 		if (i != (segs_left - 1)) {
 			if (((uint32_t)paddr + length) & page_mask) {
 				mpr_dprint(sc, MPR_ERROR, "Unaligned SGE "
 				    "boundary while building NVMe PRPs, low "
 				    "address: 0x%x and length: %u\n",
 				    (uint32_t)paddr, length);
 				return 1;
 			}
 		}
 
 		/* Loop while the length is not zero. */
 		while (length) {
 			/*
 			 * Check if we need to put a list pointer here if we are
 			 * at page boundary - prp_size.
 			 */
 			page_mask_result = (uintptr_t)((uint8_t *)ptr_sgl +
 			    prp_size) & page_mask;
 			if (!page_mask_result) {
 				/*
 				 * Need to put a PRP list pointer here.
 				 */
 				msg_phys = (uint64_t *)((uint8_t *)msg_phys +
 				    prp_size);
 				*ptr_sgl = htole32((uintptr_t)msg_phys);
 				*(ptr_sgl+1) = htole32((uint64_t)(uintptr_t)
 				    msg_phys >> 32);
 				ptr_sgl += sge_dwords;
 				num_entries++;
 			}
 
 			/* Need to handle if entry will be part of a page. */
 			offset = (uint32_t)paddr & page_mask;
 			entry_len = PAGE_SIZE - offset;
 			if (first_prp_entry) {
 				/*
 				 * Put IEEE entry in first SGE in main message.
 				 * (Simple element, System addr, not end of
 				 * list.)
 				 */
 				*ptr_first_sgl = htole32((uint32_t)paddr);
 				*(ptr_first_sgl + 1) =
 				    htole32((uint32_t)((uint64_t)paddr >> 32));
 				*(ptr_first_sgl + 2) = htole32(entry_len);
 				*(ptr_first_sgl + 3) = 0;
 
 				/* No longer the first PRP entry. */
 				first_prp_entry = 0;
 			} else {
 				/* Put entry in list. */
 				*ptr_sgl = htole32((uint32_t)paddr);
 				*(ptr_sgl + 1) =
 				    htole32((uint32_t)((uint64_t)paddr >> 32));
 
 				/* Bump ptr_sgl, msg_phys, and num_entries. */
 				ptr_sgl += sge_dwords;
 				msg_phys = (uint64_t *)((uint8_t *)msg_phys +
 				    prp_size);
 				num_entries++;
 			}
 
 			/* Bump the phys address by the entry_len. */
 			paddr += entry_len;
 
 			/* Decrement length accounting for last partial page. */
 			if (entry_len > length)
 				length = 0;
 			else
 				length -= entry_len;
 		}
 	}
 
 	/* Set chain element Length. */
 	main_chain_element->Length = htole32(num_entries * prp_size);
 
 	/* Return 0, indicating we built a native SGL. */
 	return 0;
 }
 
 /*
  * Add a chain element as the next SGE for the specified command.
  * Reset cm_sge and cm_sgesize to indicate all the available space. Chains are
  * only required for IEEE commands.  Therefore there is no code for commands
  * that have the MPR_CM_FLAGS_SGE_SIMPLE flag set (and those commands
  * shouldn't be requesting chains).
  */
 static int
 mpr_add_chain(struct mpr_command *cm, int segsleft)
 {
 	struct mpr_softc *sc = cm->cm_sc;
 	MPI2_REQUEST_HEADER *req;
 	MPI25_IEEE_SGE_CHAIN64 *ieee_sgc;
 	struct mpr_chain *chain;
 	int sgc_size, current_segs, rem_segs, segs_per_frame;
 	uint8_t next_chain_offset = 0;
 
 	/*
 	 * Fail if a command is requesting a chain for SIMPLE SGE's.  For SAS3
 	 * only IEEE commands should be requesting chains.  Return some error
 	 * code other than 0.
 	 */
 	if (cm->cm_flags & MPR_CM_FLAGS_SGE_SIMPLE) {
 		mpr_dprint(sc, MPR_ERROR, "A chain element cannot be added to "
 		    "an MPI SGL.\n");
 		return(ENOBUFS);
 	}
 
 	sgc_size = sizeof(MPI25_IEEE_SGE_CHAIN64);
 	if (cm->cm_sglsize < sgc_size)
 		panic("MPR: Need SGE Error Code\n");
 
 	chain = mpr_alloc_chain(cm->cm_sc);
 	if (chain == NULL)
 		return (ENOBUFS);
 
 	/*
 	 * Note: a double-linked list is used to make it easier to walk for
 	 * debugging.
 	 */
 	TAILQ_INSERT_TAIL(&cm->cm_chain_list, chain, chain_link);
 
 	/*
 	 * Need to know if the number of frames left is more than 1 or not.  If
 	 * more than 1 frame is required, NextChainOffset will need to be set,
 	 * which will just be the last segment of the frame.
 	 */
 	rem_segs = 0;
 	if (cm->cm_sglsize < (sgc_size * segsleft)) {
 		/*
 		 * rem_segs is the number of segements remaining after the
 		 * segments that will go into the current frame.  Since it is
 		 * known that at least one more frame is required, account for
 		 * the chain element.  To know if more than one more frame is
 		 * required, just check if there will be a remainder after using
 		 * the current frame (with this chain) and the next frame.  If
 		 * so the NextChainOffset must be the last element of the next
 		 * frame.
 		 */
 		current_segs = (cm->cm_sglsize / sgc_size) - 1;
 		rem_segs = segsleft - current_segs;
 		segs_per_frame = sc->chain_frame_size / sgc_size;
 		if (rem_segs > segs_per_frame) {
 			next_chain_offset = segs_per_frame - 1;
 		}
 	}
 	ieee_sgc = &((MPI25_SGE_IO_UNION *)cm->cm_sge)->IeeeChain;
 	ieee_sgc->Length = next_chain_offset ?
 	    htole32((uint32_t)sc->chain_frame_size) :
 	    htole32((uint32_t)rem_segs * (uint32_t)sgc_size);
 	ieee_sgc->NextChainOffset = next_chain_offset;
 	ieee_sgc->Flags = (MPI2_IEEE_SGE_FLAGS_CHAIN_ELEMENT |
 	    MPI2_IEEE_SGE_FLAGS_SYSTEM_ADDR);
 	ieee_sgc->Address.Low = htole32(chain->chain_busaddr);
 	ieee_sgc->Address.High = htole32(chain->chain_busaddr >> 32);
 	cm->cm_sge = &((MPI25_SGE_IO_UNION *)chain->chain)->IeeeSimple;
 	req = (MPI2_REQUEST_HEADER *)cm->cm_req;
 	req->ChainOffset = (sc->chain_frame_size - sgc_size) >> 4;
 
 	cm->cm_sglsize = sc->chain_frame_size;
 	return (0);
 }
 
 /*
  * Add one scatter-gather element to the scatter-gather list for a command.
  * Maintain cm_sglsize and cm_sge as the remaining size and pointer to the
  * next SGE to fill in, respectively.  In Gen3, the MPI SGL does not have a
  * chain, so don't consider any chain additions.
  */
 int
 mpr_push_sge(struct mpr_command *cm, MPI2_SGE_SIMPLE64 *sge, size_t len,
     int segsleft)
 {
 	uint32_t saved_buf_len, saved_address_low, saved_address_high;
 	u32 sge_flags;
 
 	/*
 	 * case 1: >=1 more segment, no room for anything (error)
 	 * case 2: 1 more segment and enough room for it
          */
 
 	if (cm->cm_sglsize < (segsleft * sizeof(MPI2_SGE_SIMPLE64))) {
 		mpr_dprint(cm->cm_sc, MPR_ERROR,
 		    "%s: warning: Not enough room for MPI SGL in frame.\n",
 		    __func__);
 		return(ENOBUFS);
 	}
 
 	KASSERT(segsleft == 1,
 	    ("segsleft cannot be more than 1 for an MPI SGL; segsleft = %d\n",
 	    segsleft));
 
 	/*
 	 * There is one more segment left to add for the MPI SGL and there is
 	 * enough room in the frame to add it.  This is the normal case because
 	 * MPI SGL's don't have chains, otherwise something is wrong.
 	 *
 	 * If this is a bi-directional request, need to account for that
 	 * here.  Save the pre-filled sge values.  These will be used
 	 * either for the 2nd SGL or for a single direction SGL.  If
 	 * cm_out_len is non-zero, this is a bi-directional request, so
 	 * fill in the OUT SGL first, then the IN SGL, otherwise just
 	 * fill in the IN SGL.  Note that at this time, when filling in
 	 * 2 SGL's for a bi-directional request, they both use the same
 	 * DMA buffer (same cm command).
 	 */
 	saved_buf_len = sge->FlagsLength & 0x00FFFFFF;
 	saved_address_low = sge->Address.Low;
 	saved_address_high = sge->Address.High;
 	if (cm->cm_out_len) {
 		sge->FlagsLength = cm->cm_out_len |
 		    ((uint32_t)(MPI2_SGE_FLAGS_SIMPLE_ELEMENT |
 		    MPI2_SGE_FLAGS_END_OF_BUFFER |
 		    MPI2_SGE_FLAGS_HOST_TO_IOC |
 		    MPI2_SGE_FLAGS_64_BIT_ADDRESSING) <<
 		    MPI2_SGE_FLAGS_SHIFT);
 		cm->cm_sglsize -= len;
 		/* Endian Safe code */
 		sge_flags = sge->FlagsLength;
 		sge->FlagsLength = htole32(sge_flags);
 		sge->Address.High = htole32(sge->Address.High);	
 		sge->Address.Low = htole32(sge->Address.Low);
 		bcopy(sge, cm->cm_sge, len);
 		cm->cm_sge = (MPI2_SGE_IO_UNION *)((uintptr_t)cm->cm_sge + len);
 	}
 	sge->FlagsLength = saved_buf_len |
 	    ((uint32_t)(MPI2_SGE_FLAGS_SIMPLE_ELEMENT |
 	    MPI2_SGE_FLAGS_END_OF_BUFFER |
 	    MPI2_SGE_FLAGS_LAST_ELEMENT |
 	    MPI2_SGE_FLAGS_END_OF_LIST |
 	    MPI2_SGE_FLAGS_64_BIT_ADDRESSING) <<
 	    MPI2_SGE_FLAGS_SHIFT);
 	if (cm->cm_flags & MPR_CM_FLAGS_DATAIN) {
 		sge->FlagsLength |=
 		    ((uint32_t)(MPI2_SGE_FLAGS_IOC_TO_HOST) <<
 		    MPI2_SGE_FLAGS_SHIFT);
 	} else {
 		sge->FlagsLength |=
 		    ((uint32_t)(MPI2_SGE_FLAGS_HOST_TO_IOC) <<
 		    MPI2_SGE_FLAGS_SHIFT);
 	}
 	sge->Address.Low = saved_address_low;
 	sge->Address.High = saved_address_high;
 
 	cm->cm_sglsize -= len;
 	/* Endian Safe code */
 	sge_flags = sge->FlagsLength;
 	sge->FlagsLength = htole32(sge_flags);
 	sge->Address.High = htole32(sge->Address.High);	
 	sge->Address.Low = htole32(sge->Address.Low);
 	bcopy(sge, cm->cm_sge, len);
 	cm->cm_sge = (MPI2_SGE_IO_UNION *)((uintptr_t)cm->cm_sge + len);
 	return (0);
 }
 
 /*
  * Add one IEEE scatter-gather element (chain or simple) to the IEEE scatter-
  * gather list for a command.  Maintain cm_sglsize and cm_sge as the
  * remaining size and pointer to the next SGE to fill in, respectively.
  */
 int
 mpr_push_ieee_sge(struct mpr_command *cm, void *sgep, int segsleft)
 {
 	MPI2_IEEE_SGE_SIMPLE64 *sge = sgep;
 	int error, ieee_sge_size = sizeof(MPI25_SGE_IO_UNION);
 	uint32_t saved_buf_len, saved_address_low, saved_address_high;
 	uint32_t sge_length;
 
 	/*
 	 * case 1: No room for chain or segment (error).
 	 * case 2: Two or more segments left but only room for chain.
 	 * case 3: Last segment and room for it, so set flags.
 	 */
 
 	/*
 	 * There should be room for at least one element, or there is a big
 	 * problem.
 	 */
 	if (cm->cm_sglsize < ieee_sge_size)
 		panic("MPR: Need SGE Error Code\n");
 
 	if ((segsleft >= 2) && (cm->cm_sglsize < (ieee_sge_size * 2))) {
 		if ((error = mpr_add_chain(cm, segsleft)) != 0)
 			return (error);
 	}
 
 	if (segsleft == 1) {
 		/*
 		 * If this is a bi-directional request, need to account for that
 		 * here.  Save the pre-filled sge values.  These will be used
 		 * either for the 2nd SGL or for a single direction SGL.  If
 		 * cm_out_len is non-zero, this is a bi-directional request, so
 		 * fill in the OUT SGL first, then the IN SGL, otherwise just
 		 * fill in the IN SGL.  Note that at this time, when filling in
 		 * 2 SGL's for a bi-directional request, they both use the same
 		 * DMA buffer (same cm command).
 		 */
 		saved_buf_len = sge->Length;
 		saved_address_low = sge->Address.Low;
 		saved_address_high = sge->Address.High;
 		if (cm->cm_out_len) {
 			sge->Length = cm->cm_out_len;
 			sge->Flags = (MPI2_IEEE_SGE_FLAGS_SIMPLE_ELEMENT |
 			    MPI2_IEEE_SGE_FLAGS_SYSTEM_ADDR);
 			cm->cm_sglsize -= ieee_sge_size;
 			/* Endian Safe code */
 			sge_length = sge->Length;
 			sge->Length = htole32(sge_length);
 			sge->Address.High = htole32(sge->Address.High);	
 			sge->Address.Low = htole32(sge->Address.Low);
 			bcopy(sgep, cm->cm_sge, ieee_sge_size);
 			cm->cm_sge =
 			    (MPI25_SGE_IO_UNION *)((uintptr_t)cm->cm_sge +
 			    ieee_sge_size);
 		}
 		sge->Length = saved_buf_len;
 		sge->Flags = (MPI2_IEEE_SGE_FLAGS_SIMPLE_ELEMENT |
 		    MPI2_IEEE_SGE_FLAGS_SYSTEM_ADDR |
 		    MPI25_IEEE_SGE_FLAGS_END_OF_LIST);
 		sge->Address.Low = saved_address_low;
 		sge->Address.High = saved_address_high;
 	}
 
 	cm->cm_sglsize -= ieee_sge_size;
 	/* Endian Safe code */
 	sge_length = sge->Length;
 	sge->Length = htole32(sge_length);
 	sge->Address.High = htole32(sge->Address.High);	
 	sge->Address.Low = htole32(sge->Address.Low);
 	bcopy(sgep, cm->cm_sge, ieee_sge_size);
 	cm->cm_sge = (MPI25_SGE_IO_UNION *)((uintptr_t)cm->cm_sge +
 	    ieee_sge_size);
 	return (0);
 }
 
 /*
  * Add one dma segment to the scatter-gather list for a command.
  */
 int
 mpr_add_dmaseg(struct mpr_command *cm, vm_paddr_t pa, size_t len, u_int flags,
     int segsleft)
 {
 	MPI2_SGE_SIMPLE64 sge;
 	MPI2_IEEE_SGE_SIMPLE64 ieee_sge;
 
 	if (!(cm->cm_flags & MPR_CM_FLAGS_SGE_SIMPLE)) {
 		ieee_sge.Flags = (MPI2_IEEE_SGE_FLAGS_SIMPLE_ELEMENT |
 		    MPI2_IEEE_SGE_FLAGS_SYSTEM_ADDR);
 		ieee_sge.Length = len;
 		mpr_from_u64(pa, &ieee_sge.Address);
 
 		return (mpr_push_ieee_sge(cm, &ieee_sge, segsleft));
 	} else {
 		/*
 		 * This driver always uses 64-bit address elements for
 		 * simplicity.
 		 */
 		flags |= MPI2_SGE_FLAGS_SIMPLE_ELEMENT |
 		    MPI2_SGE_FLAGS_64_BIT_ADDRESSING;
 		/* Set Endian safe macro in mpr_push_sge */
 		sge.FlagsLength = len | (flags << MPI2_SGE_FLAGS_SHIFT);
 		mpr_from_u64(pa, &sge.Address);
 
 		return (mpr_push_sge(cm, &sge, sizeof sge, segsleft));
 	}
 }
 
 static void
 mpr_data_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	struct mpr_softc *sc;
 	struct mpr_command *cm;
 	u_int i, dir, sflags;
 
 	cm = (struct mpr_command *)arg;
 	sc = cm->cm_sc;
 
 	/*
 	 * In this case, just print out a warning and let the chip tell the
 	 * user they did the wrong thing.
 	 */
 	if ((cm->cm_max_segs != 0) && (nsegs > cm->cm_max_segs)) {
 		mpr_dprint(sc, MPR_ERROR, "%s: warning: busdma returned %d "
 		    "segments, more than the %d allowed\n", __func__, nsegs,
 		    cm->cm_max_segs);
 	}
 
 	/*
 	 * Set up DMA direction flags.  Bi-directional requests are also handled
 	 * here.  In that case, both direction flags will be set.
 	 */
 	sflags = 0;
 	if (cm->cm_flags & MPR_CM_FLAGS_SMP_PASS) {
 		/*
 		 * We have to add a special case for SMP passthrough, there
 		 * is no easy way to generically handle it.  The first
 		 * S/G element is used for the command (therefore the
 		 * direction bit needs to be set).  The second one is used
 		 * for the reply.  We'll leave it to the caller to make
 		 * sure we only have two buffers.
 		 */
 		/*
 		 * Even though the busdma man page says it doesn't make
 		 * sense to have both direction flags, it does in this case.
 		 * We have one s/g element being accessed in each direction.
 		 */
 		dir = BUS_DMASYNC_PREWRITE | BUS_DMASYNC_PREREAD;
 
 		/*
 		 * Set the direction flag on the first buffer in the SMP
 		 * passthrough request.  We'll clear it for the second one.
 		 */
 		sflags |= MPI2_SGE_FLAGS_DIRECTION |
 			  MPI2_SGE_FLAGS_END_OF_BUFFER;
 	} else if (cm->cm_flags & MPR_CM_FLAGS_DATAOUT) {
 		sflags |= MPI2_SGE_FLAGS_HOST_TO_IOC;
 		dir = BUS_DMASYNC_PREWRITE;
 	} else
 		dir = BUS_DMASYNC_PREREAD;
 
 	/* Check if a native SG list is needed for an NVMe PCIe device. */
 	if (cm->cm_targ && cm->cm_targ->is_nvme &&
 	    mpr_check_pcie_native_sgl(sc, cm, segs, nsegs) == 0) {
 		/* A native SG list was built, skip to end. */
 		goto out;
 	}
 
 	for (i = 0; i < nsegs; i++) {
 		if ((cm->cm_flags & MPR_CM_FLAGS_SMP_PASS) && (i != 0)) {
 			sflags &= ~MPI2_SGE_FLAGS_DIRECTION;
 		}
 		error = mpr_add_dmaseg(cm, segs[i].ds_addr, segs[i].ds_len,
 		    sflags, nsegs - i);
 		if (error != 0) {
 			/* Resource shortage, roll back! */
 			if (ratecheck(&sc->lastfail, &mpr_chainfail_interval))
 				mpr_dprint(sc, MPR_INFO, "Out of chain frames, "
 				    "consider increasing hw.mpr.max_chains.\n");
 			cm->cm_flags |= MPR_CM_FLAGS_CHAIN_FAILED;
 			mpr_complete_command(sc, cm);
 			return;
 		}
 	}
 
 out:
 	bus_dmamap_sync(sc->buffer_dmat, cm->cm_dmamap, dir);
 	mpr_enqueue_request(sc, cm);
 
 	return;
 }
 
 static void
 mpr_data_cb2(void *arg, bus_dma_segment_t *segs, int nsegs, bus_size_t mapsize,
 	     int error)
 {
 	mpr_data_cb(arg, segs, nsegs, error);
 }
 
 /*
  * This is the routine to enqueue commands ansynchronously.
  * Note that the only error path here is from bus_dmamap_load(), which can
  * return EINPROGRESS if it is waiting for resources.  Other than this, it's
  * assumed that if you have a command in-hand, then you have enough credits
  * to use it.
  */
 int
 mpr_map_command(struct mpr_softc *sc, struct mpr_command *cm)
 {
 	int error = 0;
 
 	if (cm->cm_flags & MPR_CM_FLAGS_USE_UIO) {
 		error = bus_dmamap_load_uio(sc->buffer_dmat, cm->cm_dmamap,
 		    &cm->cm_uio, mpr_data_cb2, cm, 0);
 	} else if (cm->cm_flags & MPR_CM_FLAGS_USE_CCB) {
 		error = bus_dmamap_load_ccb(sc->buffer_dmat, cm->cm_dmamap,
 		    cm->cm_data, mpr_data_cb, cm, 0);
 	} else if ((cm->cm_data != NULL) && (cm->cm_length != 0)) {
 		error = bus_dmamap_load(sc->buffer_dmat, cm->cm_dmamap,
 		    cm->cm_data, cm->cm_length, mpr_data_cb, cm, 0);
 	} else {
 		/* Add a zero-length element as needed */
 		if (cm->cm_sge != NULL)
 			mpr_add_dmaseg(cm, 0, 0, 0, 1);
 		mpr_enqueue_request(sc, cm);
 	}
 
 	return (error);
 }
 
 /*
  * This is the routine to enqueue commands synchronously.  An error of
  * EINPROGRESS from mpr_map_command() is ignored since the command will
  * be executed and enqueued automatically.  Other errors come from msleep().
  */
 int
 mpr_wait_command(struct mpr_softc *sc, struct mpr_command **cmp, int timeout,
     int sleep_flag)
 {
 	int error, rc;
 	struct timeval cur_time, start_time;
 	struct mpr_command *cm = *cmp;
 
 	if (sc->mpr_flags & MPR_FLAGS_DIAGRESET) 
 		return  EBUSY;
 
 	cm->cm_complete = NULL;
 	cm->cm_flags |= (MPR_CM_FLAGS_WAKEUP + MPR_CM_FLAGS_POLLED);
 	error = mpr_map_command(sc, cm);
 	if ((error != 0) && (error != EINPROGRESS))
 		return (error);
 
 	// Check for context and wait for 50 mSec at a time until time has
 	// expired or the command has finished.  If msleep can't be used, need
 	// to poll.
 	if (curthread->td_no_sleeping)
 		sleep_flag = NO_SLEEP;
 	getmicrouptime(&start_time);
 	if (mtx_owned(&sc->mpr_mtx) && sleep_flag == CAN_SLEEP) {
 		error = msleep(cm, &sc->mpr_mtx, 0, "mprwait", timeout*hz);
 		if (error == EWOULDBLOCK) {
 			/*
 			 * Record the actual elapsed time in the case of a
 			 * timeout for the message below.
 			 */
 			getmicrouptime(&cur_time);
 			timevalsub(&cur_time, &start_time);
 		}
 	} else {
 		while ((cm->cm_flags & MPR_CM_FLAGS_COMPLETE) == 0) {
 			mpr_intr_locked(sc);
 			if (sleep_flag == CAN_SLEEP)
 				pause("mprwait", hz/20);
 			else
 				DELAY(50000);
 		
 			getmicrouptime(&cur_time);
 			timevalsub(&cur_time, &start_time);
 			if (cur_time.tv_sec > timeout) {
 				error = EWOULDBLOCK;
 				break;
 			}
 		}
 	}
 
 	if (error == EWOULDBLOCK) {
 		if (cm->cm_timeout_handler == NULL) {
 			mpr_dprint(sc, MPR_FAULT, "Calling Reinit from %s, timeout=%d,"
 			    " elapsed=%jd\n", __func__, timeout,
 			    (intmax_t)cur_time.tv_sec);
 			rc = mpr_reinit(sc);
 			mpr_dprint(sc, MPR_FAULT, "Reinit %s\n", (rc == 0) ? "success" :
 			    "failed");
 		} else
 			cm->cm_timeout_handler(sc, cm);
 		if (sc->mpr_flags & MPR_FLAGS_REALLOCATED) {
 			/*
 			 * Tell the caller that we freed the command in a
 			 * reinit.
 			 */
 			*cmp = NULL;
 		}
 		error = ETIMEDOUT;
 	}
 	return (error);
 }
 
 /*
  * This is the routine to enqueue a command synchonously and poll for
  * completion.  Its use should be rare.
  */
 int
 mpr_request_polled(struct mpr_softc *sc, struct mpr_command **cmp)
 {
 	int error, rc;
 	struct timeval cur_time, start_time;
 	struct mpr_command *cm = *cmp;
 
 	error = 0;
 
 	cm->cm_flags |= MPR_CM_FLAGS_POLLED;
 	cm->cm_complete = NULL;
 	mpr_map_command(sc, cm);
 
 	getmicrouptime(&start_time);
 	while ((cm->cm_flags & MPR_CM_FLAGS_COMPLETE) == 0) {
 		mpr_intr_locked(sc);
 
 		if (mtx_owned(&sc->mpr_mtx))
 			msleep(&sc->msleep_fake_chan, &sc->mpr_mtx, 0,
 			    "mprpoll", hz/20);
 		else
 			pause("mprpoll", hz/20);
 
 		/*
 		 * Check for real-time timeout and fail if more than 60 seconds.
 		 */
 		getmicrouptime(&cur_time);
 		timevalsub(&cur_time, &start_time);
 		if (cur_time.tv_sec > 60) {
 			mpr_dprint(sc, MPR_FAULT, "polling failed\n");
 			error = ETIMEDOUT;
 			break;
 		}
 	}
 	cm->cm_state = MPR_CM_STATE_BUSY;
 	if (error) {
 		mpr_dprint(sc, MPR_FAULT, "Calling Reinit from %s\n", __func__);
 		rc = mpr_reinit(sc);
 		mpr_dprint(sc, MPR_FAULT, "Reinit %s\n", (rc == 0) ? "success" :
 		    "failed");
 
 		if (sc->mpr_flags & MPR_FLAGS_REALLOCATED) {
 			/*
 			 * Tell the caller that we freed the command in a
 			 * reinit.
 			 */
 			*cmp = NULL;
 		}
 	}
 	return (error);
 }
 
 /*
  * The MPT driver had a verbose interface for config pages.  In this driver,
  * reduce it to much simpler terms, similar to the Linux driver.
  */
 int
 mpr_read_config_page(struct mpr_softc *sc, struct mpr_config_params *params)
 {
 	MPI2_CONFIG_REQUEST *req;
 	struct mpr_command *cm;
 	int error;
 
 	if (sc->mpr_flags & MPR_FLAGS_BUSY) {
 		return (EBUSY);
 	}
 
 	cm = mpr_alloc_command(sc);
 	if (cm == NULL) {
 		return (EBUSY);
 	}
 
 	req = (MPI2_CONFIG_REQUEST *)cm->cm_req;
 	req->Function = MPI2_FUNCTION_CONFIG;
 	req->Action = params->action;
 	req->SGLFlags = 0;
 	req->ChainOffset = 0;
 	req->PageAddress = params->page_address;
 	if (params->hdr.Struct.PageType == MPI2_CONFIG_PAGETYPE_EXTENDED) {
 		MPI2_CONFIG_EXTENDED_PAGE_HEADER *hdr;
 
 		hdr = &params->hdr.Ext;
 		req->ExtPageType = hdr->ExtPageType;
 		req->ExtPageLength = hdr->ExtPageLength;
 		req->Header.PageType = MPI2_CONFIG_PAGETYPE_EXTENDED;
 		req->Header.PageLength = 0; /* Must be set to zero */
 		req->Header.PageNumber = hdr->PageNumber;
 		req->Header.PageVersion = hdr->PageVersion;
 	} else {
 		MPI2_CONFIG_PAGE_HEADER *hdr;
 
 		hdr = &params->hdr.Struct;
 		req->Header.PageType = hdr->PageType;
 		req->Header.PageNumber = hdr->PageNumber;
 		req->Header.PageLength = hdr->PageLength;
 		req->Header.PageVersion = hdr->PageVersion;
 	}
 
 	cm->cm_data = params->buffer;
 	cm->cm_length = params->length;
 	if (cm->cm_data != NULL) {
 		cm->cm_sge = &req->PageBufferSGE;
 		cm->cm_sglsize = sizeof(MPI2_SGE_IO_UNION);
 		cm->cm_flags = MPR_CM_FLAGS_SGE_SIMPLE | MPR_CM_FLAGS_DATAIN;
 	} else
 		cm->cm_sge = NULL;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 
 	cm->cm_complete_data = params;
 	if (params->callback != NULL) {
 		cm->cm_complete = mpr_config_complete;
 		return (mpr_map_command(sc, cm));
 	} else {
 		error = mpr_wait_command(sc, &cm, 0, CAN_SLEEP);
 		if (error) {
 			mpr_dprint(sc, MPR_FAULT,
 			    "Error %d reading config page\n", error);
 			if (cm != NULL)
 				mpr_free_command(sc, cm);
 			return (error);
 		}
 		mpr_config_complete(sc, cm);
 	}
 
 	return (0);
 }
 
 int
 mpr_write_config_page(struct mpr_softc *sc, struct mpr_config_params *params)
 {
 	return (EINVAL);
 }
 
 static void
 mpr_config_complete(struct mpr_softc *sc, struct mpr_command *cm)
 {
 	MPI2_CONFIG_REPLY *reply;
 	struct mpr_config_params *params;
 
 	MPR_FUNCTRACE(sc);
 	params = cm->cm_complete_data;
 
 	if (cm->cm_data != NULL) {
 		bus_dmamap_sync(sc->buffer_dmat, cm->cm_dmamap,
 		    BUS_DMASYNC_POSTREAD);
 		bus_dmamap_unload(sc->buffer_dmat, cm->cm_dmamap);
 	}
 
 	/*
 	 * XXX KDM need to do more error recovery?  This results in the
 	 * device in question not getting probed.
 	 */
 	if ((cm->cm_flags & MPR_CM_FLAGS_ERROR_MASK) != 0) {
 		params->status = MPI2_IOCSTATUS_BUSY;
 		goto done;
 	}
 
 	reply = (MPI2_CONFIG_REPLY *)cm->cm_reply;
 	if (reply == NULL) {
 		params->status = MPI2_IOCSTATUS_BUSY;
 		goto done;
 	}
 	params->status = reply->IOCStatus;
 	if (params->hdr.Struct.PageType == MPI2_CONFIG_PAGETYPE_EXTENDED) {
 		params->hdr.Ext.ExtPageType = reply->ExtPageType;
 		params->hdr.Ext.ExtPageLength = reply->ExtPageLength;
 		params->hdr.Ext.PageType = reply->Header.PageType;
 		params->hdr.Ext.PageNumber = reply->Header.PageNumber;
 		params->hdr.Ext.PageVersion = reply->Header.PageVersion;
 	} else {
 		params->hdr.Struct.PageType = reply->Header.PageType;
 		params->hdr.Struct.PageNumber = reply->Header.PageNumber;
 		params->hdr.Struct.PageLength = reply->Header.PageLength;
 		params->hdr.Struct.PageVersion = reply->Header.PageVersion;
 	}
 
 done:
 	mpr_free_command(sc, cm);
 	if (params->callback != NULL)
 		params->callback(sc, params);
 
 	return;
 }
Index: head/sys/dev/mpr/mpr_pci.c
===================================================================
--- head/sys/dev/mpr/mpr_pci.c	(revision 365705)
+++ head/sys/dev/mpr/mpr_pci.c	(revision 365706)
@@ -1,489 +1,489 @@
 /*-
  * Copyright (c) 2009 Yahoo! Inc.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 /* PCI/PCI-X/PCIe bus interface for the Avago Tech (LSI) MPT3 controllers */
 
 /* TODO Move headers to mprvar */
 #include <sys/types.h>
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/module.h>
 #include <sys/bus.h>
 #include <sys/conf.h>
 #include <sys/malloc.h>
 #include <sys/sysctl.h>
 #include <sys/uio.h>
 
 #include <machine/bus.h>
 #include <machine/resource.h>
 #include <sys/rman.h>
 
 #include <dev/pci/pcireg.h>
 #include <dev/pci/pcivar.h>
 #include <dev/pci/pci_private.h>
 
 #include <dev/mpr/mpi/mpi2_type.h>
 #include <dev/mpr/mpi/mpi2.h>
 #include <dev/mpr/mpi/mpi2_ioc.h>
 #include <dev/mpr/mpi/mpi2_cnfg.h>
 #include <dev/mpr/mpi/mpi2_tool.h>
 #include <dev/mpr/mpi/mpi2_pci.h>
 
 #include <sys/queue.h>
 #include <sys/kthread.h>
 #include <dev/mpr/mpr_ioctl.h>
 #include <dev/mpr/mprvar.h>
 
 static int	mpr_pci_probe(device_t);
 static int	mpr_pci_attach(device_t);
 static int	mpr_pci_detach(device_t);
 static int	mpr_pci_suspend(device_t);
 static int	mpr_pci_resume(device_t);
 static void	mpr_pci_free(struct mpr_softc *);
 static int	mpr_alloc_msix(struct mpr_softc *sc, int msgs);
 static int	mpr_alloc_msi(struct mpr_softc *sc, int msgs);
 static int	mpr_pci_alloc_interrupts(struct mpr_softc *sc);
 
 static device_method_t mpr_methods[] = {
 	DEVMETHOD(device_probe,		mpr_pci_probe),
 	DEVMETHOD(device_attach,	mpr_pci_attach),
 	DEVMETHOD(device_detach,	mpr_pci_detach),
 	DEVMETHOD(device_suspend,	mpr_pci_suspend),
 	DEVMETHOD(device_resume,	mpr_pci_resume),
 	DEVMETHOD(bus_print_child,	bus_generic_print_child),
 	DEVMETHOD(bus_driver_added,	bus_generic_driver_added),
 	{ 0, 0 }
 };
 
 static driver_t mpr_pci_driver = {
 	"mpr",
 	mpr_methods,
 	sizeof(struct mpr_softc)
 };
 
 struct mpr_ident {
 	uint16_t	vendor;
 	uint16_t	device;
 	uint16_t	subvendor;
 	uint16_t	subdevice;
 	u_int		flags;
 	const char	*desc;
 } mpr_identifiers[] = {
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI25_MFGPAGE_DEVID_SAS3004,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3004" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI25_MFGPAGE_DEVID_SAS3008,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3008" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI25_MFGPAGE_DEVID_SAS3108_1,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3108_1" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI25_MFGPAGE_DEVID_SAS3108_2,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3108_2" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI25_MFGPAGE_DEVID_SAS3108_5,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3108_5" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI25_MFGPAGE_DEVID_SAS3108_6,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3108_6" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3216,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3216" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3224,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3224" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3316_1,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3316_1" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3316_2,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3316_2" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3324_1,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3324_1" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3324_2,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS3324_2" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3408,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3408" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3416,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3416" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3508,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3508" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3508_1,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3508_1" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3516,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3516" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3516_1,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3516_1" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3616,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3616" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3708,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3708" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_SAS3716,
 	    0xffff, 0xffff, MPR_FLAGS_GEN35_IOC,
 	    "Avago Technologies (LSI) SAS3716" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_INVALID0_SAS3816,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) INVALID0 SAS3816" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_CFG_SEC_SAS3816,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) CFG SEC SAS3816" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_HARD_SEC_SAS3816,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) HARD SEC SAS3816" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_INVALID1_SAS3816,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) INVALID1 SAS3816" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_INVALID0_SAS3916,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) INVALID0 SAS3916" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_CFG_SEC_SAS3916,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) CFG SEC SAS3916" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_HARD_SEC_SAS3916,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) HARD SEC SAS3916" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI26_MFGPAGE_DEVID_INVALID1_SAS3916,
 	    0xffff, 0xffff, (MPR_FLAGS_GEN35_IOC | MPR_FLAGS_SEA_IOC),
 	    "Broadcom Inc. (LSI) INVALID1 SAS3916" },
 	{ 0, 0, 0, 0, 0, NULL }
 };
 
 static devclass_t	mpr_devclass;
 DRIVER_MODULE(mpr, pci, mpr_pci_driver, mpr_devclass, 0, 0);
 MODULE_PNP_INFO("U16:vendor;U16:device;U16:subvendor;U16:subdevice;D:#", pci,
     mpr, mpr_identifiers, nitems(mpr_identifiers) - 1);
 
 MODULE_DEPEND(mpr, cam, 1, 1, 1);
 
 static struct mpr_ident *
 mpr_find_ident(device_t dev)
 {
 	struct mpr_ident *m;
 
 	for (m = mpr_identifiers; m->vendor != 0; m++) {
 		if (m->vendor != pci_get_vendor(dev))
 			continue;
 		if (m->device != pci_get_device(dev))
 			continue;
 		if ((m->subvendor != 0xffff) &&
 		    (m->subvendor != pci_get_subvendor(dev)))
 			continue;
 		if ((m->subdevice != 0xffff) &&
 		    (m->subdevice != pci_get_subdevice(dev)))
 			continue;
 		return (m);
 	}
 
 	return (NULL);
 }
 
 static int
 mpr_pci_probe(device_t dev)
 {
 	struct mpr_ident *id;
 
 	if ((id = mpr_find_ident(dev)) != NULL) {
 		device_set_desc(dev, id->desc);
 		return (BUS_PROBE_DEFAULT);
 	}
 	return (ENXIO);
 }
 
 static int
 mpr_pci_attach(device_t dev)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	struct mpr_softc *sc;
 	struct mpr_ident *m;
 	int error, i;
 
 	sc = device_get_softc(dev);
 	bzero(sc, sizeof(*sc));
 	sc->mpr_dev = dev;
 	m = mpr_find_ident(dev);
 	sc->mpr_flags = m->flags;
 
 	switch (m->device) {
 	case MPI26_MFGPAGE_DEVID_INVALID0_SAS3816:
 	case MPI26_MFGPAGE_DEVID_INVALID1_SAS3816:
 	case MPI26_MFGPAGE_DEVID_INVALID0_SAS3916:
 	case MPI26_MFGPAGE_DEVID_INVALID1_SAS3916:
 		mpr_printf(sc, "HBA is in Non Secure mode\n");
 		return (ENXIO);
 	case MPI26_MFGPAGE_DEVID_CFG_SEC_SAS3816:
 	case MPI26_MFGPAGE_DEVID_CFG_SEC_SAS3916:
 		mpr_printf(sc, "HBA is in Configurable Secure mode\n");
 		break;
 	default:
 		break;
 	}
 
 	mpr_get_tunables(sc);
 
 	/* Twiddle basic PCI config bits for a sanity check */
 	pci_enable_busmaster(dev);
 
 	for (i = 0; i < PCI_MAXMAPS_0; i++) {
 		sc->mpr_regs_rid = PCIR_BAR(i);
 
 		if ((sc->mpr_regs_resource = bus_alloc_resource_any(dev,
 		    SYS_RES_MEMORY, &sc->mpr_regs_rid, RF_ACTIVE)) != NULL)
 			break;
 	}
 
 	if (sc->mpr_regs_resource == NULL) {
 		mpr_printf(sc, "Cannot allocate PCI registers\n");
 		return (ENXIO);
 	}
 
 	sc->mpr_btag = rman_get_bustag(sc->mpr_regs_resource);
 	sc->mpr_bhandle = rman_get_bushandle(sc->mpr_regs_resource);
 
 	/* Allocate the parent DMA tag */
 	bus_dma_template_init(&t, bus_get_dma_tag(dev));
 	if (bus_dma_template_tag(&t, &sc->mpr_parent_dmat)) {
 		mpr_printf(sc, "Cannot allocate parent DMA tag\n");
 		mpr_pci_free(sc);
 		return (ENOMEM);
 	}
 
 	if (((error = mpr_pci_alloc_interrupts(sc)) != 0) ||
 	    ((error = mpr_attach(sc)) != 0))
 		mpr_pci_free(sc);
 
 	return (error);
 }
 
 /*
  * Allocate, but don't assign interrupts early.  Doing it before requesting
  * the IOCFacts message informs the firmware that we want to do MSI-X
  * multiqueue.  We might not use all of the available messages, but there's
  * no reason to re-alloc if we don't.
  */
 int
 mpr_pci_alloc_interrupts(struct mpr_softc *sc)
 {
 	device_t dev;
 	int error, msgs;
 
 	dev = sc->mpr_dev;
 	error = 0;
 	msgs = 0;
 
 	if (sc->disable_msix == 0) {
 		msgs = pci_msix_count(dev);
 		mpr_dprint(sc, MPR_INIT, "Counted %d MSI-X messages\n", msgs);
 		msgs = min(msgs, sc->max_msix);
 		msgs = min(msgs, MPR_MSIX_MAX);
 		msgs = min(msgs, 1);	/* XXX */
 		if (msgs != 0) {
 			mpr_dprint(sc, MPR_INIT, "Attempting to allocate %d "
 			    "MSI-X messages\n", msgs);
 			error = mpr_alloc_msix(sc, msgs);
 		}
 	}
 	if (((error != 0) || (msgs == 0)) && (sc->disable_msi == 0)) {
 		msgs = pci_msi_count(dev);
 		mpr_dprint(sc, MPR_INIT, "Counted %d MSI messages\n", msgs);
 		msgs = min(msgs, MPR_MSI_MAX);
 		if (msgs != 0) {
 			mpr_dprint(sc, MPR_INIT, "Attempting to allocated %d "
 			    "MSI messages\n", MPR_MSI_MAX);
 			error = mpr_alloc_msi(sc, MPR_MSI_MAX);
 		}
 	}
 	if ((error != 0) || (msgs == 0)) {
 		/*
 		 * If neither MSI or MSI-X are available, assume legacy INTx.
 		 * This also implies that there will be only 1 queue.
 		 */
 		mpr_dprint(sc, MPR_INIT, "Falling back to legacy INTx\n");
 		sc->mpr_flags |= MPR_FLAGS_INTX;
 		msgs = 1;
 	} else
 		sc->mpr_flags |= MPR_FLAGS_MSI;
 
 	sc->msi_msgs = msgs;
 	mpr_dprint(sc, MPR_INIT, "Allocated %d interrupts\n", msgs);
 
 	return (error);
 }
 
 int
 mpr_pci_setup_interrupts(struct mpr_softc *sc)
 {
 	device_t dev;
 	struct mpr_queue *q;
 	void *ihandler;
 	int i, error, rid, initial_rid;
 
 	dev = sc->mpr_dev;
 	error = ENXIO;
 
 	if (sc->mpr_flags & MPR_FLAGS_INTX) {
 		initial_rid = 0;
 		ihandler = mpr_intr;
 	} else if (sc->mpr_flags & MPR_FLAGS_MSI) {
 		initial_rid = 1;
 		ihandler = mpr_intr_msi;
 	} else {
 		mpr_dprint(sc, MPR_ERROR|MPR_INIT,
 		    "Unable to set up interrupts\n");
 		return (EINVAL);
 	}
 
 	for (i = 0; i < sc->msi_msgs; i++) {
 		q = &sc->queues[i];
 		rid = i + initial_rid;
 		q->irq_rid = rid;
 		q->irq = bus_alloc_resource_any(dev, SYS_RES_IRQ,
 		    &q->irq_rid, RF_ACTIVE);
 		if (q->irq == NULL) {
 			mpr_dprint(sc, MPR_ERROR|MPR_INIT,
 			    "Cannot allocate interrupt RID %d\n", rid);
 			sc->msi_msgs = i;
 			break;
 		}
 		error = bus_setup_intr(dev, q->irq,
 		    INTR_TYPE_BIO | INTR_MPSAFE, NULL, ihandler,
 		    sc, &q->intrhand);
 		if (error) {
 			mpr_dprint(sc, MPR_ERROR|MPR_INIT,
 			    "Cannot setup interrupt RID %d\n", rid);
 			sc->msi_msgs = i;
 			break;
 		}
 	}
 
         mpr_dprint(sc, MPR_INIT, "Set up %d interrupts\n", sc->msi_msgs);
 	return (error);
 }
 
 static int
 mpr_pci_detach(device_t dev)
 {
 	struct mpr_softc *sc;
 	int error;
 
 	sc = device_get_softc(dev);
 
 	if ((error = mpr_free(sc)) != 0)
 		return (error);
 
 	mpr_pci_free(sc);
 	return (0);
 }
 
 void
 mpr_pci_free_interrupts(struct mpr_softc *sc)
 {
 	struct mpr_queue *q;
 	int i;
 
 	if (sc->queues == NULL)
 		return;
 
 	for (i = 0; i < sc->msi_msgs; i++) {
 		q = &sc->queues[i];
 		if (q->irq != NULL) {
 			bus_teardown_intr(sc->mpr_dev, q->irq,
 			    q->intrhand);
 			bus_release_resource(sc->mpr_dev, SYS_RES_IRQ,
 			    q->irq_rid, q->irq);
 		}
 	}
 }
 
 static void
 mpr_pci_free(struct mpr_softc *sc)
 {
 
 	if (sc->mpr_parent_dmat != NULL) {
 		bus_dma_tag_destroy(sc->mpr_parent_dmat);
 	}
 
 	mpr_pci_free_interrupts(sc);
 
 	if (sc->mpr_flags & MPR_FLAGS_MSI)
 		pci_release_msi(sc->mpr_dev);
 
 	if (sc->mpr_regs_resource != NULL) {
 		bus_release_resource(sc->mpr_dev, SYS_RES_MEMORY,
 		    sc->mpr_regs_rid, sc->mpr_regs_resource);
 	}
 
 	return;
 }
 
 static int
 mpr_pci_suspend(device_t dev)
 {
 	return (EINVAL);
 }
 
 static int
 mpr_pci_resume(device_t dev)
 {
 	return (EINVAL);
 }
 
 static int
 mpr_alloc_msix(struct mpr_softc *sc, int msgs)
 {
 	int error;
 
 	error = pci_alloc_msix(sc->mpr_dev, &msgs);
 	return (error);
 }
 
 static int
 mpr_alloc_msi(struct mpr_softc *sc, int msgs)
 {
 	int error;
 
 	error = pci_alloc_msi(sc->mpr_dev, &msgs);
 	return (error);
 }
 
 int
 mpr_pci_restore(struct mpr_softc *sc)
 {
 	struct pci_devinfo *dinfo;
 
 	mpr_dprint(sc, MPR_TRACE, "%s\n", __func__);
 
 	dinfo = device_get_ivars(sc->mpr_dev);
 	if (dinfo == NULL) {
 		mpr_dprint(sc, MPR_FAULT, "%s: NULL dinfo\n", __func__);
 		return (EINVAL);
 	}
 
 	pci_cfg_restore(sc->mpr_dev, dinfo);
 	return (0);
 }
Index: head/sys/dev/mpr/mpr_user.c
===================================================================
--- head/sys/dev/mpr/mpr_user.c	(revision 365705)
+++ head/sys/dev/mpr/mpr_user.c	(revision 365706)
@@ -1,2605 +1,2605 @@
 /*-
  * Copyright (c) 2008 Yahoo!, Inc.
  * All rights reserved.
  * Written by: John Baldwin <jhb@FreeBSD.org>
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the author nor the names of any co-contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * Broadcom Inc. (LSI) MPT-Fusion Host Adapter FreeBSD userland interface
  */
 /*-
  * Copyright (c) 2011-2015 LSI Corp.
  * Copyright (c) 2013-2016 Avago Technologies
  * Copyright 2000-2020 Broadcom Inc.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * Broadcom Inc. (LSI) MPT-Fusion Host Adapter FreeBSD
  *
  * $FreeBSD$
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 /* TODO Move headers to mprvar */
 #include <sys/types.h>
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/selinfo.h>
 #include <sys/module.h>
 #include <sys/bus.h>
 #include <sys/conf.h>
 #include <sys/bio.h>
 #include <sys/abi_compat.h>
 #include <sys/malloc.h>
 #include <sys/uio.h>
 #include <sys/sysctl.h>
 #include <sys/ioccom.h>
 #include <sys/endian.h>
 #include <sys/queue.h>
 #include <sys/kthread.h>
 #include <sys/taskqueue.h>
 #include <sys/proc.h>
 #include <sys/sysent.h>
 
 #include <machine/bus.h>
 #include <machine/resource.h>
 #include <sys/rman.h>
 
 #include <cam/cam.h>
 #include <cam/cam_ccb.h>
 
 #include <dev/mpr/mpi/mpi2_type.h>
 #include <dev/mpr/mpi/mpi2.h>
 #include <dev/mpr/mpi/mpi2_ioc.h>
 #include <dev/mpr/mpi/mpi2_cnfg.h>
 #include <dev/mpr/mpi/mpi2_init.h>
 #include <dev/mpr/mpi/mpi2_tool.h>
 #include <dev/mpr/mpi/mpi2_pci.h>
 #include <dev/mpr/mpr_ioctl.h>
 #include <dev/mpr/mprvar.h>
 #include <dev/mpr/mpr_table.h>
 #include <dev/mpr/mpr_sas.h>
 #include <dev/pci/pcivar.h>
 #include <dev/pci/pcireg.h>
 
 static d_open_t		mpr_open;
 static d_close_t	mpr_close;
 static d_ioctl_t	mpr_ioctl_devsw;
 
 static struct cdevsw mpr_cdevsw = {
 	.d_version =	D_VERSION,
 	.d_flags =	0,
 	.d_open =	mpr_open,
 	.d_close =	mpr_close,
 	.d_ioctl =	mpr_ioctl_devsw,
 	.d_name =	"mpr",
 };
 
 typedef int (mpr_user_f)(struct mpr_command *, struct mpr_usr_command *);
 static mpr_user_f	mpi_pre_ioc_facts;
 static mpr_user_f	mpi_pre_port_facts;
 static mpr_user_f	mpi_pre_fw_download;
 static mpr_user_f	mpi_pre_fw_upload;
 static mpr_user_f	mpi_pre_sata_passthrough;
 static mpr_user_f	mpi_pre_smp_passthrough;
 static mpr_user_f	mpi_pre_config;
 static mpr_user_f	mpi_pre_sas_io_unit_control;
 
 static int mpr_user_read_cfg_header(struct mpr_softc *,
     struct mpr_cfg_page_req *);
 static int mpr_user_read_cfg_page(struct mpr_softc *,
     struct mpr_cfg_page_req *, void *);
 static int mpr_user_read_extcfg_header(struct mpr_softc *,
     struct mpr_ext_cfg_page_req *);
 static int mpr_user_read_extcfg_page(struct mpr_softc *,
     struct mpr_ext_cfg_page_req *, void *);
 static int mpr_user_write_cfg_page(struct mpr_softc *,
     struct mpr_cfg_page_req *, void *);
 static int mpr_user_setup_request(struct mpr_command *,
     struct mpr_usr_command *);
 static int mpr_user_command(struct mpr_softc *, struct mpr_usr_command *);
 
 static int mpr_user_pass_thru(struct mpr_softc *sc, mpr_pass_thru_t *data);
 static void mpr_user_get_adapter_data(struct mpr_softc *sc,
     mpr_adapter_data_t *data);
 static void mpr_user_read_pci_info(struct mpr_softc *sc, mpr_pci_info_t *data);
 static uint8_t mpr_get_fw_diag_buffer_number(struct mpr_softc *sc,
     uint32_t unique_id);
 static int mpr_post_fw_diag_buffer(struct mpr_softc *sc,
     mpr_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code);
 static int mpr_release_fw_diag_buffer(struct mpr_softc *sc,
     mpr_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code,
     uint32_t diag_type);
 static int mpr_diag_register(struct mpr_softc *sc,
     mpr_fw_diag_register_t *diag_register, uint32_t *return_code);
 static int mpr_diag_unregister(struct mpr_softc *sc,
     mpr_fw_diag_unregister_t *diag_unregister, uint32_t *return_code);
 static int mpr_diag_query(struct mpr_softc *sc, mpr_fw_diag_query_t *diag_query,
     uint32_t *return_code);
 static int mpr_diag_read_buffer(struct mpr_softc *sc,
     mpr_diag_read_buffer_t *diag_read_buffer, uint8_t *ioctl_buf,
     uint32_t *return_code);
 static int mpr_diag_release(struct mpr_softc *sc,
     mpr_fw_diag_release_t *diag_release, uint32_t *return_code);
 static int mpr_do_diag_action(struct mpr_softc *sc, uint32_t action,
     uint8_t *diag_action, uint32_t length, uint32_t *return_code);
 static int mpr_user_diag_action(struct mpr_softc *sc, mpr_diag_action_t *data);
 static void mpr_user_event_query(struct mpr_softc *sc, mpr_event_query_t *data);
 static void mpr_user_event_enable(struct mpr_softc *sc,
     mpr_event_enable_t *data);
 static int mpr_user_event_report(struct mpr_softc *sc,
     mpr_event_report_t *data);
 static int mpr_user_reg_access(struct mpr_softc *sc, mpr_reg_access_t *data);
 static int mpr_user_btdh(struct mpr_softc *sc, mpr_btdh_mapping_t *data);
 
 static MALLOC_DEFINE(M_MPRUSER, "mpr_user", "Buffers for mpr(4) ioctls");
 
 /*
  * MPI functions that support IEEE SGLs for SAS3.
  */
 static uint8_t ieee_sgl_func_list[] = {
 	MPI2_FUNCTION_SCSI_IO_REQUEST,
 	MPI2_FUNCTION_RAID_SCSI_IO_PASSTHROUGH,
 	MPI2_FUNCTION_SMP_PASSTHROUGH,
 	MPI2_FUNCTION_SATA_PASSTHROUGH,
 	MPI2_FUNCTION_FW_UPLOAD,
 	MPI2_FUNCTION_FW_DOWNLOAD,
 	MPI2_FUNCTION_TARGET_ASSIST,
 	MPI2_FUNCTION_TARGET_STATUS_SEND,
 	MPI2_FUNCTION_TOOLBOX
 };
 
 int
 mpr_attach_user(struct mpr_softc *sc)
 {
 	int unit;
 
 	unit = device_get_unit(sc->mpr_dev);
 	sc->mpr_cdev = make_dev(&mpr_cdevsw, unit, UID_ROOT, GID_OPERATOR, 0640,
 	    "mpr%d", unit);
 
 	if (sc->mpr_cdev == NULL)
 		return (ENOMEM);
 
 	sc->mpr_cdev->si_drv1 = sc;
 	return (0);
 }
 
 void
 mpr_detach_user(struct mpr_softc *sc)
 {
 
 	/* XXX: do a purge of pending requests? */
 	if (sc->mpr_cdev != NULL)
 		destroy_dev(sc->mpr_cdev);
 }
 
 static int
 mpr_open(struct cdev *dev, int flags, int fmt, struct thread *td)
 {
 
 	return (0);
 }
 
 static int
 mpr_close(struct cdev *dev, int flags, int fmt, struct thread *td)
 {
 
 	return (0);
 }
 
 static int
 mpr_user_read_cfg_header(struct mpr_softc *sc,
     struct mpr_cfg_page_req *page_req)
 {
 	MPI2_CONFIG_PAGE_HEADER *hdr;
 	struct mpr_config_params params;
 	int	    error;
 
 	hdr = &params.hdr.Struct;
 	params.action = MPI2_CONFIG_ACTION_PAGE_HEADER;
 	params.page_address = le32toh(page_req->page_address);
 	hdr->PageVersion = 0;
 	hdr->PageLength = 0;
 	hdr->PageNumber = page_req->header.PageNumber;
 	hdr->PageType = page_req->header.PageType;
 	params.buffer = NULL;
 	params.length = 0;
 	params.callback = NULL;
 
 	if ((error = mpr_read_config_page(sc, &params)) != 0) {
 		/*
 		 * Leave the request. Without resetting the chip, it's
 		 * still owned by it and we'll just get into trouble
 		 * freeing it now. Mark it as abandoned so that if it
 		 * shows up later it can be freed.
 		 */
 		mpr_printf(sc, "read_cfg_header timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	page_req->ioc_status = htole16(params.status);
 	if ((page_req->ioc_status & MPI2_IOCSTATUS_MASK) ==
 	    MPI2_IOCSTATUS_SUCCESS) {
 		bcopy(hdr, &page_req->header, sizeof(page_req->header));
 	}
 
 	return (0);
 }
 
 static int
 mpr_user_read_cfg_page(struct mpr_softc *sc, struct mpr_cfg_page_req *page_req,
     void *buf)
 {
 	MPI2_CONFIG_PAGE_HEADER *reqhdr, *hdr;
 	struct mpr_config_params params;
 	int	      error;
 
 	reqhdr = buf;
 	hdr = &params.hdr.Struct;
 	hdr->PageVersion = reqhdr->PageVersion;
 	hdr->PageLength = reqhdr->PageLength;
 	hdr->PageNumber = reqhdr->PageNumber;
 	hdr->PageType = reqhdr->PageType & MPI2_CONFIG_PAGETYPE_MASK;
 	params.action = MPI2_CONFIG_ACTION_PAGE_READ_CURRENT;
 	params.page_address = le32toh(page_req->page_address);
 	params.buffer = buf;
 	params.length = le32toh(page_req->len);
 	params.callback = NULL;
 
 	if ((error = mpr_read_config_page(sc, &params)) != 0) {
 		mpr_printf(sc, "mpr_user_read_cfg_page timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	page_req->ioc_status = htole16(params.status);
 	return (0);
 }
 
 static int
 mpr_user_read_extcfg_header(struct mpr_softc *sc,
     struct mpr_ext_cfg_page_req *ext_page_req)
 {
 	MPI2_CONFIG_EXTENDED_PAGE_HEADER *hdr;
 	struct mpr_config_params params;
 	int	    error;
 
 	hdr = &params.hdr.Ext;
 	params.action = MPI2_CONFIG_ACTION_PAGE_HEADER;
 	hdr->PageVersion = ext_page_req->header.PageVersion;
 	hdr->PageType = MPI2_CONFIG_PAGETYPE_EXTENDED;
 	hdr->ExtPageLength = 0;
 	hdr->PageNumber = ext_page_req->header.PageNumber;
 	hdr->ExtPageType = ext_page_req->header.ExtPageType;
 	params.page_address = le32toh(ext_page_req->page_address);
 	params.buffer = NULL;
 	params.length = 0;
 	params.callback = NULL;
 
 	if ((error = mpr_read_config_page(sc, &params)) != 0) {
 		/*
 		 * Leave the request. Without resetting the chip, it's
 		 * still owned by it and we'll just get into trouble
 		 * freeing it now. Mark it as abandoned so that if it
 		 * shows up later it can be freed.
 		 */
 		mpr_printf(sc, "mpr_user_read_extcfg_header timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	ext_page_req->ioc_status = htole16(params.status);
 	if ((ext_page_req->ioc_status & MPI2_IOCSTATUS_MASK) ==
 	    MPI2_IOCSTATUS_SUCCESS) {
 		ext_page_req->header.PageVersion = hdr->PageVersion;
 		ext_page_req->header.PageNumber = hdr->PageNumber;
 		ext_page_req->header.PageType = hdr->PageType;
 		ext_page_req->header.ExtPageLength = hdr->ExtPageLength;
 		ext_page_req->header.ExtPageType = hdr->ExtPageType;
 	}
 
 	return (0);
 }
 
 static int
 mpr_user_read_extcfg_page(struct mpr_softc *sc,
     struct mpr_ext_cfg_page_req *ext_page_req, void *buf)
 {
 	MPI2_CONFIG_EXTENDED_PAGE_HEADER *reqhdr, *hdr;
 	struct mpr_config_params params;
 	int error;
 
 	reqhdr = buf;
 	hdr = &params.hdr.Ext;
 	params.action = MPI2_CONFIG_ACTION_PAGE_READ_CURRENT;
 	params.page_address = le32toh(ext_page_req->page_address);
 	hdr->PageVersion = reqhdr->PageVersion;
 	hdr->PageType = MPI2_CONFIG_PAGETYPE_EXTENDED;
 	hdr->PageNumber = reqhdr->PageNumber;
 	hdr->ExtPageType = reqhdr->ExtPageType;
 	hdr->ExtPageLength = reqhdr->ExtPageLength;
 	params.buffer = buf;
 	params.length = le32toh(ext_page_req->len);
 	params.callback = NULL;
 
 	if ((error = mpr_read_config_page(sc, &params)) != 0) {
 		mpr_printf(sc, "mpr_user_read_extcfg_page timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	ext_page_req->ioc_status = htole16(params.status);
 	return (0);
 }
 
 static int
 mpr_user_write_cfg_page(struct mpr_softc *sc,
     struct mpr_cfg_page_req *page_req, void *buf)
 {
 	MPI2_CONFIG_PAGE_HEADER *reqhdr, *hdr;
 	struct mpr_config_params params;
 	u_int	      hdr_attr;
 	int	      error;
 
 	reqhdr = buf;
 	hdr = &params.hdr.Struct;
 	hdr_attr = reqhdr->PageType & MPI2_CONFIG_PAGEATTR_MASK;
 	if (hdr_attr != MPI2_CONFIG_PAGEATTR_CHANGEABLE &&
 	    hdr_attr != MPI2_CONFIG_PAGEATTR_PERSISTENT) {
 		mpr_printf(sc, "page type 0x%x not changeable\n",
 			reqhdr->PageType & MPI2_CONFIG_PAGETYPE_MASK);
 		return (EINVAL);
 	}
 
 	/*
 	 * There isn't any point in restoring stripped out attributes
 	 * if you then mask them going down to issue the request.
 	 */
 
 	hdr->PageVersion = reqhdr->PageVersion;
 	hdr->PageLength = reqhdr->PageLength;
 	hdr->PageNumber = reqhdr->PageNumber;
 	hdr->PageType = reqhdr->PageType;
 	params.action = MPI2_CONFIG_ACTION_PAGE_WRITE_CURRENT;
 	params.page_address = le32toh(page_req->page_address);
 	params.buffer = buf;
 	params.length = le32toh(page_req->len);
 	params.callback = NULL;
 
 	if ((error = mpr_write_config_page(sc, &params)) != 0) {
 		mpr_printf(sc, "mpr_write_cfg_page timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	page_req->ioc_status = htole16(params.status);
 	return (0);
 }
 
 void
 mpr_init_sge(struct mpr_command *cm, void *req, void *sge)
 {
 	int off, space;
 
 	space = (int)cm->cm_sc->reqframesz;
 	off = (uintptr_t)sge - (uintptr_t)req;
 
 	KASSERT(off < space, ("bad pointers %p %p, off %d, space %d",
             req, sge, off, space));
 
 	cm->cm_sge = sge;
 	cm->cm_sglsize = space - off;
 }
 
 /*
  * Prepare the mpr_command for an IOC_FACTS request.
  */
 static int
 mpi_pre_ioc_facts(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI2_IOC_FACTS_REQUEST *req = (void *)cm->cm_req;
 	MPI2_IOC_FACTS_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	cm->cm_sge = NULL;
 	cm->cm_sglsize = 0;
 	return (0);
 }
 
 /*
  * Prepare the mpr_command for a PORT_FACTS request.
  */
 static int
 mpi_pre_port_facts(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI2_PORT_FACTS_REQUEST *req = (void *)cm->cm_req;
 	MPI2_PORT_FACTS_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	cm->cm_sge = NULL;
 	cm->cm_sglsize = 0;
 	return (0);
 }
 
 /*
  * Prepare the mpr_command for a FW_DOWNLOAD request.
  */
 static int
 mpi_pre_fw_download(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI25_FW_DOWNLOAD_REQUEST *req = (void *)cm->cm_req;
 	MPI2_FW_DOWNLOAD_REPLY *rpl;
 	int error;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	if (cmd->len == 0)
 		return (EINVAL);
 
 	error = copyin(cmd->buf, cm->cm_data, cmd->len);
 	if (error != 0)
 		return (error);
 
 	mpr_init_sge(cm, req, &req->SGL);
 
 	/*
 	 * For now, the F/W image must be provided in a single request.
 	 */
 	if ((req->MsgFlags & MPI2_FW_DOWNLOAD_MSGFLGS_LAST_SEGMENT) == 0)
 		return (EINVAL);
 	if (req->TotalImageSize != cmd->len)
 		return (EINVAL);
 
 	req->ImageOffset = 0;
 	req->ImageSize = cmd->len;
 
 	cm->cm_flags |= MPR_CM_FLAGS_DATAOUT;
 
 	return (mpr_push_ieee_sge(cm, &req->SGL, 0));
 }
 
 /*
  * Prepare the mpr_command for a FW_UPLOAD request.
  */
 static int
 mpi_pre_fw_upload(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI25_FW_UPLOAD_REQUEST *req = (void *)cm->cm_req;
 	MPI2_FW_UPLOAD_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpr_init_sge(cm, req, &req->SGL);
 	if (cmd->len == 0) {
 		/* Perhaps just asking what the size of the fw is? */
 		return (0);
 	}
 
 	req->ImageOffset = 0;
 	req->ImageSize = cmd->len;
 
 	cm->cm_flags |= MPR_CM_FLAGS_DATAIN;
 
 	return (mpr_push_ieee_sge(cm, &req->SGL, 0));
 }
 
 /*
  * Prepare the mpr_command for a SATA_PASSTHROUGH request.
  */
 static int
 mpi_pre_sata_passthrough(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI2_SATA_PASSTHROUGH_REQUEST *req = (void *)cm->cm_req;
 	MPI2_SATA_PASSTHROUGH_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpr_init_sge(cm, req, &req->SGL);
 	return (0);
 }
 
 /*
  * Prepare the mpr_command for a SMP_PASSTHROUGH request.
  */
 static int
 mpi_pre_smp_passthrough(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI2_SMP_PASSTHROUGH_REQUEST *req = (void *)cm->cm_req;
 	MPI2_SMP_PASSTHROUGH_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpr_init_sge(cm, req, &req->SGL);
 	return (0);
 }
 
 /*
  * Prepare the mpr_command for a CONFIG request.
  */
 static int
 mpi_pre_config(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI2_CONFIG_REQUEST *req = (void *)cm->cm_req;
 	MPI2_CONFIG_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpr_init_sge(cm, req, &req->PageBufferSGE);
 	return (0);
 }
 
 /*
  * Prepare the mpr_command for a SAS_IO_UNIT_CONTROL request.
  */
 static int
 mpi_pre_sas_io_unit_control(struct mpr_command *cm,
 			     struct mpr_usr_command *cmd)
 {
 
 	cm->cm_sge = NULL;
 	cm->cm_sglsize = 0;
 	return (0);
 }
 
 /*
  * A set of functions to prepare an mpr_command for the various
  * supported requests.
  */
 struct mpr_user_func {
 	U8		Function;
 	mpr_user_f	*f_pre;
 } mpr_user_func_list[] = {
 	{ MPI2_FUNCTION_IOC_FACTS,		mpi_pre_ioc_facts },
 	{ MPI2_FUNCTION_PORT_FACTS,		mpi_pre_port_facts },
 	{ MPI2_FUNCTION_FW_DOWNLOAD, 		mpi_pre_fw_download },
 	{ MPI2_FUNCTION_FW_UPLOAD,		mpi_pre_fw_upload },
 	{ MPI2_FUNCTION_SATA_PASSTHROUGH,	mpi_pre_sata_passthrough },
 	{ MPI2_FUNCTION_SMP_PASSTHROUGH,	mpi_pre_smp_passthrough},
 	{ MPI2_FUNCTION_CONFIG,			mpi_pre_config},
 	{ MPI2_FUNCTION_SAS_IO_UNIT_CONTROL,	mpi_pre_sas_io_unit_control },
 	{ 0xFF,					NULL } /* list end */
 };
 
 static int
 mpr_user_setup_request(struct mpr_command *cm, struct mpr_usr_command *cmd)
 {
 	MPI2_REQUEST_HEADER *hdr = (MPI2_REQUEST_HEADER *)cm->cm_req;	
 	struct mpr_user_func *f;
 
 	for (f = mpr_user_func_list; f->f_pre != NULL; f++) {
 		if (hdr->Function == f->Function)
 			return (f->f_pre(cm, cmd));
 	}
 	return (EINVAL);
 }	
 
 static int
 mpr_user_command(struct mpr_softc *sc, struct mpr_usr_command *cmd)
 {
 	MPI2_REQUEST_HEADER *hdr;	
 	MPI2_DEFAULT_REPLY *rpl = NULL;
 	void *buf = NULL;
 	struct mpr_command *cm = NULL;
 	int err = 0;
 	int sz;
 
 	mpr_lock(sc);
 	cm = mpr_alloc_command(sc);
 
 	if (cm == NULL) {
 		mpr_printf(sc, "%s: no mpr requests\n", __func__);
 		err = ENOMEM;
 		goto RetFree;
 	}
 	mpr_unlock(sc);
 
 	hdr = (MPI2_REQUEST_HEADER *)cm->cm_req;
 
 	mpr_dprint(sc, MPR_USER, "%s: req %p %d  rpl %p %d\n", __func__,
 	    cmd->req, cmd->req_len, cmd->rpl, cmd->rpl_len);
 
 	if (cmd->req_len > (int)sc->reqframesz) {
 		err = EINVAL;
 		goto RetFreeUnlocked;
 	}
 	err = copyin(cmd->req, hdr, cmd->req_len);
 	if (err != 0)
 		goto RetFreeUnlocked;
 
 	mpr_dprint(sc, MPR_USER, "%s: Function %02X MsgFlags %02X\n", __func__,
 	    hdr->Function, hdr->MsgFlags);
 
 	if (cmd->len > 0) {
 		buf = malloc(cmd->len, M_MPRUSER, M_WAITOK|M_ZERO);
 		cm->cm_data = buf;
 		cm->cm_length = cmd->len;
 	} else {
 		cm->cm_data = NULL;
 		cm->cm_length = 0;
 	}
 
 	cm->cm_flags = MPR_CM_FLAGS_SGE_SIMPLE;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 
 	err = mpr_user_setup_request(cm, cmd);
 	if (err == EINVAL) {
 		mpr_printf(sc, "%s: unsupported parameter or unsupported "
 		    "function in request (function = 0x%X)\n", __func__,
 		    hdr->Function);
 	}
 	if (err != 0)
 		goto RetFreeUnlocked;
 
 	mpr_lock(sc);
 	err = mpr_wait_command(sc, &cm, 30, CAN_SLEEP);
 
 	if (err || (cm == NULL)) {
 		mpr_printf(sc, "%s: invalid request: error %d\n",
 		    __func__, err);
 		goto RetFree;
 	}
 
 	if (cm != NULL)
 		rpl = (MPI2_DEFAULT_REPLY *)cm->cm_reply;
 	if (rpl != NULL)
 		sz = rpl->MsgLength * 4;
 	else
 		sz = 0;
 
 	if (sz > cmd->rpl_len) {
 		mpr_printf(sc, "%s: user reply buffer (%d) smaller than "
 		    "returned buffer (%d)\n", __func__, cmd->rpl_len, sz);
 		sz = cmd->rpl_len;
 	}	
 
 	mpr_unlock(sc);
 	copyout(rpl, cmd->rpl, sz);
 	if (buf != NULL)
 		copyout(buf, cmd->buf, cmd->len);
 	mpr_dprint(sc, MPR_USER, "%s: reply size %d\n", __func__, sz);
 
 RetFreeUnlocked:
 	mpr_lock(sc);
 RetFree:
 	if (cm != NULL)
 		mpr_free_command(sc, cm);
 	mpr_unlock(sc);
 	if (buf != NULL)
 		free(buf, M_MPRUSER);
 	return (err);
 }
 
 static int
 mpr_user_pass_thru(struct mpr_softc *sc, mpr_pass_thru_t *data)
 {
 	MPI2_REQUEST_HEADER	*hdr, tmphdr;	
 	MPI2_DEFAULT_REPLY	*rpl;
 	Mpi26NVMeEncapsulatedErrorReply_t *nvme_error_reply = NULL;
 	Mpi26NVMeEncapsulatedRequest_t *nvme_encap_request = NULL;
 	struct mpr_command	*cm = NULL;
 	int			i, err = 0, dir = 0, sz;
 	uint8_t			tool, function = 0;
 	u_int			sense_len;
 	struct mprsas_target	*targ = NULL;
 
 	/*
 	 * Only allow one passthru command at a time.  Use the MPR_FLAGS_BUSY
 	 * bit to denote that a passthru is being processed.
 	 */
 	mpr_lock(sc);
 	if (sc->mpr_flags & MPR_FLAGS_BUSY) {
 		mpr_dprint(sc, MPR_USER, "%s: Only one passthru command "
 		    "allowed at a single time.", __func__);
 		mpr_unlock(sc);
 		return (EBUSY);
 	}
 	sc->mpr_flags |= MPR_FLAGS_BUSY;
 	mpr_unlock(sc);
 
 	/*
 	 * Do some validation on data direction.  Valid cases are:
 	 *    1) DataSize is 0 and direction is NONE
 	 *    2) DataSize is non-zero and one of:
 	 *        a) direction is READ or
 	 *        b) direction is WRITE or
 	 *        c) direction is BOTH and DataOutSize is non-zero
 	 * If valid and the direction is BOTH, change the direction to READ.
 	 * if valid and the direction is not BOTH, make sure DataOutSize is 0.
 	 */
 	if (((data->DataSize == 0) &&
 	    (data->DataDirection == MPR_PASS_THRU_DIRECTION_NONE)) ||
 	    ((data->DataSize != 0) &&
 	    ((data->DataDirection == MPR_PASS_THRU_DIRECTION_READ) ||
 	    (data->DataDirection == MPR_PASS_THRU_DIRECTION_WRITE) ||
 	    ((data->DataDirection == MPR_PASS_THRU_DIRECTION_BOTH) &&
 	    (data->DataOutSize != 0))))) {
 		if (data->DataDirection == MPR_PASS_THRU_DIRECTION_BOTH)
 			data->DataDirection = MPR_PASS_THRU_DIRECTION_READ;
 		else
 			data->DataOutSize = 0;
 	} else {
 		err = EINVAL;
 		goto RetFreeUnlocked;
 	}
 
 	mpr_dprint(sc, MPR_USER, "%s: req 0x%jx %d  rpl 0x%jx %d "
 	    "data in 0x%jx %d data out 0x%jx %d data dir %d\n", __func__,
 	    data->PtrRequest, data->RequestSize, data->PtrReply,
 	    data->ReplySize, data->PtrData, data->DataSize,
 	    data->PtrDataOut, data->DataOutSize, data->DataDirection);
 
 	/*
 	 * copy in the header so we know what we're dealing with before we
 	 * commit to allocating a command for it.
 	 */
 	err = copyin(PTRIN(data->PtrRequest), &tmphdr, data->RequestSize);
 	if (err != 0)
 		goto RetFreeUnlocked;
 
 	if (data->RequestSize > (int)sc->reqframesz) {
 		err = EINVAL;
 		goto RetFreeUnlocked;
 	}
 
 	function = tmphdr.Function;
 	mpr_dprint(sc, MPR_USER, "%s: Function %02X MsgFlags %02X\n", __func__,
 	    function, tmphdr.MsgFlags);
 
 	/*
 	 * Handle a passthru TM request.
 	 */
 	if (function == MPI2_FUNCTION_SCSI_TASK_MGMT) {
 		MPI2_SCSI_TASK_MANAGE_REQUEST	*task;
 
 		mpr_lock(sc);
 		cm = mprsas_alloc_tm(sc);
 		if (cm == NULL) {
 			err = EINVAL;
 			goto Ret;
 		}
 
 		/* Copy the header in.  Only a small fixup is needed. */
 		task = (MPI2_SCSI_TASK_MANAGE_REQUEST *)cm->cm_req;
 		bcopy(&tmphdr, task, data->RequestSize);
 		task->TaskMID = cm->cm_desc.Default.SMID;
 
 		cm->cm_data = NULL;
 		cm->cm_complete = NULL;
 		cm->cm_complete_data = NULL;
 
 		targ = mprsas_find_target_by_handle(sc->sassc, 0,
 		    task->DevHandle);
 		if (targ == NULL) {
 			mpr_dprint(sc, MPR_INFO,
 			   "%s %d : invalid handle for requested TM 0x%x \n",
 			   __func__, __LINE__, task->DevHandle);
 			err = 1;
 		} else {
 			mprsas_prepare_for_tm(sc, cm, targ, CAM_LUN_WILDCARD);
 			err = mpr_wait_command(sc, &cm, 30, CAN_SLEEP);
 		}
 
 		if (err != 0) {
 			err = EIO;
 			mpr_dprint(sc, MPR_FAULT, "%s: task management failed",
 			    __func__);
 		}
 		/*
 		 * Copy the reply data and sense data to user space.
 		 */
 		if ((cm != NULL) && (cm->cm_reply != NULL)) {
 			rpl = (MPI2_DEFAULT_REPLY *)cm->cm_reply;
 			sz = rpl->MsgLength * 4;
 
 			if (sz > data->ReplySize) {
 				mpr_printf(sc, "%s: user reply buffer (%d) "
 				    "smaller than returned buffer (%d)\n",
 				    __func__, data->ReplySize, sz);
 			}
 			mpr_unlock(sc);
 			copyout(cm->cm_reply, PTRIN(data->PtrReply),
 			    data->ReplySize);
 			mpr_lock(sc);
 		}
 		mprsas_free_tm(sc, cm);
 		goto Ret;
 	}
 
 	mpr_lock(sc);
 	cm = mpr_alloc_command(sc);
 
 	if (cm == NULL) {
 		mpr_printf(sc, "%s: no mpr requests\n", __func__);
 		err = ENOMEM;
 		goto Ret;
 	}
 	mpr_unlock(sc);
 
 	hdr = (MPI2_REQUEST_HEADER *)cm->cm_req;
 	bcopy(&tmphdr, hdr, data->RequestSize);
 
 	/*
 	 * Do some checking to make sure the IOCTL request contains a valid
 	 * request.  Then set the SGL info.
 	 */
 	mpr_init_sge(cm, hdr, (void *)((uint8_t *)hdr + data->RequestSize));
 
 	/*
 	 * Set up for read, write or both.  From check above, DataOutSize will
 	 * be 0 if direction is READ or WRITE, but it will have some non-zero
 	 * value if the direction is BOTH.  So, just use the biggest size to get
 	 * the cm_data buffer size.  If direction is BOTH, 2 SGLs need to be set
 	 * up; the first is for the request and the second will contain the
 	 * response data. cm_out_len needs to be set here and this will be used
 	 * when the SGLs are set up.
 	 */
 	cm->cm_data = NULL;
 	cm->cm_length = MAX(data->DataSize, data->DataOutSize);
 	cm->cm_out_len = data->DataOutSize;
 	cm->cm_flags = 0;
 	if (cm->cm_length != 0) {
 		cm->cm_data = malloc(cm->cm_length, M_MPRUSER, M_WAITOK |
 		    M_ZERO);
 		cm->cm_flags = MPR_CM_FLAGS_DATAIN;
 		if (data->DataOutSize) {
 			cm->cm_flags |= MPR_CM_FLAGS_DATAOUT;
 			err = copyin(PTRIN(data->PtrDataOut),
 			    cm->cm_data, data->DataOutSize);
 		} else if (data->DataDirection ==
 		    MPR_PASS_THRU_DIRECTION_WRITE) {
 			cm->cm_flags = MPR_CM_FLAGS_DATAOUT;
 			err = copyin(PTRIN(data->PtrData),
 			    cm->cm_data, data->DataSize);
 		}
 		if (err != 0)
 			mpr_dprint(sc, MPR_FAULT, "%s: failed to copy IOCTL "
 			    "data from user space\n", __func__);
 	}
 	/*
 	 * Set this flag only if processing a command that does not need an
 	 * IEEE SGL.  The CLI Tool within the Toolbox uses IEEE SGLs, so clear
 	 * the flag only for that tool if processing a Toolbox function.
 	 */
 	cm->cm_flags |= MPR_CM_FLAGS_SGE_SIMPLE;
 	for (i = 0; i < sizeof (ieee_sgl_func_list); i++) {
 		if (function == ieee_sgl_func_list[i]) {
 			if (function == MPI2_FUNCTION_TOOLBOX)
 			{
 				tool = (uint8_t)hdr->FunctionDependent1;
 				if (tool != MPI2_TOOLBOX_DIAGNOSTIC_CLI_TOOL)
 					break;
 			}
 			cm->cm_flags &= ~MPR_CM_FLAGS_SGE_SIMPLE;
 			break;
 		}
 	}
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 
 	if (function == MPI2_FUNCTION_NVME_ENCAPSULATED) {
 		nvme_encap_request =
 		    (Mpi26NVMeEncapsulatedRequest_t *)cm->cm_req;
 		cm->cm_desc.Default.RequestFlags =
 		    MPI26_REQ_DESCRIPT_FLAGS_PCIE_ENCAPSULATED;
 
 		/*
 		 * Get the Physical Address of the sense buffer.
 		 * Save the user's Error Response buffer address and use that
 		 *   field to hold the sense buffer address.
 		 * Clear the internal sense buffer, which will potentially hold
 		 *   the Completion Queue Entry on return, or 0 if no Entry.
 		 * Build the PRPs and set direction bits.
 		 * Send the request.
 		 */
 		cm->nvme_error_response =
 		    (uint64_t *)(uintptr_t)(((uint64_t)nvme_encap_request->
 		    ErrorResponseBaseAddress.High << 32) |
 		    (uint64_t)nvme_encap_request->
 		    ErrorResponseBaseAddress.Low);
 		nvme_encap_request->ErrorResponseBaseAddress.High =
 		    htole32((uint32_t)((uint64_t)cm->cm_sense_busaddr >> 32));
 		nvme_encap_request->ErrorResponseBaseAddress.Low =
 		    htole32(cm->cm_sense_busaddr);
 		memset(cm->cm_sense, 0, NVME_ERROR_RESPONSE_SIZE);
 		mpr_build_nvme_prp(sc, cm, nvme_encap_request, cm->cm_data,
 		    data->DataSize, data->DataOutSize);
 	}
 
 	/*
 	 * Set up Sense buffer and SGL offset for IO passthru.  SCSI IO request
 	 * uses SCSI IO or Fast Path SCSI IO descriptor.
 	 */
 	if ((function == MPI2_FUNCTION_SCSI_IO_REQUEST) ||
 	    (function == MPI2_FUNCTION_RAID_SCSI_IO_PASSTHROUGH)) {
 		MPI2_SCSI_IO_REQUEST	*scsi_io_req;
 
 		scsi_io_req = (MPI2_SCSI_IO_REQUEST *)hdr;
 		/*
 		 * Put SGE for data and data_out buffer at the end of
 		 * scsi_io_request message header (64 bytes in total).
 		 * Following above SGEs, the residual space will be used by
 		 * sense data.
 		 */
 		scsi_io_req->SenseBufferLength = (uint8_t)(data->RequestSize -
 		    64);
 		scsi_io_req->SenseBufferLowAddress =
 		    htole32(cm->cm_sense_busaddr);
 
 		/*
 		 * Set SGLOffset0 value.  This is the number of dwords that SGL
 		 * is offset from the beginning of MPI2_SCSI_IO_REQUEST struct.
 		 */
 		scsi_io_req->SGLOffset0 = 24;
 
 		/*
 		 * Setup descriptor info.  RAID passthrough must use the
 		 * default request descriptor which is already set, so if this
 		 * is a SCSI IO request, change the descriptor to SCSI IO or
 		 * Fast Path SCSI IO.  Also, if this is a SCSI IO request,
 		 * handle the reply in the mprsas_scsio_complete function.
 		 */
 		if (function == MPI2_FUNCTION_SCSI_IO_REQUEST) {
 			targ = mprsas_find_target_by_handle(sc->sassc, 0,
 			    scsi_io_req->DevHandle);
 
 			if (!targ) {
 				printf("No Target found for handle %d\n",
 				    scsi_io_req->DevHandle);
 				err = EINVAL;
 				goto RetFreeUnlocked;
 			}
 
 			if (targ->scsi_req_desc_type ==
 			    MPI25_REQ_DESCRIPT_FLAGS_FAST_PATH_SCSI_IO) {
 				cm->cm_desc.FastPathSCSIIO.RequestFlags =
 				    MPI25_REQ_DESCRIPT_FLAGS_FAST_PATH_SCSI_IO;
 				if (!sc->atomic_desc_capable) {
 					cm->cm_desc.FastPathSCSIIO.DevHandle =
 					    scsi_io_req->DevHandle;
 				}
 				scsi_io_req->IoFlags |=
 				    MPI25_SCSIIO_IOFLAGS_FAST_PATH;
 			} else {
 				cm->cm_desc.SCSIIO.RequestFlags =
 				    MPI2_REQ_DESCRIPT_FLAGS_SCSI_IO;
 				if (!sc->atomic_desc_capable) {
 					cm->cm_desc.SCSIIO.DevHandle =
 					    scsi_io_req->DevHandle;
 				}
 			}
 
 			/*
 			 * Make sure the DevHandle is not 0 because this is a
 			 * likely error.
 			 */
 			if (scsi_io_req->DevHandle == 0) {
 				err = EINVAL;
 				goto RetFreeUnlocked;
 			}
 		}
 	}
 
 	mpr_lock(sc);
 
 	err = mpr_wait_command(sc, &cm, 30, CAN_SLEEP);
 
 	if (err || (cm == NULL)) {
 		mpr_printf(sc, "%s: invalid request: error %d\n", __func__,
 		    err);
 		goto RetFree;
 	}
 
 	/*
 	 * Sync the DMA data, if any.  Then copy the data to user space.
 	 */
 	if (cm->cm_data != NULL) {
 		if (cm->cm_flags & MPR_CM_FLAGS_DATAIN)
 			dir = BUS_DMASYNC_POSTREAD;
 		else if (cm->cm_flags & MPR_CM_FLAGS_DATAOUT)
 			dir = BUS_DMASYNC_POSTWRITE;
 		bus_dmamap_sync(sc->buffer_dmat, cm->cm_dmamap, dir);
 		bus_dmamap_unload(sc->buffer_dmat, cm->cm_dmamap);
 
 		if (cm->cm_flags & MPR_CM_FLAGS_DATAIN) {
 			mpr_unlock(sc);
 			err = copyout(cm->cm_data,
 			    PTRIN(data->PtrData), data->DataSize);
 			mpr_lock(sc);
 			if (err != 0)
 				mpr_dprint(sc, MPR_FAULT, "%s: failed to copy "
 				    "IOCTL data to user space\n", __func__);
 		}
 	}
 
 	/*
 	 * Copy the reply data and sense data to user space.
 	 */
 	if (cm->cm_reply != NULL) {
 		rpl = (MPI2_DEFAULT_REPLY *)cm->cm_reply;
 		sz = rpl->MsgLength * 4;
 
 		if (sz > data->ReplySize) {
 			mpr_printf(sc, "%s: user reply buffer (%d) smaller "
 			    "than returned buffer (%d)\n", __func__,
 			    data->ReplySize, sz);
 		}
 		mpr_unlock(sc);
 		copyout(cm->cm_reply, PTRIN(data->PtrReply), data->ReplySize);
 		mpr_lock(sc);
 
 		if ((function == MPI2_FUNCTION_SCSI_IO_REQUEST) ||
 		    (function == MPI2_FUNCTION_RAID_SCSI_IO_PASSTHROUGH)) {
 			if (((MPI2_SCSI_IO_REPLY *)rpl)->SCSIState &
 			    MPI2_SCSI_STATE_AUTOSENSE_VALID) {
 				sense_len =
 				    MIN((le32toh(((MPI2_SCSI_IO_REPLY *)rpl)->
 				    SenseCount)), sizeof(struct
 				    scsi_sense_data));
 				mpr_unlock(sc);
 				copyout(cm->cm_sense, (PTRIN(data->PtrReply +
 				    sizeof(MPI2_SCSI_IO_REPLY))), sense_len);
 				mpr_lock(sc);
 			}
 		}
 
 		/*
 		 * Copy out the NVMe Error Reponse to user. The Error Response
 		 * buffer is given by the user, but a sense buffer is used to
 		 * get that data from the IOC. The user's
 		 * ErrorResponseBaseAddress is saved in the
 		 * 'nvme_error_response' field before the command because that
 		 * field is set to a sense buffer. When the command is
 		 * complete, the Error Response data from the IOC is copied to
 		 * that user address after it is checked for validity.
 		 * Also note that 'sense' buffers are not defined for
 		 * NVMe commands. Sense terminalogy is only used here so that
 		 * the same IOCTL structure and sense buffers can be used for
 		 * NVMe.
 		 */
 		if (function == MPI2_FUNCTION_NVME_ENCAPSULATED) {
 			if (cm->nvme_error_response == NULL) {
 				mpr_dprint(sc, MPR_INFO, "NVMe Error Response "
 				    "buffer is NULL. Response data will not be "
 				    "returned.\n");
 				mpr_unlock(sc);
 				goto RetFreeUnlocked;
 			}
 
 			nvme_error_reply =
 			    (Mpi26NVMeEncapsulatedErrorReply_t *)cm->cm_reply;
 			sz = MIN(le32toh(nvme_error_reply->ErrorResponseCount),
 			    NVME_ERROR_RESPONSE_SIZE);
 			mpr_unlock(sc);
 			copyout(cm->cm_sense,
 			    (PTRIN(data->PtrReply +
 			    sizeof(MPI2_SCSI_IO_REPLY))), sz);
 			mpr_lock(sc);
 		}
 	}
 	mpr_unlock(sc);
 
 RetFreeUnlocked:
 	mpr_lock(sc);
 
 RetFree:
 	if (cm != NULL) {
 		if (cm->cm_data)
 			free(cm->cm_data, M_MPRUSER);
 		mpr_free_command(sc, cm);
 	}
 Ret:
 	sc->mpr_flags &= ~MPR_FLAGS_BUSY;
 	mpr_unlock(sc);
 
 	return (err);
 }
 
 static void
 mpr_user_get_adapter_data(struct mpr_softc *sc, mpr_adapter_data_t *data)
 {
 	Mpi2ConfigReply_t	mpi_reply;
 	Mpi2BiosPage3_t		config_page;
 
 	/*
 	 * Use the PCI interface functions to get the Bus, Device, and Function
 	 * information.
 	 */
 	data->PciInformation.u.bits.BusNumber = pci_get_bus(sc->mpr_dev);
 	data->PciInformation.u.bits.DeviceNumber = pci_get_slot(sc->mpr_dev);
 	data->PciInformation.u.bits.FunctionNumber =
 	    pci_get_function(sc->mpr_dev);
 
 	/*
 	 * Get the FW version that should already be saved in IOC Facts.
 	 */
 	data->MpiFirmwareVersion = sc->facts->FWVersion.Word;
 
 	/*
 	 * General device info.
 	 */
 	if (sc->mpr_flags & MPR_FLAGS_GEN35_IOC)
 		data->AdapterType = MPRIOCTL_ADAPTER_TYPE_SAS35;
 	else
 		data->AdapterType = MPRIOCTL_ADAPTER_TYPE_SAS3;
 	data->PCIDeviceHwId = pci_get_device(sc->mpr_dev);
 	data->PCIDeviceHwRev = pci_read_config(sc->mpr_dev, PCIR_REVID, 1);
 	data->SubSystemId = pci_get_subdevice(sc->mpr_dev);
 	data->SubsystemVendorId = pci_get_subvendor(sc->mpr_dev);
 
 	/*
 	 * Get the driver version.
 	 */
 	strcpy((char *)&data->DriverVersion[0], MPR_DRIVER_VERSION);
 
 	/*
 	 * Need to get BIOS Config Page 3 for the BIOS Version.
 	 */
 	data->BiosVersion = 0;
 	mpr_lock(sc);
 	if (mpr_config_get_bios_pg3(sc, &mpi_reply, &config_page))
 		printf("%s: Error while retrieving BIOS Version\n", __func__);
 	else
 		data->BiosVersion = config_page.BiosVersion;
 	mpr_unlock(sc);
 }
 
 static void
 mpr_user_read_pci_info(struct mpr_softc *sc, mpr_pci_info_t *data)
 {
 	int	i;
 
 	/*
 	 * Use the PCI interface functions to get the Bus, Device, and Function
 	 * information.
 	 */
 	data->BusNumber = pci_get_bus(sc->mpr_dev);
 	data->DeviceNumber = pci_get_slot(sc->mpr_dev);
 	data->FunctionNumber = pci_get_function(sc->mpr_dev);
 
 	/*
 	 * Now get the interrupt vector and the pci header.  The vector can
 	 * only be 0 right now.  The header is the first 256 bytes of config
 	 * space.
 	 */
 	data->InterruptVector = 0;
 	for (i = 0; i < sizeof (data->PciHeader); i++) {
 		data->PciHeader[i] = pci_read_config(sc->mpr_dev, i, 1);
 	}
 }
 
 static uint8_t
 mpr_get_fw_diag_buffer_number(struct mpr_softc *sc, uint32_t unique_id)
 {
 	uint8_t	index;
 
 	for (index = 0; index < MPI2_DIAG_BUF_TYPE_COUNT; index++) {
 		if (sc->fw_diag_buffer_list[index].unique_id == unique_id) {
 			return (index);
 		}
 	}
 
 	return (MPR_FW_DIAGNOSTIC_UID_NOT_FOUND);
 }
 
 static int
 mpr_post_fw_diag_buffer(struct mpr_softc *sc,
     mpr_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code)
 {
 	MPI2_DIAG_BUFFER_POST_REQUEST	*req;
 	MPI2_DIAG_BUFFER_POST_REPLY	*reply;
 	struct mpr_command		*cm = NULL;
 	int				i, status;
 
 	/*
 	 * If buffer is not enabled, just leave.
 	 */
 	*return_code = MPR_FW_DIAG_ERROR_POST_FAILED;
 	if (!pBuffer->enabled) {
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * Clear some flags initially.
 	 */
 	pBuffer->force_release = FALSE;
 	pBuffer->valid_data = FALSE;
 	pBuffer->owned_by_firmware = FALSE;
 
 	/*
 	 * Get a command.
 	 */
 	cm = mpr_alloc_command(sc);
 	if (cm == NULL) {
 		mpr_printf(sc, "%s: no mpr requests\n", __func__);
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * Build the request for releasing the FW Diag Buffer and send it.
 	 */
 	req = (MPI2_DIAG_BUFFER_POST_REQUEST *)cm->cm_req;
 	req->Function = MPI2_FUNCTION_DIAG_BUFFER_POST;
 	req->BufferType = pBuffer->buffer_type;
 	req->ExtendedType = pBuffer->extended_type;
 	req->BufferLength = pBuffer->size;
 	for (i = 0; i < (sizeof(req->ProductSpecific) / 4); i++)
 		req->ProductSpecific[i] = pBuffer->product_specific[i];
 	mpr_from_u64(sc->fw_diag_busaddr, &req->BufferAddress);
 	cm->cm_data = NULL;
 	cm->cm_length = 0;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_complete_data = NULL;
 
 	/*
 	 * Send command synchronously.
 	 */
 	status = mpr_wait_command(sc, &cm, 30, CAN_SLEEP);
 	if (status || (cm == NULL)) {
 		mpr_printf(sc, "%s: invalid request: error %d\n", __func__,
 		    status);
 		status = MPR_DIAG_FAILURE;
 		goto done;
 	}
 
 	/*
 	 * Process POST reply.
 	 */
 	reply = (MPI2_DIAG_BUFFER_POST_REPLY *)cm->cm_reply;
 	if (reply == NULL) {
 		mpr_printf(sc, "%s: reply is NULL, probably due to "
 		    "reinitialization", __func__);
 		status = MPR_DIAG_FAILURE;
 		goto done;
 	}
 
 	if ((le16toh(reply->IOCStatus) & MPI2_IOCSTATUS_MASK) !=
 	    MPI2_IOCSTATUS_SUCCESS) {
 		status = MPR_DIAG_FAILURE;
 		mpr_dprint(sc, MPR_FAULT, "%s: post of FW  Diag Buffer failed "
 		    "with IOCStatus = 0x%x, IOCLogInfo = 0x%x and "
 		    "TransferLength = 0x%x\n", __func__,
 		    le16toh(reply->IOCStatus), le32toh(reply->IOCLogInfo),
 		    le32toh(reply->TransferLength));
 		goto done;
 	}
 
 	/*
 	 * Post was successful.
 	 */
 	pBuffer->valid_data = TRUE;
 	pBuffer->owned_by_firmware = TRUE;
 	*return_code = MPR_FW_DIAG_ERROR_SUCCESS;
 	status = MPR_DIAG_SUCCESS;
 
 done:
 	if (cm != NULL)
 		mpr_free_command(sc, cm);
 	return (status);
 }
 
 static int
 mpr_release_fw_diag_buffer(struct mpr_softc *sc,
     mpr_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code,
     uint32_t diag_type)
 {
 	MPI2_DIAG_RELEASE_REQUEST	*req;
 	MPI2_DIAG_RELEASE_REPLY		*reply;
 	struct mpr_command		*cm = NULL;
 	int				status;
 
 	/*
 	 * If buffer is not enabled, just leave.
 	 */
 	*return_code = MPR_FW_DIAG_ERROR_RELEASE_FAILED;
 	if (!pBuffer->enabled) {
 		mpr_dprint(sc, MPR_USER, "%s: This buffer type is not "
 		    "supported by the IOC", __func__);
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * Clear some flags initially.
 	 */
 	pBuffer->force_release = FALSE;
 	pBuffer->valid_data = FALSE;
 	pBuffer->owned_by_firmware = FALSE;
 
 	/*
 	 * Get a command.
 	 */
 	cm = mpr_alloc_command(sc);
 	if (cm == NULL) {
 		mpr_printf(sc, "%s: no mpr requests\n", __func__);
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * Build the request for releasing the FW Diag Buffer and send it.
 	 */
 	req = (MPI2_DIAG_RELEASE_REQUEST *)cm->cm_req;
 	req->Function = MPI2_FUNCTION_DIAG_RELEASE;
 	req->BufferType = pBuffer->buffer_type;
 	cm->cm_data = NULL;
 	cm->cm_length = 0;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_complete_data = NULL;
 
 	/*
 	 * Send command synchronously.
 	 */
 	status = mpr_wait_command(sc, &cm, 30, CAN_SLEEP);
 	if (status || (cm == NULL)) {
 		mpr_printf(sc, "%s: invalid request: error %d\n", __func__,
 		    status);
 		status = MPR_DIAG_FAILURE;
 		goto done;
 	}
 
 	/*
 	 * Process RELEASE reply.
 	 */
 	reply = (MPI2_DIAG_RELEASE_REPLY *)cm->cm_reply;
 	if (reply == NULL) {
 		mpr_printf(sc, "%s: reply is NULL, probably due to "
 		    "reinitialization", __func__);
 		status = MPR_DIAG_FAILURE;
 		goto done;
 	}
 	if (((le16toh(reply->IOCStatus) & MPI2_IOCSTATUS_MASK) !=
 	    MPI2_IOCSTATUS_SUCCESS) || pBuffer->owned_by_firmware) {
 		status = MPR_DIAG_FAILURE;
 		mpr_dprint(sc, MPR_FAULT, "%s: release of FW Diag Buffer "
 		    "failed with IOCStatus = 0x%x and IOCLogInfo = 0x%x\n",
 		    __func__, le16toh(reply->IOCStatus),
 		    le32toh(reply->IOCLogInfo));
 		goto done;
 	}
 
 	/*
 	 * Release was successful.
 	 */
 	*return_code = MPR_FW_DIAG_ERROR_SUCCESS;
 	status = MPR_DIAG_SUCCESS;
 
 	/*
 	 * If this was for an UNREGISTER diag type command, clear the unique ID.
 	 */
 	if (diag_type == MPR_FW_DIAG_TYPE_UNREGISTER) {
 		pBuffer->unique_id = MPR_FW_DIAG_INVALID_UID;
 	}
 
 done:
 	if (cm != NULL)
 		mpr_free_command(sc, cm);
 
 	return (status);
 }
 
 static int
 mpr_diag_register(struct mpr_softc *sc, mpr_fw_diag_register_t *diag_register,
     uint32_t *return_code)
 {
-	bus_dma_tag_template_t		t;
+	bus_dma_template_t		t;
 	mpr_fw_diagnostic_buffer_t	*pBuffer;
 	struct mpr_busdma_context	*ctx;
 	uint8_t				extended_type, buffer_type, i;
 	uint32_t			buffer_size;
 	uint32_t			unique_id;
 	int				status;
 	int				error;
 
 	extended_type = diag_register->ExtendedType;
 	buffer_type = diag_register->BufferType;
 	buffer_size = diag_register->RequestedBufferSize;
 	unique_id = diag_register->UniqueId;
 	ctx = NULL;
 	error = 0;
 
 	/*
 	 * Check for valid buffer type
 	 */
 	if (buffer_type >= MPI2_DIAG_BUF_TYPE_COUNT) {
 		*return_code = MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should not be found.  If it is, the ID is already in use.
 	 */
 	i = mpr_get_fw_diag_buffer_number(sc, unique_id);
 	pBuffer = &sc->fw_diag_buffer_list[buffer_type];
 	if (i != MPR_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPR_FW_DIAG_ERROR_INVALID_UID;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * The buffer's unique ID should not be registered yet, and the given
 	 * unique ID cannot be 0.
 	 */
 	if ((pBuffer->unique_id != MPR_FW_DIAG_INVALID_UID) ||
 	    (unique_id == MPR_FW_DIAG_INVALID_UID)) {
 		*return_code = MPR_FW_DIAG_ERROR_INVALID_UID;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * If this buffer is already posted as immediate, just change owner.
 	 */
 	if (pBuffer->immediate && pBuffer->owned_by_firmware &&
 	    (pBuffer->unique_id == MPR_FW_DIAG_INVALID_UID)) {
 		pBuffer->immediate = FALSE;
 		pBuffer->unique_id = unique_id;
 		return (MPR_DIAG_SUCCESS);
 	}
 
 	/*
 	 * Post a new buffer after checking if it's enabled.  The DMA buffer
 	 * that is allocated will be contiguous (nsegments = 1).
 	 */
 	if (!pBuffer->enabled) {
 		*return_code = MPR_FW_DIAG_ERROR_NO_BUFFER;
 		return (MPR_DIAG_FAILURE);
 	}
 	bus_dma_template_init(&t, sc->mpr_parent_dmat);
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = buffer_size;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT),
+	    BD_MAXSIZE(buffer_size), BD_MAXSEGSIZE(buffer_size),
+	    BD_NSEGMENTS(1));
 	if (bus_dma_template_tag(&t, &sc->fw_diag_dmat)) {
 		mpr_dprint(sc, MPR_ERROR,
 		    "Cannot allocate FW diag buffer DMA tag\n");
 		*return_code = MPR_FW_DIAG_ERROR_NO_BUFFER;
 		status = MPR_DIAG_FAILURE;
 		goto bailout;
 	}
         if (bus_dmamem_alloc(sc->fw_diag_dmat, (void **)&sc->fw_diag_buffer,
 	    BUS_DMA_NOWAIT, &sc->fw_diag_map)) {
 		mpr_dprint(sc, MPR_ERROR,
 		    "Cannot allocate FW diag buffer memory\n");
 		*return_code = MPR_FW_DIAG_ERROR_NO_BUFFER;
 		status = MPR_DIAG_FAILURE;
 		goto bailout;
 	}
 	bzero(sc->fw_diag_buffer, buffer_size);
 
 	ctx = malloc(sizeof(*ctx), M_MPR, M_WAITOK | M_ZERO);
 	ctx->addr = &sc->fw_diag_busaddr;
 	ctx->buffer_dmat = sc->fw_diag_dmat;
 	ctx->buffer_dmamap = sc->fw_diag_map;
 	ctx->softc = sc;
 	error = bus_dmamap_load(sc->fw_diag_dmat, sc->fw_diag_map,
 	    sc->fw_diag_buffer, buffer_size, mpr_memaddr_wait_cb,
 	    ctx, 0);
 	if (error == EINPROGRESS) {
 		/* XXX KDM */
 		device_printf(sc->mpr_dev, "%s: Deferred bus_dmamap_load\n",
 		    __func__);
 		/*
 		 * Wait for the load to complete.  If we're interrupted,
 		 * bail out.
 		 */
 		mpr_lock(sc);
 		if (ctx->completed == 0) {
 			error = msleep(ctx, &sc->mpr_mtx, PCATCH, "mprwait", 0);
 			if (error != 0) {
 				/*
 				 * We got an error from msleep(9).  This is
 				 * most likely due to a signal.  Tell
 				 * mpr_memaddr_wait_cb() that we've abandoned
 				 * the context, so it needs to clean up when
 				 * it is called.
 				 */
 				ctx->abandoned = 1;
 
 				/* The callback will free this memory */
 				ctx = NULL;
 				mpr_unlock(sc);
 
 				device_printf(sc->mpr_dev, "Cannot "
 				    "bus_dmamap_load FW diag buffer, error = "
 				    "%d returned from msleep\n", error);
 				*return_code = MPR_FW_DIAG_ERROR_NO_BUFFER;
 				status = MPR_DIAG_FAILURE;
 				goto bailout;
 			}
 		}
 		mpr_unlock(sc);
 	} 
 
 	if ((error != 0) || (ctx->error != 0)) {
 		device_printf(sc->mpr_dev, "Cannot bus_dmamap_load FW diag "
 		    "buffer, %serror = %d\n", error ? "" : "callback ",
 		    error ? error : ctx->error);
 		*return_code = MPR_FW_DIAG_ERROR_NO_BUFFER;
 		status = MPR_DIAG_FAILURE;
 		goto bailout;
 	}
 
 	bus_dmamap_sync(sc->fw_diag_dmat, sc->fw_diag_map, BUS_DMASYNC_PREREAD);
 
 	pBuffer->size = buffer_size;
 
 	/*
 	 * Copy the given info to the diag buffer and post the buffer.
 	 */
 	pBuffer->buffer_type = buffer_type;
 	pBuffer->immediate = FALSE;
 	if (buffer_type == MPI2_DIAG_BUF_TYPE_TRACE) {
 		for (i = 0; i < (sizeof (pBuffer->product_specific) / 4);
 		    i++) {
 			pBuffer->product_specific[i] =
 			    diag_register->ProductSpecific[i];
 		}
 	}
 	pBuffer->extended_type = extended_type;
 	pBuffer->unique_id = unique_id;
 	status = mpr_post_fw_diag_buffer(sc, pBuffer, return_code);
 
 bailout:
 
 	/*
 	 * In case there was a failure, free the DMA buffer.
 	 */
 	if (status == MPR_DIAG_FAILURE) {
 		if (sc->fw_diag_busaddr != 0) {
 			bus_dmamap_unload(sc->fw_diag_dmat, sc->fw_diag_map);
 			sc->fw_diag_busaddr = 0;
 		}
 		if (sc->fw_diag_buffer != NULL) {
 			bus_dmamem_free(sc->fw_diag_dmat, sc->fw_diag_buffer,
 			    sc->fw_diag_map);
 			sc->fw_diag_buffer = NULL;
 		}
 		if (sc->fw_diag_dmat != NULL) {
 			bus_dma_tag_destroy(sc->fw_diag_dmat);
 			sc->fw_diag_dmat = NULL;
 		}
 	}
 
 	if (ctx != NULL)
 		free(ctx, M_MPR);
 
 	return (status);
 }
 
 static int
 mpr_diag_unregister(struct mpr_softc *sc,
     mpr_fw_diag_unregister_t *diag_unregister, uint32_t *return_code)
 {
 	mpr_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i;
 	uint32_t			unique_id;
 	int				status;
 
 	unique_id = diag_unregister->UniqueId;
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should be there.
 	 */
 	i = mpr_get_fw_diag_buffer_number(sc, unique_id);
 	if (i == MPR_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPR_FW_DIAG_ERROR_INVALID_UID;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	pBuffer = &sc->fw_diag_buffer_list[i];
 
 	/*
 	 * Try to release the buffer from FW before freeing it.  If release
 	 * fails, don't free the DMA buffer in case FW tries to access it
 	 * later.  If buffer is not owned by firmware, can't release it.
 	 */
 	if (!pBuffer->owned_by_firmware) {
 		status = MPR_DIAG_SUCCESS;
 	} else {
 		status = mpr_release_fw_diag_buffer(sc, pBuffer, return_code,
 		    MPR_FW_DIAG_TYPE_UNREGISTER);
 	}
 
 	/*
 	 * At this point, return the current status no matter what happens with
 	 * the DMA buffer.
 	 */
 	pBuffer->unique_id = MPR_FW_DIAG_INVALID_UID;
 	if (status == MPR_DIAG_SUCCESS) {
 		if (sc->fw_diag_busaddr != 0) {
 			bus_dmamap_unload(sc->fw_diag_dmat, sc->fw_diag_map);
 			sc->fw_diag_busaddr = 0;
 		}
 		if (sc->fw_diag_buffer != NULL) {
 			bus_dmamem_free(sc->fw_diag_dmat, sc->fw_diag_buffer,
 			    sc->fw_diag_map);
 			sc->fw_diag_buffer = NULL;
 		}
 		if (sc->fw_diag_dmat != NULL) {
 			bus_dma_tag_destroy(sc->fw_diag_dmat);
 			sc->fw_diag_dmat = NULL;
 		}
 	}
 
 	return (status);
 }
 
 static int
 mpr_diag_query(struct mpr_softc *sc, mpr_fw_diag_query_t *diag_query,
     uint32_t *return_code)
 {
 	mpr_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i;
 	uint32_t			unique_id;
 
 	unique_id = diag_query->UniqueId;
 
 	/*
 	 * If ID is valid, query on ID.
 	 * If ID is invalid, query on buffer type.
 	 */
 	if (unique_id == MPR_FW_DIAG_INVALID_UID) {
 		i = diag_query->BufferType;
 		if (i >= MPI2_DIAG_BUF_TYPE_COUNT) {
 			*return_code = MPR_FW_DIAG_ERROR_INVALID_UID;
 			return (MPR_DIAG_FAILURE);
 		}
 	} else {
 		i = mpr_get_fw_diag_buffer_number(sc, unique_id);
 		if (i == MPR_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 			*return_code = MPR_FW_DIAG_ERROR_INVALID_UID;
 			return (MPR_DIAG_FAILURE);
 		}
 	}
 
 	/*
 	 * Fill query structure with the diag buffer info.
 	 */
 	pBuffer = &sc->fw_diag_buffer_list[i];
 	diag_query->BufferType = pBuffer->buffer_type;
 	diag_query->ExtendedType = pBuffer->extended_type;
 	if (diag_query->BufferType == MPI2_DIAG_BUF_TYPE_TRACE) {
 		for (i = 0; i < (sizeof(diag_query->ProductSpecific) / 4);
 		    i++) {
 			diag_query->ProductSpecific[i] =
 			    pBuffer->product_specific[i];
 		}
 	}
 	diag_query->TotalBufferSize = pBuffer->size;
 	diag_query->DriverAddedBufferSize = 0;
 	diag_query->UniqueId = pBuffer->unique_id;
 	diag_query->ApplicationFlags = 0;
 	diag_query->DiagnosticFlags = 0;
 
 	/*
 	 * Set/Clear application flags
 	 */
 	if (pBuffer->immediate) {
 		diag_query->ApplicationFlags &= ~MPR_FW_DIAG_FLAG_APP_OWNED;
 	} else {
 		diag_query->ApplicationFlags |= MPR_FW_DIAG_FLAG_APP_OWNED;
 	}
 	if (pBuffer->valid_data || pBuffer->owned_by_firmware) {
 		diag_query->ApplicationFlags |= MPR_FW_DIAG_FLAG_BUFFER_VALID;
 	} else {
 		diag_query->ApplicationFlags &= ~MPR_FW_DIAG_FLAG_BUFFER_VALID;
 	}
 	if (pBuffer->owned_by_firmware) {
 		diag_query->ApplicationFlags |=
 		    MPR_FW_DIAG_FLAG_FW_BUFFER_ACCESS;
 	} else {
 		diag_query->ApplicationFlags &=
 		    ~MPR_FW_DIAG_FLAG_FW_BUFFER_ACCESS;
 	}
 
 	return (MPR_DIAG_SUCCESS);
 }
 
 static int
 mpr_diag_read_buffer(struct mpr_softc *sc,
     mpr_diag_read_buffer_t *diag_read_buffer, uint8_t *ioctl_buf,
     uint32_t *return_code)
 {
 	mpr_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i, *pData;
 	uint32_t			unique_id;
 	int				status;
 
 	unique_id = diag_read_buffer->UniqueId;
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should be there.
 	 */
 	i = mpr_get_fw_diag_buffer_number(sc, unique_id);
 	if (i == MPR_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPR_FW_DIAG_ERROR_INVALID_UID;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	pBuffer = &sc->fw_diag_buffer_list[i];
 
 	/*
 	 * Make sure requested read is within limits
 	 */
 	if (diag_read_buffer->StartingOffset + diag_read_buffer->BytesToRead >
 	    pBuffer->size) {
 		*return_code = MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/* Sync the DMA map before we copy to userland. */
 	bus_dmamap_sync(sc->fw_diag_dmat, sc->fw_diag_map,
 	    BUS_DMASYNC_POSTREAD);
 
 	/*
 	 * Copy the requested data from DMA to the diag_read_buffer.  The DMA
 	 * buffer that was allocated is one contiguous buffer.
 	 */
 	pData = (uint8_t *)(sc->fw_diag_buffer +
 	    diag_read_buffer->StartingOffset);
 	if (copyout(pData, ioctl_buf, diag_read_buffer->BytesToRead) != 0)
 		return (MPR_DIAG_FAILURE);
 	diag_read_buffer->Status = 0;
 
 	/*
 	 * Set or clear the Force Release flag.
 	 */
 	if (pBuffer->force_release) {
 		diag_read_buffer->Flags |= MPR_FW_DIAG_FLAG_FORCE_RELEASE;
 	} else {
 		diag_read_buffer->Flags &= ~MPR_FW_DIAG_FLAG_FORCE_RELEASE;
 	}
 
 	/*
 	 * If buffer is to be reregistered, make sure it's not already owned by
 	 * firmware first.
 	 */
 	status = MPR_DIAG_SUCCESS;
 	if (!pBuffer->owned_by_firmware) {
 		if (diag_read_buffer->Flags & MPR_FW_DIAG_FLAG_REREGISTER) {
 			status = mpr_post_fw_diag_buffer(sc, pBuffer,
 			    return_code);
 		}
 	}
 
 	return (status);
 }
 
 static int
 mpr_diag_release(struct mpr_softc *sc, mpr_fw_diag_release_t *diag_release,
     uint32_t *return_code)
 {
 	mpr_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i;
 	uint32_t			unique_id;
 	int				status;
 
 	unique_id = diag_release->UniqueId;
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should be there.
 	 */
 	i = mpr_get_fw_diag_buffer_number(sc, unique_id);
 	if (i == MPR_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPR_FW_DIAG_ERROR_INVALID_UID;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	pBuffer = &sc->fw_diag_buffer_list[i];
 
 	/*
 	 * If buffer is not owned by firmware, it's already been released.
 	 */
 	if (!pBuffer->owned_by_firmware) {
 		*return_code = MPR_FW_DIAG_ERROR_ALREADY_RELEASED;
 		return (MPR_DIAG_FAILURE);
 	}
 
 	/*
 	 * Release the buffer.
 	 */
 	status = mpr_release_fw_diag_buffer(sc, pBuffer, return_code,
 	    MPR_FW_DIAG_TYPE_RELEASE);
 	return (status);
 }
 
 static int
 mpr_do_diag_action(struct mpr_softc *sc, uint32_t action, uint8_t *diag_action,
     uint32_t length, uint32_t *return_code)
 {
 	mpr_fw_diag_register_t		diag_register;
 	mpr_fw_diag_unregister_t	diag_unregister;
 	mpr_fw_diag_query_t		diag_query;
 	mpr_diag_read_buffer_t		diag_read_buffer;
 	mpr_fw_diag_release_t		diag_release;
 	int				status = MPR_DIAG_SUCCESS;
 	uint32_t			original_return_code;
 
 	original_return_code = *return_code;
 	*return_code = MPR_FW_DIAG_ERROR_SUCCESS;
 
 	switch (action) {
 		case MPR_FW_DIAG_TYPE_REGISTER:
 			if (!length) {
 				*return_code =
 				    MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPR_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_register,
 			    sizeof(diag_register)) != 0)
 				return (MPR_DIAG_FAILURE);
 			status = mpr_diag_register(sc, &diag_register,
 			    return_code);
 			break;
 
 		case MPR_FW_DIAG_TYPE_UNREGISTER:
 			if (length < sizeof(diag_unregister)) {
 				*return_code =
 				    MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPR_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_unregister,
 			    sizeof(diag_unregister)) != 0)
 				return (MPR_DIAG_FAILURE);
 			status = mpr_diag_unregister(sc, &diag_unregister,
 			    return_code);
 			break;
 
 		case MPR_FW_DIAG_TYPE_QUERY:
 			if (length < sizeof (diag_query)) {
 				*return_code =
 				    MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPR_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_query, sizeof(diag_query))
 			    != 0)
 				return (MPR_DIAG_FAILURE);
 			status = mpr_diag_query(sc, &diag_query, return_code);
 			if (status == MPR_DIAG_SUCCESS)
 				if (copyout(&diag_query, diag_action,
 				    sizeof (diag_query)) != 0)
 					return (MPR_DIAG_FAILURE);
 			break;
 
 		case MPR_FW_DIAG_TYPE_READ_BUFFER:
 			if (copyin(diag_action, &diag_read_buffer,
 			    sizeof(diag_read_buffer)) != 0)
 				return (MPR_DIAG_FAILURE);
 			if (length < diag_read_buffer.BytesToRead) {
 				*return_code =
 				    MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPR_DIAG_FAILURE;
 				break;
 			}
 			status = mpr_diag_read_buffer(sc, &diag_read_buffer,
 			    PTRIN(diag_read_buffer.PtrDataBuffer),
 			    return_code);
 			if (status == MPR_DIAG_SUCCESS) {
 				if (copyout(&diag_read_buffer, diag_action,
 				    sizeof(diag_read_buffer) -
 				    sizeof(diag_read_buffer.PtrDataBuffer)) !=
 				    0)
 					return (MPR_DIAG_FAILURE);
 			}
 			break;
 
 		case MPR_FW_DIAG_TYPE_RELEASE:
 			if (length < sizeof(diag_release)) {
 				*return_code =
 				    MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPR_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_release,
 			    sizeof(diag_release)) != 0)
 				return (MPR_DIAG_FAILURE);
 			status = mpr_diag_release(sc, &diag_release,
 			    return_code);
 			break;
 
 		default:
 			*return_code = MPR_FW_DIAG_ERROR_INVALID_PARAMETER;
 			status = MPR_DIAG_FAILURE;
 			break;
 	}
 
 	if ((status == MPR_DIAG_FAILURE) &&
 	    (original_return_code == MPR_FW_DIAG_NEW) &&
 	    (*return_code != MPR_FW_DIAG_ERROR_SUCCESS))
 		status = MPR_DIAG_SUCCESS;
 
 	return (status);
 }
 
 static int
 mpr_user_diag_action(struct mpr_softc *sc, mpr_diag_action_t *data)
 {
 	int			status;
 
 	/*
 	 * Only allow one diag action at one time.
 	 */
 	if (sc->mpr_flags & MPR_FLAGS_BUSY) {
 		mpr_dprint(sc, MPR_USER, "%s: Only one FW diag command "
 		    "allowed at a single time.", __func__);
 		return (EBUSY);
 	}
 	sc->mpr_flags |= MPR_FLAGS_BUSY;
 
 	/*
 	 * Send diag action request
 	 */
 	if (data->Action == MPR_FW_DIAG_TYPE_REGISTER ||
 	    data->Action == MPR_FW_DIAG_TYPE_UNREGISTER ||
 	    data->Action == MPR_FW_DIAG_TYPE_QUERY ||
 	    data->Action == MPR_FW_DIAG_TYPE_READ_BUFFER ||
 	    data->Action == MPR_FW_DIAG_TYPE_RELEASE) {
 		status = mpr_do_diag_action(sc, data->Action,
 		    PTRIN(data->PtrDiagAction), data->Length,
 		    &data->ReturnCode);
 	} else
 		status = EINVAL;
 
 	sc->mpr_flags &= ~MPR_FLAGS_BUSY;
 	return (status);
 }
 
 /*
  * Copy the event recording mask and the event queue size out.  For
  * clarification, the event recording mask (events_to_record) is not the same
  * thing as the event mask (event_mask).  events_to_record has a bit set for
  * every event type that is to be recorded by the driver, and event_mask has a
  * bit cleared for every event that is allowed into the driver from the IOC.
  * They really have nothing to do with each other.
  */
 static void
 mpr_user_event_query(struct mpr_softc *sc, mpr_event_query_t *data)
 {
 	uint8_t	i;
 
 	mpr_lock(sc);
 	data->Entries = MPR_EVENT_QUEUE_SIZE;
 
 	for (i = 0; i < 4; i++) {
 		data->Types[i] = sc->events_to_record[i];
 	}
 	mpr_unlock(sc);
 }
 
 /*
  * Set the driver's event mask according to what's been given.  See
  * mpr_user_event_query for explanation of the event recording mask and the IOC
  * event mask.  It's the app's responsibility to enable event logging by setting
  * the bits in events_to_record.  Initially, no events will be logged.
  */
 static void
 mpr_user_event_enable(struct mpr_softc *sc, mpr_event_enable_t *data)
 {
 	uint8_t	i;
 
 	mpr_lock(sc);
 	for (i = 0; i < 4; i++) {
 		sc->events_to_record[i] = data->Types[i];
 	}
 	mpr_unlock(sc);
 }
 
 /*
  * Copy out the events that have been recorded, up to the max events allowed.
  */
 static int
 mpr_user_event_report(struct mpr_softc *sc, mpr_event_report_t *data)
 {
 	int		status = 0;
 	uint32_t	size;
 
 	mpr_lock(sc);
 	size = data->Size;
 	if ((size >= sizeof(sc->recorded_events)) && (status == 0)) {
 		mpr_unlock(sc);
 		if (copyout((void *)sc->recorded_events,
 		    PTRIN(data->PtrEvents), size) != 0)
 			status = EFAULT;
 		mpr_lock(sc);
 	} else {
 		/*
 		 * data->Size value is not large enough to copy event data.
 		 */
 		status = EFAULT;
 	}
 
 	/*
 	 * Change size value to match the number of bytes that were copied.
 	 */
 	if (status == 0)
 		data->Size = sizeof(sc->recorded_events);
 	mpr_unlock(sc);
 
 	return (status);
 }
 
 /*
  * Record events into the driver from the IOC if they are not masked.
  */
 void
 mprsas_record_event(struct mpr_softc *sc,
     MPI2_EVENT_NOTIFICATION_REPLY *event_reply)
 {
 	uint32_t	event;
 	int		i, j;
 	uint16_t	event_data_len;
 	boolean_t	sendAEN = FALSE;
 
 	event = event_reply->Event;
 
 	/*
 	 * Generate a system event to let anyone who cares know that a
 	 * LOG_ENTRY_ADDED event has occurred.  This is sent no matter what the
 	 * event mask is set to.
 	 */
 	if (event == MPI2_EVENT_LOG_ENTRY_ADDED) {
 		sendAEN = TRUE;
 	}
 
 	/*
 	 * Record the event only if its corresponding bit is set in
 	 * events_to_record.  event_index is the index into recorded_events and
 	 * event_number is the overall number of an event being recorded since
 	 * start-of-day.  event_index will roll over; event_number will never
 	 * roll over.
 	 */
 	i = (uint8_t)(event / 32);
 	j = (uint8_t)(event % 32);
 	if ((i < 4) && ((1 << j) & sc->events_to_record[i])) {
 		i = sc->event_index;
 		sc->recorded_events[i].Type = event;
 		sc->recorded_events[i].Number = ++sc->event_number;
 		bzero(sc->recorded_events[i].Data, MPR_MAX_EVENT_DATA_LENGTH *
 		    4);
 		event_data_len = event_reply->EventDataLength;
 
 		if (event_data_len > 0) {
 			/*
 			 * Limit data to size in m_event entry
 			 */
 			if (event_data_len > MPR_MAX_EVENT_DATA_LENGTH) {
 				event_data_len = MPR_MAX_EVENT_DATA_LENGTH;
 			}
 			for (j = 0; j < event_data_len; j++) {
 				sc->recorded_events[i].Data[j] =
 				    event_reply->EventData[j];
 			}
 
 			/*
 			 * check for index wrap-around
 			 */
 			if (++i == MPR_EVENT_QUEUE_SIZE) {
 				i = 0;
 			}
 			sc->event_index = (uint8_t)i;
 
 			/*
 			 * Set flag to send the event.
 			 */
 			sendAEN = TRUE;
 		}
 	}
 
 	/*
 	 * Generate a system event if flag is set to let anyone who cares know
 	 * that an event has occurred.
 	 */
 	if (sendAEN) {
 //SLM-how to send a system event (see kqueue, kevent)
 //		(void) ddi_log_sysevent(mpt->m_dip, DDI_VENDOR_LSI, "MPT_SAS",
 //		    "SAS", NULL, NULL, DDI_NOSLEEP);
 	}
 }
 
 static int
 mpr_user_reg_access(struct mpr_softc *sc, mpr_reg_access_t *data)
 {
 	int	status = 0;
 
 	switch (data->Command) {
 		/*
 		 * IO access is not supported.
 		 */
 		case REG_IO_READ:
 		case REG_IO_WRITE:
 			mpr_dprint(sc, MPR_USER, "IO access is not supported. "
 			    "Use memory access.");
 			status = EINVAL;
 			break;
 
 		case REG_MEM_READ:
 			data->RegData = mpr_regread(sc, data->RegOffset);
 			break;
 
 		case REG_MEM_WRITE:
 			mpr_regwrite(sc, data->RegOffset, data->RegData);
 			break;
 
 		default:
 			status = EINVAL;
 			break;
 	}
 
 	return (status);
 }
 
 static int
 mpr_user_btdh(struct mpr_softc *sc, mpr_btdh_mapping_t *data)
 {
 	uint8_t		bt2dh = FALSE;
 	uint8_t		dh2bt = FALSE;
 	uint16_t	dev_handle, bus, target;
 
 	bus = data->Bus;
 	target = data->TargetID;
 	dev_handle = data->DevHandle;
 
 	/*
 	 * When DevHandle is 0xFFFF and Bus/Target are not 0xFFFF, use Bus/
 	 * Target to get DevHandle.  When Bus/Target are 0xFFFF and DevHandle is
 	 * not 0xFFFF, use DevHandle to get Bus/Target.  Anything else is
 	 * invalid.
 	 */
 	if ((bus == 0xFFFF) && (target == 0xFFFF) && (dev_handle != 0xFFFF))
 		dh2bt = TRUE;
 	if ((dev_handle == 0xFFFF) && (bus != 0xFFFF) && (target != 0xFFFF))
 		bt2dh = TRUE;
 	if (!dh2bt && !bt2dh)
 		return (EINVAL);
 
 	/*
 	 * Only handle bus of 0.  Make sure target is within range.
 	 */
 	if (bt2dh) {
 		if (bus != 0)
 			return (EINVAL);
 
 		if (target > sc->max_devices) {
 			mpr_dprint(sc, MPR_XINFO, "Target ID is out of range "
 			   "for Bus/Target to DevHandle mapping.");
 			return (EINVAL);
 		}
 		dev_handle = sc->mapping_table[target].dev_handle;
 		if (dev_handle)
 			data->DevHandle = dev_handle;
 	} else {
 		bus = 0;
 		target = mpr_mapping_get_tid_from_handle(sc, dev_handle);
 		data->Bus = bus;
 		data->TargetID = target;
 	}
 
 	return (0);
 }
 
 static int
 mpr_ioctl(struct cdev *dev, u_long cmd, void *arg, int flag,
     struct thread *td)
 {
 	struct mpr_softc *sc;
 	struct mpr_cfg_page_req *page_req;
 	struct mpr_ext_cfg_page_req *ext_page_req;
 	void *mpr_page;
 	int error, msleep_ret;
 
 	mpr_page = NULL;
 	sc = dev->si_drv1;
 	page_req = (void *)arg;
 	ext_page_req = (void *)arg;
 
 	switch (cmd) {
 	case MPRIO_READ_CFG_HEADER:
 		mpr_lock(sc);
 		error = mpr_user_read_cfg_header(sc, page_req);
 		mpr_unlock(sc);
 		break;
 	case MPRIO_READ_CFG_PAGE:
 		mpr_page = malloc(page_req->len, M_MPRUSER, M_WAITOK | M_ZERO);
 		error = copyin(page_req->buf, mpr_page,
 		    sizeof(MPI2_CONFIG_PAGE_HEADER));
 		if (error)
 			break;
 		mpr_lock(sc);
 		error = mpr_user_read_cfg_page(sc, page_req, mpr_page);
 		mpr_unlock(sc);
 		if (error)
 			break;
 		error = copyout(mpr_page, page_req->buf, page_req->len);
 		break;
 	case MPRIO_READ_EXT_CFG_HEADER:
 		mpr_lock(sc);
 		error = mpr_user_read_extcfg_header(sc, ext_page_req);
 		mpr_unlock(sc);
 		break;
 	case MPRIO_READ_EXT_CFG_PAGE:
 		mpr_page = malloc(ext_page_req->len, M_MPRUSER,
 		    M_WAITOK | M_ZERO);
 		error = copyin(ext_page_req->buf, mpr_page,
 		    sizeof(MPI2_CONFIG_EXTENDED_PAGE_HEADER));
 		if (error)
 			break;
 		mpr_lock(sc);
 		error = mpr_user_read_extcfg_page(sc, ext_page_req, mpr_page);
 		mpr_unlock(sc);
 		if (error)
 			break;
 		error = copyout(mpr_page, ext_page_req->buf, ext_page_req->len);
 		break;
 	case MPRIO_WRITE_CFG_PAGE:
 		mpr_page = malloc(page_req->len, M_MPRUSER, M_WAITOK|M_ZERO);
 		error = copyin(page_req->buf, mpr_page, page_req->len);
 		if (error)
 			break;
 		mpr_lock(sc);
 		error = mpr_user_write_cfg_page(sc, page_req, mpr_page);
 		mpr_unlock(sc);
 		break;
 	case MPRIO_MPR_COMMAND:
 		error = mpr_user_command(sc, (struct mpr_usr_command *)arg);
 		break;
 	case MPTIOCTL_PASS_THRU:
 		/*
 		 * The user has requested to pass through a command to be
 		 * executed by the MPT firmware.  Call our routine which does
 		 * this.  Only allow one passthru IOCTL at one time.
 		 */
 		error = mpr_user_pass_thru(sc, (mpr_pass_thru_t *)arg);
 		break;
 	case MPTIOCTL_GET_ADAPTER_DATA:
 		/*
 		 * The user has requested to read adapter data.  Call our
 		 * routine which does this.
 		 */
 		error = 0;
 		mpr_user_get_adapter_data(sc, (mpr_adapter_data_t *)arg);
 		break;
 	case MPTIOCTL_GET_PCI_INFO:
 		/*
 		 * The user has requested to read pci info.  Call
 		 * our routine which does this.
 		 */
 		mpr_lock(sc);
 		error = 0;
 		mpr_user_read_pci_info(sc, (mpr_pci_info_t *)arg);
 		mpr_unlock(sc);
 		break;
 	case MPTIOCTL_RESET_ADAPTER:
 		mpr_lock(sc);
 		sc->port_enable_complete = 0;
 		uint32_t reinit_start = time_uptime;
 		error = mpr_reinit(sc);
 		/* Sleep for 300 second. */
 		msleep_ret = msleep(&sc->port_enable_complete, &sc->mpr_mtx,
 		    PRIBIO, "mpr_porten", 300 * hz);
 		mpr_unlock(sc);
 		if (msleep_ret)
 			printf("Port Enable did not complete after Diag "
 			    "Reset msleep error %d.\n", msleep_ret);
 		else
 			mpr_dprint(sc, MPR_USER, "Hard Reset with Port Enable "
 			    "completed in %d seconds.\n",
 			    (uint32_t)(time_uptime - reinit_start));
 		break;
 	case MPTIOCTL_DIAG_ACTION:
 		/*
 		 * The user has done a diag buffer action.  Call our routine
 		 * which does this.  Only allow one diag action at one time.
 		 */
 		mpr_lock(sc);
 		error = mpr_user_diag_action(sc, (mpr_diag_action_t *)arg);
 		mpr_unlock(sc);
 		break;
 	case MPTIOCTL_EVENT_QUERY:
 		/*
 		 * The user has done an event query. Call our routine which does
 		 * this.
 		 */
 		error = 0;
 		mpr_user_event_query(sc, (mpr_event_query_t *)arg);
 		break;
 	case MPTIOCTL_EVENT_ENABLE:
 		/*
 		 * The user has done an event enable. Call our routine which
 		 * does this.
 		 */
 		error = 0;
 		mpr_user_event_enable(sc, (mpr_event_enable_t *)arg);
 		break;
 	case MPTIOCTL_EVENT_REPORT:
 		/*
 		 * The user has done an event report. Call our routine which
 		 * does this.
 		 */
 		error = mpr_user_event_report(sc, (mpr_event_report_t *)arg);
 		break;
 	case MPTIOCTL_REG_ACCESS:
 		/*
 		 * The user has requested register access.  Call our routine
 		 * which does this.
 		 */
 		mpr_lock(sc);
 		error = mpr_user_reg_access(sc, (mpr_reg_access_t *)arg);
 		mpr_unlock(sc);
 		break;
 	case MPTIOCTL_BTDH_MAPPING:
 		/*
 		 * The user has requested to translate a bus/target to a
 		 * DevHandle or a DevHandle to a bus/target.  Call our routine
 		 * which does this.
 		 */
 		error = mpr_user_btdh(sc, (mpr_btdh_mapping_t *)arg);
 		break;
 	default:
 		error = ENOIOCTL;
 		break;
 	}
 
 	if (mpr_page != NULL)
 		free(mpr_page, M_MPRUSER);
 
 	return (error);
 }
 
 #ifdef COMPAT_FREEBSD32
 
 struct mpr_cfg_page_req32 {
 	MPI2_CONFIG_PAGE_HEADER header;
 	uint32_t page_address;
 	uint32_t buf;
 	int	len;	
 	uint16_t ioc_status;
 };
 
 struct mpr_ext_cfg_page_req32 {
 	MPI2_CONFIG_EXTENDED_PAGE_HEADER header;
 	uint32_t page_address;
 	uint32_t buf;
 	int	len;
 	uint16_t ioc_status;
 };
 
 struct mpr_raid_action32 {
 	uint8_t action;
 	uint8_t volume_bus;
 	uint8_t volume_id;
 	uint8_t phys_disk_num;
 	uint32_t action_data_word;
 	uint32_t buf;
 	int len;
 	uint32_t volume_status;
 	uint32_t action_data[4];
 	uint16_t action_status;
 	uint16_t ioc_status;
 	uint8_t write;
 };
 
 struct mpr_usr_command32 {
 	uint32_t req;
 	uint32_t req_len;
 	uint32_t rpl;
 	uint32_t rpl_len;
 	uint32_t buf;
 	int len;
 	uint32_t flags;
 };
 
 #define	MPRIO_READ_CFG_HEADER32	_IOWR('M', 200, struct mpr_cfg_page_req32)
 #define	MPRIO_READ_CFG_PAGE32	_IOWR('M', 201, struct mpr_cfg_page_req32)
 #define	MPRIO_READ_EXT_CFG_HEADER32 _IOWR('M', 202, struct mpr_ext_cfg_page_req32)
 #define	MPRIO_READ_EXT_CFG_PAGE32 _IOWR('M', 203, struct mpr_ext_cfg_page_req32)
 #define	MPRIO_WRITE_CFG_PAGE32	_IOWR('M', 204, struct mpr_cfg_page_req32)
 #define	MPRIO_RAID_ACTION32	_IOWR('M', 205, struct mpr_raid_action32)
 #define	MPRIO_MPR_COMMAND32	_IOWR('M', 210, struct mpr_usr_command32)
 
 static int
 mpr_ioctl32(struct cdev *dev, u_long cmd32, void *_arg, int flag,
     struct thread *td)
 {
 	struct mpr_cfg_page_req32 *page32 = _arg;
 	struct mpr_ext_cfg_page_req32 *ext32 = _arg;
 	struct mpr_raid_action32 *raid32 = _arg;
 	struct mpr_usr_command32 *user32 = _arg;
 	union {
 		struct mpr_cfg_page_req page;
 		struct mpr_ext_cfg_page_req ext;
 		struct mpr_raid_action raid;
 		struct mpr_usr_command user;
 	} arg;
 	u_long cmd;
 	int error;
 
 	switch (cmd32) {
 	case MPRIO_READ_CFG_HEADER32:
 	case MPRIO_READ_CFG_PAGE32:
 	case MPRIO_WRITE_CFG_PAGE32:
 		if (cmd32 == MPRIO_READ_CFG_HEADER32)
 			cmd = MPRIO_READ_CFG_HEADER;
 		else if (cmd32 == MPRIO_READ_CFG_PAGE32)
 			cmd = MPRIO_READ_CFG_PAGE;
 		else
 			cmd = MPRIO_WRITE_CFG_PAGE;
 		CP(*page32, arg.page, header);
 		CP(*page32, arg.page, page_address);
 		PTRIN_CP(*page32, arg.page, buf);
 		CP(*page32, arg.page, len);
 		CP(*page32, arg.page, ioc_status);
 		break;
 
 	case MPRIO_READ_EXT_CFG_HEADER32:
 	case MPRIO_READ_EXT_CFG_PAGE32:
 		if (cmd32 == MPRIO_READ_EXT_CFG_HEADER32)
 			cmd = MPRIO_READ_EXT_CFG_HEADER;
 		else
 			cmd = MPRIO_READ_EXT_CFG_PAGE;
 		CP(*ext32, arg.ext, header);
 		CP(*ext32, arg.ext, page_address);
 		PTRIN_CP(*ext32, arg.ext, buf);
 		CP(*ext32, arg.ext, len);
 		CP(*ext32, arg.ext, ioc_status);
 		break;
 
 	case MPRIO_RAID_ACTION32:
 		cmd = MPRIO_RAID_ACTION;
 		CP(*raid32, arg.raid, action);
 		CP(*raid32, arg.raid, volume_bus);
 		CP(*raid32, arg.raid, volume_id);
 		CP(*raid32, arg.raid, phys_disk_num);
 		CP(*raid32, arg.raid, action_data_word);
 		PTRIN_CP(*raid32, arg.raid, buf);
 		CP(*raid32, arg.raid, len);
 		CP(*raid32, arg.raid, volume_status);
 		bcopy(raid32->action_data, arg.raid.action_data,
 		    sizeof arg.raid.action_data);
 		CP(*raid32, arg.raid, ioc_status);
 		CP(*raid32, arg.raid, write);
 		break;
 
 	case MPRIO_MPR_COMMAND32:
 		cmd = MPRIO_MPR_COMMAND;
 		PTRIN_CP(*user32, arg.user, req);
 		CP(*user32, arg.user, req_len);
 		PTRIN_CP(*user32, arg.user, rpl);
 		CP(*user32, arg.user, rpl_len);
 		PTRIN_CP(*user32, arg.user, buf);
 		CP(*user32, arg.user, len);
 		CP(*user32, arg.user, flags);
 		break;
 	default:
 		return (ENOIOCTL);
 	}
 
 	error = mpr_ioctl(dev, cmd, &arg, flag, td);
 	if (error == 0 && (cmd32 & IOC_OUT) != 0) {
 		switch (cmd32) {
 		case MPRIO_READ_CFG_HEADER32:
 		case MPRIO_READ_CFG_PAGE32:
 		case MPRIO_WRITE_CFG_PAGE32:
 			CP(arg.page, *page32, header);
 			CP(arg.page, *page32, page_address);
 			PTROUT_CP(arg.page, *page32, buf);
 			CP(arg.page, *page32, len);
 			CP(arg.page, *page32, ioc_status);
 			break;
 
 		case MPRIO_READ_EXT_CFG_HEADER32:
 		case MPRIO_READ_EXT_CFG_PAGE32:
 			CP(arg.ext, *ext32, header);
 			CP(arg.ext, *ext32, page_address);
 			PTROUT_CP(arg.ext, *ext32, buf);
 			CP(arg.ext, *ext32, len);
 			CP(arg.ext, *ext32, ioc_status);
 			break;
 
 		case MPRIO_RAID_ACTION32:
 			CP(arg.raid, *raid32, action);
 			CP(arg.raid, *raid32, volume_bus);
 			CP(arg.raid, *raid32, volume_id);
 			CP(arg.raid, *raid32, phys_disk_num);
 			CP(arg.raid, *raid32, action_data_word);
 			PTROUT_CP(arg.raid, *raid32, buf);
 			CP(arg.raid, *raid32, len);
 			CP(arg.raid, *raid32, volume_status);
 			bcopy(arg.raid.action_data, raid32->action_data,
 			    sizeof arg.raid.action_data);
 			CP(arg.raid, *raid32, ioc_status);
 			CP(arg.raid, *raid32, write);
 			break;
 
 		case MPRIO_MPR_COMMAND32:
 			PTROUT_CP(arg.user, *user32, req);
 			CP(arg.user, *user32, req_len);
 			PTROUT_CP(arg.user, *user32, rpl);
 			CP(arg.user, *user32, rpl_len);
 			PTROUT_CP(arg.user, *user32, buf);
 			CP(arg.user, *user32, len);
 			CP(arg.user, *user32, flags);
 			break;
 		}
 	}
 
 	return (error);
 }
 #endif /* COMPAT_FREEBSD32 */
 
 static int
 mpr_ioctl_devsw(struct cdev *dev, u_long com, caddr_t arg, int flag,
     struct thread *td)
 {
 #ifdef COMPAT_FREEBSD32
 	if (SV_CURPROC_FLAG(SV_ILP32))
 		return (mpr_ioctl32(dev, com, arg, flag, td));
 #endif
 	return (mpr_ioctl(dev, com, arg, flag, td));
 }
Index: head/sys/dev/mps/mps.c
===================================================================
--- head/sys/dev/mps/mps.c	(revision 365705)
+++ head/sys/dev/mps/mps.c	(revision 365706)
@@ -1,3240 +1,3235 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 2009 Yahoo! Inc.
  * Copyright (c) 2011-2015 LSI Corp.
  * Copyright (c) 2013-2015 Avago Technologies
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * Avago Technologies (LSI) MPT-Fusion Host Adapter FreeBSD
  *
  * $FreeBSD$
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 /* Communications core for Avago Technologies (LSI) MPT2 */
 
 /* TODO Move headers to mpsvar */
 #include <sys/types.h>
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/selinfo.h>
 #include <sys/lock.h>
 #include <sys/mutex.h>
 #include <sys/module.h>
 #include <sys/bus.h>
 #include <sys/conf.h>
 #include <sys/bio.h>
 #include <sys/malloc.h>
 #include <sys/uio.h>
 #include <sys/sysctl.h>
 #include <sys/smp.h>
 #include <sys/queue.h>
 #include <sys/kthread.h>
 #include <sys/taskqueue.h>
 #include <sys/endian.h>
 #include <sys/eventhandler.h>
 #include <sys/sbuf.h>
 #include <sys/priv.h>
 
 #include <machine/bus.h>
 #include <machine/resource.h>
 #include <sys/rman.h>
 #include <sys/proc.h>
 
 #include <dev/pci/pcivar.h>
 
 #include <cam/cam.h>
 #include <cam/scsi/scsi_all.h>
 
 #include <dev/mps/mpi/mpi2_type.h>
 #include <dev/mps/mpi/mpi2.h>
 #include <dev/mps/mpi/mpi2_ioc.h>
 #include <dev/mps/mpi/mpi2_sas.h>
 #include <dev/mps/mpi/mpi2_cnfg.h>
 #include <dev/mps/mpi/mpi2_init.h>
 #include <dev/mps/mpi/mpi2_tool.h>
 #include <dev/mps/mps_ioctl.h>
 #include <dev/mps/mpsvar.h>
 #include <dev/mps/mps_table.h>
 
 static int mps_diag_reset(struct mps_softc *sc, int sleep_flag);
 static int mps_init_queues(struct mps_softc *sc);
 static void mps_resize_queues(struct mps_softc *sc);
 static int mps_message_unit_reset(struct mps_softc *sc, int sleep_flag);
 static int mps_transition_operational(struct mps_softc *sc);
 static int mps_iocfacts_allocate(struct mps_softc *sc, uint8_t attaching);
 static void mps_iocfacts_free(struct mps_softc *sc);
 static void mps_startup(void *arg);
 static int mps_send_iocinit(struct mps_softc *sc);
 static int mps_alloc_queues(struct mps_softc *sc);
 static int mps_alloc_hw_queues(struct mps_softc *sc);
 static int mps_alloc_replies(struct mps_softc *sc);
 static int mps_alloc_requests(struct mps_softc *sc);
 static int mps_attach_log(struct mps_softc *sc);
 static __inline void mps_complete_command(struct mps_softc *sc,
     struct mps_command *cm);
 static void mps_dispatch_event(struct mps_softc *sc, uintptr_t data,
     MPI2_EVENT_NOTIFICATION_REPLY *reply);
 static void mps_config_complete(struct mps_softc *sc, struct mps_command *cm);
 static void mps_periodic(void *);
 static int mps_reregister_events(struct mps_softc *sc);
 static void mps_enqueue_request(struct mps_softc *sc, struct mps_command *cm);
 static int mps_get_iocfacts(struct mps_softc *sc, MPI2_IOC_FACTS_REPLY *facts);
 static int mps_wait_db_ack(struct mps_softc *sc, int timeout, int sleep_flag);
 static int mps_debug_sysctl(SYSCTL_HANDLER_ARGS);
 static int mps_dump_reqs(SYSCTL_HANDLER_ARGS);
 static void mps_parse_debug(struct mps_softc *sc, char *list);
 
 SYSCTL_NODE(_hw, OID_AUTO, mps, CTLFLAG_RD | CTLFLAG_MPSAFE, 0,
     "MPS Driver Parameters");
 
 MALLOC_DEFINE(M_MPT2, "mps", "mpt2 driver memory");
 MALLOC_DECLARE(M_MPSUSER);
 
 /*
  * Do a "Diagnostic Reset" aka a hard reset.  This should get the chip out of
  * any state and back to its initialization state machine.
  */
 static char mpt2_reset_magic[] = { 0x00, 0x0f, 0x04, 0x0b, 0x02, 0x07, 0x0d };
 
 /* Added this union to smoothly convert le64toh cm->cm_desc.Words.
  * Compiler only support unint64_t to be passed as argument.
  * Otherwise it will throw below error
  * "aggregate value used where an integer was expected"
  */
 
 typedef union _reply_descriptor {
         u64 word;
         struct {
                 u32 low;
                 u32 high;
         } u;
 }reply_descriptor,address_descriptor;
 
 /* Rate limit chain-fail messages to 1 per minute */
 static struct timeval mps_chainfail_interval = { 60, 0 };
 
 /* 
  * sleep_flag can be either CAN_SLEEP or NO_SLEEP.
  * If this function is called from process context, it can sleep
  * and there is no harm to sleep, in case if this fuction is called
  * from Interrupt handler, we can not sleep and need NO_SLEEP flag set.
  * based on sleep flags driver will call either msleep, pause or DELAY.
  * msleep and pause are of same variant, but pause is used when mps_mtx
  * is not hold by driver.
  *
  */
 static int
 mps_diag_reset(struct mps_softc *sc,int sleep_flag)
 {
 	uint32_t reg;
 	int i, error, tries = 0;
 	uint8_t first_wait_done = FALSE;
 
 	mps_dprint(sc, MPS_INIT, "%s entered\n", __func__);
 
 	/* Clear any pending interrupts */
 	mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	/*
 	 * Force NO_SLEEP for threads prohibited to sleep
  	 * e.a Thread from interrupt handler are prohibited to sleep.
  	 */
 	if (curthread->td_no_sleeping != 0)
 		sleep_flag = NO_SLEEP;
 
 	mps_dprint(sc, MPS_INIT, "sequence start, sleep_flag= %d\n", sleep_flag);
 
 	/* Push the magic sequence */
 	error = ETIMEDOUT;
 	while (tries++ < 20) {
 		for (i = 0; i < sizeof(mpt2_reset_magic); i++)
 			mps_regwrite(sc, MPI2_WRITE_SEQUENCE_OFFSET,
 			    mpt2_reset_magic[i]);
 		/* wait 100 msec */
 		if (mtx_owned(&sc->mps_mtx) && sleep_flag == CAN_SLEEP)
 			msleep(&sc->msleep_fake_chan, &sc->mps_mtx, 0,
 			    "mpsdiag", hz/10);
 		else if (sleep_flag == CAN_SLEEP)
 			pause("mpsdiag", hz/10);
 		else
 			DELAY(100 * 1000);
 
 		reg = mps_regread(sc, MPI2_HOST_DIAGNOSTIC_OFFSET);
 		if (reg & MPI2_DIAG_DIAG_WRITE_ENABLE) {
 			error = 0;
 			break;
 		}
 	}
 	if (error) {
 		mps_dprint(sc, MPS_INIT, "sequence failed, error=%d, exit\n",
 		    error);
 		return (error);
 	}
 
 	/* Send the actual reset.  XXX need to refresh the reg? */
 	reg |= MPI2_DIAG_RESET_ADAPTER;
 	mps_dprint(sc, MPS_INIT, "sequence success, sending reset, reg= 0x%x\n",
 		reg);
 	mps_regwrite(sc, MPI2_HOST_DIAGNOSTIC_OFFSET, reg);
 
 	/* Wait up to 300 seconds in 50ms intervals */
 	error = ETIMEDOUT;
 	for (i = 0; i < 6000; i++) {
 		/*
 		 * Wait 50 msec. If this is the first time through, wait 256
 		 * msec to satisfy Diag Reset timing requirements.
 		 */
 		if (first_wait_done) {
 			if (mtx_owned(&sc->mps_mtx) && sleep_flag == CAN_SLEEP)
 				msleep(&sc->msleep_fake_chan, &sc->mps_mtx, 0,
 				    "mpsdiag", hz/20);
 			else if (sleep_flag == CAN_SLEEP)
 				pause("mpsdiag", hz/20);
 			else
 				DELAY(50 * 1000);
 		} else {
 			DELAY(256 * 1000);
 			first_wait_done = TRUE;
 		}
 		/*
 		 * Check for the RESET_ADAPTER bit to be cleared first, then
 		 * wait for the RESET state to be cleared, which takes a little
 		 * longer.
 		 */
 		reg = mps_regread(sc, MPI2_HOST_DIAGNOSTIC_OFFSET);
 		if (reg & MPI2_DIAG_RESET_ADAPTER) {
 			continue;
 		}
 		reg = mps_regread(sc, MPI2_DOORBELL_OFFSET);
 		if ((reg & MPI2_IOC_STATE_MASK) != MPI2_IOC_STATE_RESET) {
 			error = 0;
 			break;
 		}
 	}
 	if (error) {
 		mps_dprint(sc, MPS_INIT, "reset failed, error= %d, exit\n",
 		    error);
 		return (error);
 	}
 
 	mps_regwrite(sc, MPI2_WRITE_SEQUENCE_OFFSET, 0x0);
 	mps_dprint(sc, MPS_INIT, "diag reset success, exit\n");
 
 	return (0);
 }
 
 static int
 mps_message_unit_reset(struct mps_softc *sc, int sleep_flag)
 {
 	int error;
 
 	MPS_FUNCTRACE(sc);
 
 	mps_dprint(sc, MPS_INIT, "%s entered\n", __func__);
 
 	error = 0;
 	mps_regwrite(sc, MPI2_DOORBELL_OFFSET,
 	    MPI2_FUNCTION_IOC_MESSAGE_UNIT_RESET <<
 	    MPI2_DOORBELL_FUNCTION_SHIFT);
 
 	if (mps_wait_db_ack(sc, 5, sleep_flag) != 0) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT,
 		    "Doorbell handshake failed\n");
 		error = ETIMEDOUT;
 	}
 
 	mps_dprint(sc, MPS_INIT, "%s exit\n", __func__);
 	return (error);
 }
 
 static int
 mps_transition_ready(struct mps_softc *sc)
 {
 	uint32_t reg, state;
 	int error, tries = 0;
 	int sleep_flags;
 
 	MPS_FUNCTRACE(sc);
 	/* If we are in attach call, do not sleep */
 	sleep_flags = (sc->mps_flags & MPS_FLAGS_ATTACH_DONE)
 					? CAN_SLEEP:NO_SLEEP;
 	error = 0;
 
 	mps_dprint(sc, MPS_INIT, "%s entered, sleep_flags= %d\n",
 	   __func__, sleep_flags);
 
 	while (tries++ < 1200) {
 		reg = mps_regread(sc, MPI2_DOORBELL_OFFSET);
 		mps_dprint(sc, MPS_INIT, "  Doorbell= 0x%x\n", reg);
 
 		/*
 		 * Ensure the IOC is ready to talk.  If it's not, try
 		 * resetting it.
 		 */
 		if (reg & MPI2_DOORBELL_USED) {
 			mps_dprint(sc, MPS_INIT, "  Not ready, sending diag "
 			    "reset\n");
 			mps_diag_reset(sc, sleep_flags);
 			DELAY(50000);
 			continue;
 		}
 
 		/* Is the adapter owned by another peer? */
 		if ((reg & MPI2_DOORBELL_WHO_INIT_MASK) ==
 		    (MPI2_WHOINIT_PCI_PEER << MPI2_DOORBELL_WHO_INIT_SHIFT)) {
 			mps_dprint(sc, MPS_INIT|MPS_FAULT, "IOC is under the "
 			    "control of another peer host, aborting "
 			    "initialization.\n");
 			error = ENXIO;
 			break;
 		}
 		
 		state = reg & MPI2_IOC_STATE_MASK;
 		if (state == MPI2_IOC_STATE_READY) {
 			/* Ready to go! */
 			error = 0;
 			break;
 		} else if (state == MPI2_IOC_STATE_FAULT) {
 			mps_dprint(sc, MPS_INIT|MPS_FAULT, "IOC in fault "
 			    "state 0x%x, resetting\n",
 			    state & MPI2_DOORBELL_FAULT_CODE_MASK);
 			mps_diag_reset(sc, sleep_flags);
 		} else if (state == MPI2_IOC_STATE_OPERATIONAL) {
 			/* Need to take ownership */
 			mps_message_unit_reset(sc, sleep_flags);
 		} else if (state == MPI2_IOC_STATE_RESET) {
 			/* Wait a bit, IOC might be in transition */
 			mps_dprint(sc, MPS_INIT|MPS_FAULT,
 			    "IOC in unexpected reset state\n");
 		} else {
 			mps_dprint(sc, MPS_INIT|MPS_FAULT,
 			    "IOC in unknown state 0x%x\n", state);
 			error = EINVAL;
 			break;
 		}
 
 		/* Wait 50ms for things to settle down. */
 		DELAY(50000);
 	}
 
 	if (error)
 		mps_dprint(sc, MPS_INIT|MPS_FAULT,
 		    "Cannot transition IOC to ready\n");
 	mps_dprint(sc, MPS_INIT, "%s exit\n", __func__);
 
 	return (error);
 }
 
 static int
 mps_transition_operational(struct mps_softc *sc)
 {
 	uint32_t reg, state;
 	int error;
 
 	MPS_FUNCTRACE(sc);
 
 	error = 0;
 	reg = mps_regread(sc, MPI2_DOORBELL_OFFSET);
 	mps_dprint(sc, MPS_INIT, "%s entered, Doorbell= 0x%x\n", __func__, reg);
 
 	state = reg & MPI2_IOC_STATE_MASK;
 	if (state != MPI2_IOC_STATE_READY) {
 		mps_dprint(sc, MPS_INIT, "IOC not ready\n");
 		if ((error = mps_transition_ready(sc)) != 0) {
 			mps_dprint(sc, MPS_INIT|MPS_FAULT, 
 			    "failed to transition ready, exit\n");
 			return (error);
 		}
 	}
 
 	error = mps_send_iocinit(sc);
 	mps_dprint(sc, MPS_INIT, "%s exit\n", __func__);
 
 	return (error);
 }
 
 static void
 mps_resize_queues(struct mps_softc *sc)
 {
 	u_int reqcr, prireqcr, maxio, sges_per_frame;
 
 	/*
 	 * Size the queues. Since the reply queues always need one free
 	 * entry, we'll deduct one reply message here.  The LSI documents
 	 * suggest instead to add a count to the request queue, but I think
 	 * that it's better to deduct from reply queue.
 	 */
 	prireqcr = MAX(1, sc->max_prireqframes);
 	prireqcr = MIN(prireqcr, sc->facts->HighPriorityCredit);
 
 	reqcr = MAX(2, sc->max_reqframes);
 	reqcr = MIN(reqcr, sc->facts->RequestCredit);
 
 	sc->num_reqs = prireqcr + reqcr;
 	sc->num_prireqs = prireqcr;
 	sc->num_replies = MIN(sc->max_replyframes + sc->max_evtframes,
 	    sc->facts->MaxReplyDescriptorPostQueueDepth) - 1;
 
 	/* Store the request frame size in bytes rather than as 32bit words */
 	sc->reqframesz = sc->facts->IOCRequestFrameSize * 4;
 
 	/*
 	 * Max IO Size is Page Size * the following:
 	 * ((SGEs per frame - 1 for chain element) * Max Chain Depth)
 	 * + 1 for no chain needed in last frame
 	 *
 	 * If user suggests a Max IO size to use, use the smaller of the
 	 * user's value and the calculated value as long as the user's
 	 * value is larger than 0. The user's value is in pages.
 	 */
 	sges_per_frame = sc->reqframesz / sizeof(MPI2_SGE_SIMPLE64) - 1;
 	maxio = (sges_per_frame * sc->facts->MaxChainDepth + 1) * PAGE_SIZE;
 
 	/*
 	 * If I/O size limitation requested, then use it and pass up to CAM.
 	 * If not, use MAXPHYS as an optimization hint, but report HW limit.
 	 */
 	if (sc->max_io_pages > 0) {
 		maxio = min(maxio, sc->max_io_pages * PAGE_SIZE);
 		sc->maxio = maxio;
 	} else {
 		sc->maxio = maxio;
 		maxio = min(maxio, MAXPHYS);
 	}
 
 	sc->num_chains = (maxio / PAGE_SIZE + sges_per_frame - 2) /
 	    sges_per_frame * reqcr;
 	if (sc->max_chains > 0 && sc->max_chains < sc->num_chains)
 		sc->num_chains = sc->max_chains;
 
 	/*
 	 * Figure out the number of MSIx-based queues.  If the firmware or
 	 * user has done something crazy and not allowed enough credit for
 	 * the queues to be useful then don't enable multi-queue.
 	 */
 	if (sc->facts->MaxMSIxVectors < 2)
 		sc->msi_msgs = 1;
 
 	if (sc->msi_msgs > 1) {
 		sc->msi_msgs = MIN(sc->msi_msgs, mp_ncpus);
 		sc->msi_msgs = MIN(sc->msi_msgs, sc->facts->MaxMSIxVectors);
 		if (sc->num_reqs / sc->msi_msgs < 2)
 			sc->msi_msgs = 1;
 	}
 
 	mps_dprint(sc, MPS_INIT, "Sized queues to q=%d reqs=%d replies=%d\n",
 	    sc->msi_msgs, sc->num_reqs, sc->num_replies);
 }
 
 /*
  * This is called during attach and when re-initializing due to a Diag Reset.
  * IOC Facts is used to allocate many of the structures needed by the driver.
  * If called from attach, de-allocation is not required because the driver has
  * not allocated any structures yet, but if called from a Diag Reset, previously
  * allocated structures based on IOC Facts will need to be freed and re-
  * allocated bases on the latest IOC Facts.
  */
 static int
 mps_iocfacts_allocate(struct mps_softc *sc, uint8_t attaching)
 {
 	int error;
 	Mpi2IOCFactsReply_t saved_facts;
 	uint8_t saved_mode, reallocating;
 
 	mps_dprint(sc, MPS_INIT|MPS_TRACE, "%s entered\n", __func__);
 
 	/* Save old IOC Facts and then only reallocate if Facts have changed */
 	if (!attaching) {
 		bcopy(sc->facts, &saved_facts, sizeof(MPI2_IOC_FACTS_REPLY));
 	}
 
 	/*
 	 * Get IOC Facts.  In all cases throughout this function, panic if doing
 	 * a re-initialization and only return the error if attaching so the OS
 	 * can handle it.
 	 */
 	if ((error = mps_get_iocfacts(sc, sc->facts)) != 0) {
 		if (attaching) {
 			mps_dprint(sc, MPS_INIT|MPS_FAULT, "Failed to get "
 			    "IOC Facts with error %d, exit\n", error);
 			return (error);
 		} else {
 			panic("%s failed to get IOC Facts with error %d\n",
 			    __func__, error);
 		}
 	}
 
 	MPS_DPRINT_PAGE(sc, MPS_XINFO, iocfacts, sc->facts);
 
 	snprintf(sc->fw_version, sizeof(sc->fw_version), 
 	    "%02d.%02d.%02d.%02d", 
 	    sc->facts->FWVersion.Struct.Major,
 	    sc->facts->FWVersion.Struct.Minor,
 	    sc->facts->FWVersion.Struct.Unit,
 	    sc->facts->FWVersion.Struct.Dev);
 
 	snprintf(sc->msg_version, sizeof(sc->msg_version), "%d.%d",
 	    (sc->facts->MsgVersion & MPI2_IOCFACTS_MSGVERSION_MAJOR_MASK) >>
 	    MPI2_IOCFACTS_MSGVERSION_MAJOR_SHIFT, 
 	    (sc->facts->MsgVersion & MPI2_IOCFACTS_MSGVERSION_MINOR_MASK) >>
 	    MPI2_IOCFACTS_MSGVERSION_MINOR_SHIFT);
 
 	mps_dprint(sc, MPS_INFO, "Firmware: %s, Driver: %s\n", sc->fw_version,
 	    MPS_DRIVER_VERSION);
 	mps_dprint(sc, MPS_INFO, "IOCCapabilities: %b\n",
 	     sc->facts->IOCCapabilities,
 	    "\20" "\3ScsiTaskFull" "\4DiagTrace" "\5SnapBuf" "\6ExtBuf"
 	    "\7EEDP" "\10BiDirTarg" "\11Multicast" "\14TransRetry" "\15IR"
 	    "\16EventReplay" "\17RaidAccel" "\20MSIXIndex" "\21HostDisc");
 
 	/*
 	 * If the chip doesn't support event replay then a hard reset will be
 	 * required to trigger a full discovery.  Do the reset here then
 	 * retransition to Ready.  A hard reset might have already been done,
 	 * but it doesn't hurt to do it again.  Only do this if attaching, not
 	 * for a Diag Reset.
 	 */
 	if (attaching && ((sc->facts->IOCCapabilities &
 	    MPI2_IOCFACTS_CAPABILITY_EVENT_REPLAY) == 0)) {
 		mps_dprint(sc, MPS_INIT, "No event replay, reseting\n");
 		mps_diag_reset(sc, NO_SLEEP);
 		if ((error = mps_transition_ready(sc)) != 0) {
 			mps_dprint(sc, MPS_INIT|MPS_FAULT, "Failed to "
 			    "transition to ready with error %d, exit\n",
 			    error);
 			return (error);
 		}
 	}
 
 	/*
 	 * Set flag if IR Firmware is loaded.  If the RAID Capability has
 	 * changed from the previous IOC Facts, log a warning, but only if
 	 * checking this after a Diag Reset and not during attach.
 	 */
 	saved_mode = sc->ir_firmware;
 	if (sc->facts->IOCCapabilities &
 	    MPI2_IOCFACTS_CAPABILITY_INTEGRATED_RAID)
 		sc->ir_firmware = 1;
 	if (!attaching) {
 		if (sc->ir_firmware != saved_mode) {
 			mps_dprint(sc, MPS_INIT|MPS_FAULT, "new IR/IT mode "
 			    "in IOC Facts does not match previous mode\n");
 		}
 	}
 
 	/* Only deallocate and reallocate if relevant IOC Facts have changed */
 	reallocating = FALSE;
 	sc->mps_flags &= ~MPS_FLAGS_REALLOCATED;
 
 	if ((!attaching) &&
 	    ((saved_facts.MsgVersion != sc->facts->MsgVersion) ||
 	    (saved_facts.HeaderVersion != sc->facts->HeaderVersion) ||
 	    (saved_facts.MaxChainDepth != sc->facts->MaxChainDepth) ||
 	    (saved_facts.RequestCredit != sc->facts->RequestCredit) ||
 	    (saved_facts.ProductID != sc->facts->ProductID) ||
 	    (saved_facts.IOCCapabilities != sc->facts->IOCCapabilities) ||
 	    (saved_facts.IOCRequestFrameSize !=
 	    sc->facts->IOCRequestFrameSize) ||
 	    (saved_facts.MaxTargets != sc->facts->MaxTargets) ||
 	    (saved_facts.MaxSasExpanders != sc->facts->MaxSasExpanders) ||
 	    (saved_facts.MaxEnclosures != sc->facts->MaxEnclosures) ||
 	    (saved_facts.HighPriorityCredit != sc->facts->HighPriorityCredit) ||
 	    (saved_facts.MaxReplyDescriptorPostQueueDepth !=
 	    sc->facts->MaxReplyDescriptorPostQueueDepth) ||
 	    (saved_facts.ReplyFrameSize != sc->facts->ReplyFrameSize) ||
 	    (saved_facts.MaxVolumes != sc->facts->MaxVolumes) ||
 	    (saved_facts.MaxPersistentEntries !=
 	    sc->facts->MaxPersistentEntries))) {
 		reallocating = TRUE;
 
 		/* Record that we reallocated everything */
 		sc->mps_flags |= MPS_FLAGS_REALLOCATED;
 	}
 
 	/*
 	 * Some things should be done if attaching or re-allocating after a Diag
 	 * Reset, but are not needed after a Diag Reset if the FW has not
 	 * changed.
 	 */
 	if (attaching || reallocating) {
 		/*
 		 * Check if controller supports FW diag buffers and set flag to
 		 * enable each type.
 		 */
 		if (sc->facts->IOCCapabilities &
 		    MPI2_IOCFACTS_CAPABILITY_DIAG_TRACE_BUFFER)
 			sc->fw_diag_buffer_list[MPI2_DIAG_BUF_TYPE_TRACE].
 			    enabled = TRUE;
 		if (sc->facts->IOCCapabilities &
 		    MPI2_IOCFACTS_CAPABILITY_SNAPSHOT_BUFFER)
 			sc->fw_diag_buffer_list[MPI2_DIAG_BUF_TYPE_SNAPSHOT].
 			    enabled = TRUE;
 		if (sc->facts->IOCCapabilities &
 		    MPI2_IOCFACTS_CAPABILITY_EXTENDED_BUFFER)
 			sc->fw_diag_buffer_list[MPI2_DIAG_BUF_TYPE_EXTENDED].
 			    enabled = TRUE;
 
 		/*
 		 * Set flag if EEDP is supported and if TLR is supported.
 		 */
 		if (sc->facts->IOCCapabilities & MPI2_IOCFACTS_CAPABILITY_EEDP)
 			sc->eedp_enabled = TRUE;
 		if (sc->facts->IOCCapabilities & MPI2_IOCFACTS_CAPABILITY_TLR)
 			sc->control_TLR = TRUE;
 
 		mps_resize_queues(sc);
 
 		/*
 		 * Initialize all Tail Queues
 		 */
 		TAILQ_INIT(&sc->req_list);
 		TAILQ_INIT(&sc->high_priority_req_list);
 		TAILQ_INIT(&sc->chain_list);
 		TAILQ_INIT(&sc->tm_list);
 	}
 
 	/*
 	 * If doing a Diag Reset and the FW is significantly different
 	 * (reallocating will be set above in IOC Facts comparison), then all
 	 * buffers based on the IOC Facts will need to be freed before they are
 	 * reallocated.
 	 */
 	if (reallocating) {
 		mps_iocfacts_free(sc);
 		mpssas_realloc_targets(sc, saved_facts.MaxTargets +
 		    saved_facts.MaxVolumes);
 	}
 
 	/*
 	 * Any deallocation has been completed.  Now start reallocating
 	 * if needed.  Will only need to reallocate if attaching or if the new
 	 * IOC Facts are different from the previous IOC Facts after a Diag
 	 * Reset. Targets have already been allocated above if needed.
 	 */
 	error = 0;
 	while (attaching || reallocating) {
 		if ((error = mps_alloc_hw_queues(sc)) != 0)
 			break;
 		if ((error = mps_alloc_replies(sc)) != 0)
 			break;
 		if ((error = mps_alloc_requests(sc)) != 0)
 			break;
 		if ((error = mps_alloc_queues(sc)) != 0)
 			break;
 
 		break;
 	}
 	if (error) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT,
 		    "Failed to alloc queues with error %d\n", error);
 		mps_free(sc);
 		return (error);
 	}
 
 	/* Always initialize the queues */
 	bzero(sc->free_queue, sc->fqdepth * 4);
 	mps_init_queues(sc);
 
 	/*
 	 * Always get the chip out of the reset state, but only panic if not
 	 * attaching.  If attaching and there is an error, that is handled by
 	 * the OS.
 	 */
 	error = mps_transition_operational(sc);
 	if (error != 0) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT, "Failed to "
 		    "transition to operational with error %d\n", error);
 		mps_free(sc);
 		return (error);
 	}
 
 	/*
 	 * Finish the queue initialization.
 	 * These are set here instead of in mps_init_queues() because the
 	 * IOC resets these values during the state transition in
 	 * mps_transition_operational().  The free index is set to 1
 	 * because the corresponding index in the IOC is set to 0, and the
 	 * IOC treats the queues as full if both are set to the same value.
 	 * Hence the reason that the queue can't hold all of the possible
 	 * replies.
 	 */
 	sc->replypostindex = 0;
 	mps_regwrite(sc, MPI2_REPLY_FREE_HOST_INDEX_OFFSET, sc->replyfreeindex);
 	mps_regwrite(sc, MPI2_REPLY_POST_HOST_INDEX_OFFSET, 0);
 
 	/*
 	 * Attach the subsystems so they can prepare their event masks.
 	 * XXX Should be dynamic so that IM/IR and user modules can attach
 	 */
 	error = 0;
 	while (attaching) {
 		mps_dprint(sc, MPS_INIT, "Attaching subsystems\n");
 		if ((error = mps_attach_log(sc)) != 0)
 			break;
 		if ((error = mps_attach_sas(sc)) != 0)
 			break;
 		if ((error = mps_attach_user(sc)) != 0)
 			break;
 		break;
 	}
 	if (error) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT, "Failed to attach all "
 		    "subsystems: error %d\n", error);
 		mps_free(sc);
 		return (error);
 	}
 
 	/*
 	 * XXX If the number of MSI-X vectors changes during re-init, this
 	 * won't see it and adjust.
 	 */
 	if (attaching && (error = mps_pci_setup_interrupts(sc)) != 0) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT, "Failed to setup "
 		    "interrupts\n");
 		mps_free(sc);
 		return (error);
 	}
 
 	/*
 	 * Set flag if this is a WD controller.  This shouldn't ever change, but
 	 * reset it after a Diag Reset, just in case.
 	 */
 	sc->WD_available = FALSE;
 	if (pci_get_device(sc->mps_dev) == MPI2_MFGPAGE_DEVID_SSS6200)
 		sc->WD_available = TRUE;
 
 	return (error);
 }
 
 /*
  * This is called if memory is being free (during detach for example) and when
  * buffers need to be reallocated due to a Diag Reset.
  */
 static void
 mps_iocfacts_free(struct mps_softc *sc)
 {
 	struct mps_command *cm;
 	int i;
 
 	mps_dprint(sc, MPS_TRACE, "%s\n", __func__);
 
 	if (sc->free_busaddr != 0)
 		bus_dmamap_unload(sc->queues_dmat, sc->queues_map);
 	if (sc->free_queue != NULL)
 		bus_dmamem_free(sc->queues_dmat, sc->free_queue,
 		    sc->queues_map);
 	if (sc->queues_dmat != NULL)
 		bus_dma_tag_destroy(sc->queues_dmat);
 
 	if (sc->chain_frames != NULL) {
 		bus_dmamap_unload(sc->chain_dmat, sc->chain_map);
 		bus_dmamem_free(sc->chain_dmat, sc->chain_frames,
 		    sc->chain_map);
 	}
 	if (sc->chain_dmat != NULL)
 		bus_dma_tag_destroy(sc->chain_dmat);
 
 	if (sc->sense_busaddr != 0)
 		bus_dmamap_unload(sc->sense_dmat, sc->sense_map);
 	if (sc->sense_frames != NULL)
 		bus_dmamem_free(sc->sense_dmat, sc->sense_frames,
 		    sc->sense_map);
 	if (sc->sense_dmat != NULL)
 		bus_dma_tag_destroy(sc->sense_dmat);
 
 	if (sc->reply_busaddr != 0)
 		bus_dmamap_unload(sc->reply_dmat, sc->reply_map);
 	if (sc->reply_frames != NULL)
 		bus_dmamem_free(sc->reply_dmat, sc->reply_frames,
 		    sc->reply_map);
 	if (sc->reply_dmat != NULL)
 		bus_dma_tag_destroy(sc->reply_dmat);
 
 	if (sc->req_busaddr != 0)
 		bus_dmamap_unload(sc->req_dmat, sc->req_map);
 	if (sc->req_frames != NULL)
 		bus_dmamem_free(sc->req_dmat, sc->req_frames, sc->req_map);
 	if (sc->req_dmat != NULL)
 		bus_dma_tag_destroy(sc->req_dmat);
 
 	if (sc->chains != NULL)
 		free(sc->chains, M_MPT2);
 	if (sc->commands != NULL) {
 		for (i = 1; i < sc->num_reqs; i++) {
 			cm = &sc->commands[i];
 			bus_dmamap_destroy(sc->buffer_dmat, cm->cm_dmamap);
 		}
 		free(sc->commands, M_MPT2);
 	}
 	if (sc->buffer_dmat != NULL)
 		bus_dma_tag_destroy(sc->buffer_dmat);
 
 	mps_pci_free_interrupts(sc);
 	free(sc->queues, M_MPT2);
 	sc->queues = NULL;
 }
 
 /* 
  * The terms diag reset and hard reset are used interchangeably in the MPI
  * docs to mean resetting the controller chip.  In this code diag reset
  * cleans everything up, and the hard reset function just sends the reset
  * sequence to the chip.  This should probably be refactored so that every
  * subsystem gets a reset notification of some sort, and can clean up
  * appropriately.
  */
 int
 mps_reinit(struct mps_softc *sc)
 {
 	int error;
 	struct mpssas_softc *sassc;
 
 	sassc = sc->sassc;
 
 	MPS_FUNCTRACE(sc);
 
 	mtx_assert(&sc->mps_mtx, MA_OWNED);
 
 	mps_dprint(sc, MPS_INIT|MPS_INFO, "Reinitializing controller\n");
 	if (sc->mps_flags & MPS_FLAGS_DIAGRESET) {
 		mps_dprint(sc, MPS_INIT, "Reset already in progress\n");
 		return 0;
 	}
 
 	/* make sure the completion callbacks can recognize they're getting
 	 * a NULL cm_reply due to a reset.
 	 */
 	sc->mps_flags |= MPS_FLAGS_DIAGRESET;
 
 	/*
 	 * Mask interrupts here.
 	 */
 	mps_dprint(sc, MPS_INIT, "masking interrupts and resetting\n");
 	mps_mask_intr(sc);
 
 	error = mps_diag_reset(sc, CAN_SLEEP);
 	if (error != 0) {
 		/* XXXSL No need to panic here */
 		panic("%s hard reset failed with error %d\n",
 		    __func__, error);
 	}
 
 	/* Restore the PCI state, including the MSI-X registers */
 	mps_pci_restore(sc);
 
 	/* Give the I/O subsystem special priority to get itself prepared */
 	mpssas_handle_reinit(sc);
 
 	/*
 	 * Get IOC Facts and allocate all structures based on this information.
 	 * The attach function will also call mps_iocfacts_allocate at startup.
 	 * If relevant values have changed in IOC Facts, this function will free
 	 * all of the memory based on IOC Facts and reallocate that memory.
 	 */
 	if ((error = mps_iocfacts_allocate(sc, FALSE)) != 0) {
 		panic("%s IOC Facts based allocation failed with error %d\n",
 		    __func__, error);
 	}
 
 	/*
 	 * Mapping structures will be re-allocated after getting IOC Page8, so
 	 * free these structures here.
 	 */
 	mps_mapping_exit(sc);
 
 	/*
 	 * The static page function currently read is IOC Page8.  Others can be
 	 * added in future.  It's possible that the values in IOC Page8 have
 	 * changed after a Diag Reset due to user modification, so always read
 	 * these.  Interrupts are masked, so unmask them before getting config
 	 * pages.
 	 */
 	mps_unmask_intr(sc);
 	sc->mps_flags &= ~MPS_FLAGS_DIAGRESET;
 	mps_base_static_config_pages(sc);
 
 	/*
 	 * Some mapping info is based in IOC Page8 data, so re-initialize the
 	 * mapping tables.
 	 */
 	mps_mapping_initialize(sc);
 
 	/*
 	 * Restart will reload the event masks clobbered by the reset, and
 	 * then enable the port.
 	 */
 	mps_reregister_events(sc);
 
 	/* the end of discovery will release the simq, so we're done. */
 	mps_dprint(sc, MPS_INIT|MPS_XINFO, "Finished sc %p post %u free %u\n", 
 	    sc, sc->replypostindex, sc->replyfreeindex);
 
 	mpssas_release_simq_reinit(sassc);
 	mps_dprint(sc, MPS_INIT, "%s exit\n", __func__);
 
 	return 0;
 }
 
 /* Wait for the chip to ACK a word that we've put into its FIFO 
  * Wait for <timeout> seconds. In single loop wait for busy loop
  * for 500 microseconds.
  * Total is [ 0.5 * (2000 * <timeout>) ] in miliseconds.
  * */
 static int
 mps_wait_db_ack(struct mps_softc *sc, int timeout, int sleep_flag)
 {
 
 	u32 cntdn, count;
 	u32 int_status;
 	u32 doorbell;
 
 	count = 0;
 	cntdn = (sleep_flag == CAN_SLEEP) ? 1000*timeout : 2000*timeout;
 	do {
 		int_status = mps_regread(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET);
 		if (!(int_status & MPI2_HIS_SYS2IOC_DB_STATUS)) {
 			mps_dprint(sc, MPS_TRACE, 
 			"%s: successful count(%d), timeout(%d)\n",
 			__func__, count, timeout);
 		return 0;
 		} else if (int_status & MPI2_HIS_IOC2SYS_DB_STATUS) {
 			doorbell = mps_regread(sc, MPI2_DOORBELL_OFFSET);
 			if ((doorbell & MPI2_IOC_STATE_MASK) ==
 				MPI2_IOC_STATE_FAULT) {
 				mps_dprint(sc, MPS_FAULT, 
 					"fault_state(0x%04x)!\n", doorbell);
 				return (EFAULT);
 			}
 		} else if (int_status == 0xFFFFFFFF)
 			goto out;
 
 		/* If it can sleep, sleep for 1 milisecond, else busy loop for 
 		* 0.5 milisecond */
 		if (mtx_owned(&sc->mps_mtx) && sleep_flag == CAN_SLEEP)
 			msleep(&sc->msleep_fake_chan, &sc->mps_mtx, 0, 
 			"mpsdba", hz/1000);
 		else if (sleep_flag == CAN_SLEEP)
 			pause("mpsdba", hz/1000);
 		else
 			DELAY(500);
 		count++;
 	} while (--cntdn);
 
 	out:
 	mps_dprint(sc, MPS_FAULT, "%s: failed due to timeout count(%d), "
 		"int_status(%x)!\n", __func__, count, int_status);
 	return (ETIMEDOUT);
 
 }
 
 /* Wait for the chip to signal that the next word in its FIFO can be fetched */
 static int
 mps_wait_db_int(struct mps_softc *sc)
 {
 	int retry;
 
 	for (retry = 0; retry < MPS_DB_MAX_WAIT; retry++) {
 		if ((mps_regread(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET) &
 		    MPI2_HIS_IOC2SYS_DB_STATUS) != 0)
 			return (0);
 		DELAY(2000);
 	}
 	return (ETIMEDOUT);
 }
 
 /* Step through the synchronous command state machine, i.e. "Doorbell mode" */
 static int
 mps_request_sync(struct mps_softc *sc, void *req, MPI2_DEFAULT_REPLY *reply,
     int req_sz, int reply_sz, int timeout)
 {
 	uint32_t *data32;
 	uint16_t *data16;
 	int i, count, ioc_sz, residual;
 	int sleep_flags = CAN_SLEEP;
 
 	if (curthread->td_no_sleeping != 0)
 		sleep_flags = NO_SLEEP;
 
 	/* Step 1 */
 	mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	/* Step 2 */
 	if (mps_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_USED)
 		return (EBUSY);
 
 	/* Step 3
 	 * Announce that a message is coming through the doorbell.  Messages
 	 * are pushed at 32bit words, so round up if needed.
 	 */
 	count = (req_sz + 3) / 4;
 	mps_regwrite(sc, MPI2_DOORBELL_OFFSET,
 	    (MPI2_FUNCTION_HANDSHAKE << MPI2_DOORBELL_FUNCTION_SHIFT) |
 	    (count << MPI2_DOORBELL_ADD_DWORDS_SHIFT));
 
 	/* Step 4 */
 	if (mps_wait_db_int(sc) ||
 	    (mps_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_USED) == 0) {
 		mps_dprint(sc, MPS_FAULT, "Doorbell failed to activate\n");
 		return (ENXIO);
 	}
 	mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	if (mps_wait_db_ack(sc, 5, sleep_flags) != 0) {
 		mps_dprint(sc, MPS_FAULT, "Doorbell handshake failed\n");
 		return (ENXIO);
 	}
 
 	/* Step 5 */
 	/* Clock out the message data synchronously in 32-bit dwords*/
 	data32 = (uint32_t *)req;
 	for (i = 0; i < count; i++) {
 		mps_regwrite(sc, MPI2_DOORBELL_OFFSET, htole32(data32[i]));
 		if (mps_wait_db_ack(sc, 5, sleep_flags) != 0) {
 			mps_dprint(sc, MPS_FAULT,
 			    "Timeout while writing doorbell\n");
 			return (ENXIO);
 		}
 	}
 
 	/* Step 6 */
 	/* Clock in the reply in 16-bit words.  The total length of the
 	 * message is always in the 4th byte, so clock out the first 2 words
 	 * manually, then loop the rest.
 	 */
 	data16 = (uint16_t *)reply;
 	if (mps_wait_db_int(sc) != 0) {
 		mps_dprint(sc, MPS_FAULT, "Timeout reading doorbell 0\n");
 		return (ENXIO);
 	}
 	data16[0] =
 	    mps_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_DATA_MASK;
 	mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	if (mps_wait_db_int(sc) != 0) {
 		mps_dprint(sc, MPS_FAULT, "Timeout reading doorbell 1\n");
 		return (ENXIO);
 	}
 	data16[1] =
 	    mps_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_DATA_MASK;
 	mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	/* Number of 32bit words in the message */
 	ioc_sz = reply->MsgLength;
 
 	/*
 	 * Figure out how many 16bit words to clock in without overrunning.
 	 * The precision loss with dividing reply_sz can safely be
 	 * ignored because the messages can only be multiples of 32bits.
 	 */
 	residual = 0;
 	count = MIN((reply_sz / 4), ioc_sz) * 2;
 	if (count < ioc_sz * 2) {
 		residual = ioc_sz * 2 - count;
 		mps_dprint(sc, MPS_ERROR, "Driver error, throwing away %d "
 		    "residual message words\n", residual);
 	}
 
 	for (i = 2; i < count; i++) {
 		if (mps_wait_db_int(sc) != 0) {
 			mps_dprint(sc, MPS_FAULT,
 			    "Timeout reading doorbell %d\n", i);
 			return (ENXIO);
 		}
 		data16[i] = mps_regread(sc, MPI2_DOORBELL_OFFSET) &
 		    MPI2_DOORBELL_DATA_MASK;
 		mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	}
 
 	/*
 	 * Pull out residual words that won't fit into the provided buffer.
 	 * This keeps the chip from hanging due to a driver programming
 	 * error.
 	 */
 	while (residual--) {
 		if (mps_wait_db_int(sc) != 0) {
 			mps_dprint(sc, MPS_FAULT,
 			    "Timeout reading doorbell\n");
 			return (ENXIO);
 		}
 		(void)mps_regread(sc, MPI2_DOORBELL_OFFSET);
 		mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 	}
 
 	/* Step 7 */
 	if (mps_wait_db_int(sc) != 0) {
 		mps_dprint(sc, MPS_FAULT, "Timeout waiting to exit doorbell\n");
 		return (ENXIO);
 	}
 	if (mps_regread(sc, MPI2_DOORBELL_OFFSET) & MPI2_DOORBELL_USED)
 		mps_dprint(sc, MPS_FAULT, "Warning, doorbell still active\n");
 	mps_regwrite(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET, 0x0);
 
 	return (0);
 }
 
 static void
 mps_enqueue_request(struct mps_softc *sc, struct mps_command *cm)
 {
 	reply_descriptor rd;
 	MPS_FUNCTRACE(sc);
 	mps_dprint(sc, MPS_TRACE, "SMID %u cm %p ccb %p\n",
 	    cm->cm_desc.Default.SMID, cm, cm->cm_ccb);
 
 	if (sc->mps_flags & MPS_FLAGS_ATTACH_DONE && !(sc->mps_flags & MPS_FLAGS_SHUTDOWN))
 		mtx_assert(&sc->mps_mtx, MA_OWNED);
 
 	if (++sc->io_cmds_active > sc->io_cmds_highwater)
 		sc->io_cmds_highwater++;
 	rd.u.low = cm->cm_desc.Words.Low;
 	rd.u.high = cm->cm_desc.Words.High;
 	rd.word = htole64(rd.word);
 
 	KASSERT(cm->cm_state == MPS_CM_STATE_BUSY, ("command not busy\n"));
 	cm->cm_state = MPS_CM_STATE_INQUEUE;
 
 	/* TODO-We may need to make below regwrite atomic */
 	mps_regwrite(sc, MPI2_REQUEST_DESCRIPTOR_POST_LOW_OFFSET,
 	    rd.u.low);
 	mps_regwrite(sc, MPI2_REQUEST_DESCRIPTOR_POST_HIGH_OFFSET,
 	    rd.u.high);
 }
 
 /*
  * Just the FACTS, ma'am.
  */
 static int
 mps_get_iocfacts(struct mps_softc *sc, MPI2_IOC_FACTS_REPLY *facts)
 {
 	MPI2_DEFAULT_REPLY *reply;
 	MPI2_IOC_FACTS_REQUEST request;
 	int error, req_sz, reply_sz;
 
 	MPS_FUNCTRACE(sc);
 	mps_dprint(sc, MPS_INIT, "%s entered\n", __func__);
 
 	req_sz = sizeof(MPI2_IOC_FACTS_REQUEST);
 	reply_sz = sizeof(MPI2_IOC_FACTS_REPLY);
 	reply = (MPI2_DEFAULT_REPLY *)facts;
 
 	bzero(&request, req_sz);
 	request.Function = MPI2_FUNCTION_IOC_FACTS;
 	error = mps_request_sync(sc, &request, reply, req_sz, reply_sz, 5);
 	mps_dprint(sc, MPS_INIT, "%s exit error= %d\n", __func__, error);
 
 	return (error);
 }
 
 static int
 mps_send_iocinit(struct mps_softc *sc)
 {
 	MPI2_IOC_INIT_REQUEST	init;
 	MPI2_DEFAULT_REPLY	reply;
 	int req_sz, reply_sz, error;
 	struct timeval now;
 	uint64_t time_in_msec;
 
 	MPS_FUNCTRACE(sc);
 	mps_dprint(sc, MPS_INIT, "%s entered\n", __func__);
 
 	/* Do a quick sanity check on proper initialization */
 	if ((sc->pqdepth == 0) || (sc->fqdepth == 0) || (sc->reqframesz == 0)
 	    || (sc->replyframesz == 0)) {
 		mps_dprint(sc, MPS_INIT|MPS_ERROR,
 		    "Driver not fully initialized for IOCInit\n");
 		return (EINVAL);
 	}
 
 	req_sz = sizeof(MPI2_IOC_INIT_REQUEST);
 	reply_sz = sizeof(MPI2_IOC_INIT_REPLY);
 	bzero(&init, req_sz);
 	bzero(&reply, reply_sz);
 
 	/*
 	 * Fill in the init block.  Note that most addresses are
 	 * deliberately in the lower 32bits of memory.  This is a micro-
 	 * optimzation for PCI/PCIX, though it's not clear if it helps PCIe.
 	 */
 	init.Function = MPI2_FUNCTION_IOC_INIT;
 	init.WhoInit = MPI2_WHOINIT_HOST_DRIVER;
 	init.MsgVersion = htole16(MPI2_VERSION);
 	init.HeaderVersion = htole16(MPI2_HEADER_VERSION);
 	init.SystemRequestFrameSize = htole16((uint16_t)(sc->reqframesz / 4));
 	init.ReplyDescriptorPostQueueDepth = htole16(sc->pqdepth);
 	init.ReplyFreeQueueDepth = htole16(sc->fqdepth);
 	init.SenseBufferAddressHigh = 0;
 	init.SystemReplyAddressHigh = 0;
 	init.SystemRequestFrameBaseAddress.High = 0;
 	init.SystemRequestFrameBaseAddress.Low = htole32((uint32_t)sc->req_busaddr);
 	init.ReplyDescriptorPostQueueAddress.High = 0;
 	init.ReplyDescriptorPostQueueAddress.Low = htole32((uint32_t)sc->post_busaddr);
 	init.ReplyFreeQueueAddress.High = 0;
 	init.ReplyFreeQueueAddress.Low = htole32((uint32_t)sc->free_busaddr);
 	getmicrotime(&now);
 	time_in_msec = (now.tv_sec * 1000 + now.tv_usec/1000);
 	init.TimeStamp.High = htole32((time_in_msec >> 32) & 0xFFFFFFFF);
 	init.TimeStamp.Low = htole32(time_in_msec & 0xFFFFFFFF);
 
 	error = mps_request_sync(sc, &init, &reply, req_sz, reply_sz, 5);
 	if ((reply.IOCStatus & MPI2_IOCSTATUS_MASK) != MPI2_IOCSTATUS_SUCCESS)
 		error = ENXIO;
 
 	mps_dprint(sc, MPS_INIT, "IOCInit status= 0x%x\n", reply.IOCStatus);
 	mps_dprint(sc, MPS_INIT, "%s exit\n", __func__);
 	return (error);
 }
 
 void
 mps_memaddr_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	bus_addr_t *addr;
 
 	addr = arg;
 	*addr = segs[0].ds_addr;
 }
 
 void
 mps_memaddr_wait_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	struct mps_busdma_context *ctx;
 	int need_unload, need_free;
 
 	ctx = (struct mps_busdma_context *)arg;
 	need_unload = 0;
 	need_free = 0;
 
 	mps_lock(ctx->softc);
 	ctx->error = error;
 	ctx->completed = 1;
 	if ((error == 0) && (ctx->abandoned == 0)) {
 		*ctx->addr = segs[0].ds_addr;
 	} else {
 		if (nsegs != 0)
 			need_unload = 1;
 		if (ctx->abandoned != 0)
 			need_free = 1;
 	}
 	if (need_free == 0)
 		wakeup(ctx);
 
 	mps_unlock(ctx->softc);
 
 	if (need_unload != 0) {
 		bus_dmamap_unload(ctx->buffer_dmat,
 				  ctx->buffer_dmamap);
 		*ctx->addr = 0;
 	}
 
 	if (need_free != 0)
 		free(ctx, M_MPSUSER);
 }
 
 static int
 mps_alloc_queues(struct mps_softc *sc)
 {
 	struct mps_queue *q;
 	u_int nq, i;
 
 	nq = sc->msi_msgs;
 	mps_dprint(sc, MPS_INIT|MPS_XINFO, "Allocating %d I/O queues\n", nq);
 
 	sc->queues = malloc(sizeof(struct mps_queue) * nq, M_MPT2,
 	    M_NOWAIT|M_ZERO);
 	if (sc->queues == NULL)
 		return (ENOMEM);
 
 	for (i = 0; i < nq; i++) {
 		q = &sc->queues[i];
 		mps_dprint(sc, MPS_INIT, "Configuring queue %d %p\n", i, q);
 		q->sc = sc;
 		q->qnum = i;
 	}
 
 	return (0);
 }
 
 static int
 mps_alloc_hw_queues(struct mps_softc *sc)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	bus_addr_t queues_busaddr;
 	uint8_t *queues;
 	int qsize, fqsize, pqsize;
 
 	/*
 	 * The reply free queue contains 4 byte entries in multiples of 16 and
 	 * aligned on a 16 byte boundary. There must always be an unused entry.
 	 * This queue supplies fresh reply frames for the firmware to use.
 	 *
 	 * The reply descriptor post queue contains 8 byte entries in
 	 * multiples of 16 and aligned on a 16 byte boundary.  This queue
 	 * contains filled-in reply frames sent from the firmware to the host.
 	 *
 	 * These two queues are allocated together for simplicity.
 	 */
 	sc->fqdepth = roundup2(sc->num_replies + 1, 16);
 	sc->pqdepth = roundup2(sc->num_replies + 1, 16);
 	fqsize= sc->fqdepth * 4;
 	pqsize = sc->pqdepth * 8;
 	qsize = fqsize + pqsize;
 
 	bus_dma_template_init(&t, sc->mps_parent_dmat);
-	t.alignment = 16;
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = qsize;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(16), BD_MAXSIZE(qsize),
+	    BD_MAXSEGSIZE(qsize), BD_NSEGMENTS(1),
+	    BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
 	if (bus_dma_template_tag(&t, &sc->queues_dmat)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate queues DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->queues_dmat, (void **)&queues, BUS_DMA_NOWAIT,
 	    &sc->queues_map)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate queues memory\n");
 		return (ENOMEM);
         }
         bzero(queues, qsize);
         bus_dmamap_load(sc->queues_dmat, sc->queues_map, queues, qsize,
 	    mps_memaddr_cb, &queues_busaddr, 0);
 
 	sc->free_queue = (uint32_t *)queues;
 	sc->free_busaddr = queues_busaddr;
 	sc->post_queue = (MPI2_REPLY_DESCRIPTORS_UNION *)(queues + fqsize);
 	sc->post_busaddr = queues_busaddr + fqsize;
 	mps_dprint(sc, MPS_INIT, "free queue busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->free_busaddr, fqsize);
 	mps_dprint(sc, MPS_INIT, "reply queue busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->post_busaddr, pqsize);
 
 	return (0);
 }
 
 static int
 mps_alloc_replies(struct mps_softc *sc)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	int rsize, num_replies;
 
 	/* Store the reply frame size in bytes rather than as 32bit words */
 	sc->replyframesz = sc->facts->ReplyFrameSize * 4;
 
 	/*
 	 * sc->num_replies should be one less than sc->fqdepth.  We need to
 	 * allocate space for sc->fqdepth replies, but only sc->num_replies
 	 * replies can be used at once.
 	 */
 	num_replies = max(sc->fqdepth, sc->num_replies);
 
 	rsize = sc->replyframesz * num_replies; 
 	bus_dma_template_init(&t, sc->mps_parent_dmat);
-	t.alignment = 4;
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = rsize;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(4), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize), BD_NSEGMENTS(1),
+	    BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
 	if (bus_dma_template_tag(&t, &sc->reply_dmat)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate replies DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->reply_dmat, (void **)&sc->reply_frames,
 	    BUS_DMA_NOWAIT, &sc->reply_map)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate replies memory\n");
 		return (ENOMEM);
         }
         bzero(sc->reply_frames, rsize);
         bus_dmamap_load(sc->reply_dmat, sc->reply_map, sc->reply_frames, rsize,
 	    mps_memaddr_cb, &sc->reply_busaddr, 0);
 
 	mps_dprint(sc, MPS_INIT, "reply frames busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->reply_busaddr, rsize);
 
 	return (0);
 }
 
 static void
 mps_load_chains_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	struct mps_softc *sc = arg;
 	struct mps_chain *chain;
 	bus_size_t bo;
 	int i, o, s;
 
 	if (error != 0)
 		return;
 
 	for (i = 0, o = 0, s = 0; s < nsegs; s++) {
 		for (bo = 0; bo + sc->reqframesz <= segs[s].ds_len;
 		    bo += sc->reqframesz) {
 			chain = &sc->chains[i++];
 			chain->chain =(MPI2_SGE_IO_UNION *)(sc->chain_frames+o);
 			chain->chain_busaddr = segs[s].ds_addr + bo;
 			o += sc->reqframesz;
 			mps_free_chain(sc, chain);
 		}
 		if (bo != segs[s].ds_len)
 			o += segs[s].ds_len - bo;
 	}
 	sc->chain_free_lowwater = i;
 }
 
 static int
 mps_alloc_requests(struct mps_softc *sc)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	struct mps_command *cm;
 	int i, rsize, nsegs;
 
 	rsize = sc->reqframesz * sc->num_reqs;
 	bus_dma_template_init(&t, sc->mps_parent_dmat);
-	t.alignment = 16;
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = rsize;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(16), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize), BD_NSEGMENTS(1),
+	    BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
         if (bus_dma_template_tag(&t, &sc->req_dmat)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate request DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->req_dmat, (void **)&sc->req_frames,
 	    BUS_DMA_NOWAIT, &sc->req_map)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate request memory\n");
 		return (ENOMEM);
         }
         bzero(sc->req_frames, rsize);
         bus_dmamap_load(sc->req_dmat, sc->req_map, sc->req_frames, rsize,
 	    mps_memaddr_cb, &sc->req_busaddr, 0);
 	mps_dprint(sc, MPS_INIT, "request frames busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->req_busaddr, rsize);
 
 	sc->chains = malloc(sizeof(struct mps_chain) * sc->num_chains, M_MPT2,
 	    M_NOWAIT | M_ZERO);
 	if (!sc->chains) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate chain memory\n");
 		return (ENOMEM);
 	}
 	rsize = sc->reqframesz * sc->num_chains;
 	bus_dma_template_clone(&t, sc->req_dmat);
-	t.maxsize = t.maxsegsize = rsize;
-	t.nsegments = howmany(rsize, PAGE_SIZE);
+	BUS_DMA_TEMPLATE_FILL(&t, BD_MAXSIZE(rsize), BD_MAXSEGSIZE(rsize),
+	    BD_NSEGMENTS(howmany(rsize, PAGE_SIZE)));
 	if (bus_dma_template_tag(&t, &sc->chain_dmat)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate chain DMA tag\n");
 		return (ENOMEM);
 	}
 	if (bus_dmamem_alloc(sc->chain_dmat, (void **)&sc->chain_frames,
 	    BUS_DMA_NOWAIT | BUS_DMA_ZERO, &sc->chain_map)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate chain memory\n");
 		return (ENOMEM);
 	}
 	if (bus_dmamap_load(sc->chain_dmat, sc->chain_map, sc->chain_frames,
 	    rsize, mps_load_chains_cb, sc, BUS_DMA_NOWAIT)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot load chain memory\n");
 		bus_dmamem_free(sc->chain_dmat, sc->chain_frames,
 		    sc->chain_map);
 		return (ENOMEM);
 	}
 
 	rsize = MPS_SENSE_LEN * sc->num_reqs;
 	bus_dma_template_clone(&t, sc->req_dmat);
-	t.maxsize = t.maxsegsize = rsize;
-	t.alignment = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_ALIGNMENT(1), BD_MAXSIZE(rsize),
+	    BD_MAXSEGSIZE(rsize));
         if (bus_dma_template_tag(&t, &sc->sense_dmat)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate sense DMA tag\n");
 		return (ENOMEM);
         }
         if (bus_dmamem_alloc(sc->sense_dmat, (void **)&sc->sense_frames,
 	    BUS_DMA_NOWAIT, &sc->sense_map)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate sense memory\n");
 		return (ENOMEM);
         }
         bzero(sc->sense_frames, rsize);
         bus_dmamap_load(sc->sense_dmat, sc->sense_map, sc->sense_frames, rsize,
 	    mps_memaddr_cb, &sc->sense_busaddr, 0);
 	mps_dprint(sc, MPS_INIT, "sense frames busaddr= %#016jx size= %d\n",
 	    (uintmax_t)sc->sense_busaddr, rsize);
 
 	nsegs = (sc->maxio / PAGE_SIZE) + 1;
 	bus_dma_template_init(&t, sc->mps_parent_dmat);
-	t.maxsize = BUS_SPACE_MAXSIZE_32BIT;
-	t.nsegments = nsegs;
-	t.maxsegsize = BUS_SPACE_MAXSIZE_24BIT;
-	t.flags = BUS_DMA_ALLOCNOW;
-	t.lockfunc = busdma_lock_mutex;
-	t.lockfuncarg = &sc->mps_mtx;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_MAXSIZE(BUS_SPACE_MAXSIZE_32BIT),
+	    BD_NSEGMENTS(nsegs), BD_MAXSEGSIZE(BUS_SPACE_MAXSIZE_24BIT),
+	    BD_FLAGS(BUS_DMA_ALLOCNOW), BD_LOCKFUNC(busdma_lock_mutex),
+	    BD_LOCKFUNCARG(&sc->mps_mtx));
         if (bus_dma_template_tag(&t, &sc->buffer_dmat)) {
 		mps_dprint(sc, MPS_ERROR, "Cannot allocate buffer DMA tag\n");
 		return (ENOMEM);
         }
 
 	/*
 	 * SMID 0 cannot be used as a free command per the firmware spec.
 	 * Just drop that command instead of risking accounting bugs.
 	 */
 	sc->commands = malloc(sizeof(struct mps_command) * sc->num_reqs,
 	    M_MPT2, M_WAITOK | M_ZERO);
 	for (i = 1; i < sc->num_reqs; i++) {
 		cm = &sc->commands[i];
 		cm->cm_req = sc->req_frames + i * sc->reqframesz;
 		cm->cm_req_busaddr = sc->req_busaddr + i * sc->reqframesz;
 		cm->cm_sense = &sc->sense_frames[i];
 		cm->cm_sense_busaddr = sc->sense_busaddr + i * MPS_SENSE_LEN;
 		cm->cm_desc.Default.SMID = i;
 		cm->cm_sc = sc;
 		cm->cm_state = MPS_CM_STATE_BUSY;
 		TAILQ_INIT(&cm->cm_chain_list);
 		callout_init_mtx(&cm->cm_callout, &sc->mps_mtx, 0);
 
 		/* XXX Is a failure here a critical problem? */
 		if (bus_dmamap_create(sc->buffer_dmat, 0, &cm->cm_dmamap) == 0)
 			if (i <= sc->num_prireqs)
 				mps_free_high_priority_command(sc, cm);
 			else
 				mps_free_command(sc, cm);
 		else {
 			panic("failed to allocate command %d\n", i);
 			sc->num_reqs = i;
 			break;
 		}
 	}
 
 	return (0);
 }
 
 static int
 mps_init_queues(struct mps_softc *sc)
 {
 	int i;
 
 	memset((uint8_t *)sc->post_queue, 0xff, sc->pqdepth * 8);
 
 	/*
 	 * According to the spec, we need to use one less reply than we
 	 * have space for on the queue.  So sc->num_replies (the number we
 	 * use) should be less than sc->fqdepth (allocated size).
 	 */
 	if (sc->num_replies >= sc->fqdepth)
 		return (EINVAL);
 
 	/*
 	 * Initialize all of the free queue entries.
 	 */
 	for (i = 0; i < sc->fqdepth; i++)
 		sc->free_queue[i] = sc->reply_busaddr + (i * sc->replyframesz);
 	sc->replyfreeindex = sc->num_replies;
 
 	return (0);
 }
 
 /* Get the driver parameter tunables.  Lowest priority are the driver defaults.
  * Next are the global settings, if they exist.  Highest are the per-unit
  * settings, if they exist.
  */
 void
 mps_get_tunables(struct mps_softc *sc)
 {
 	char tmpstr[80], mps_debug[80];
 
 	/* XXX default to some debugging for now */
 	sc->mps_debug = MPS_INFO|MPS_FAULT;
 	sc->disable_msix = 0;
 	sc->disable_msi = 0;
 	sc->max_msix = MPS_MSIX_MAX;
 	sc->max_chains = MPS_CHAIN_FRAMES;
 	sc->max_io_pages = MPS_MAXIO_PAGES;
 	sc->enable_ssu = MPS_SSU_ENABLE_SSD_DISABLE_HDD;
 	sc->spinup_wait_time = DEFAULT_SPINUP_WAIT;
 	sc->use_phynum = 1;
 	sc->max_reqframes = MPS_REQ_FRAMES;
 	sc->max_prireqframes = MPS_PRI_REQ_FRAMES;
 	sc->max_replyframes = MPS_REPLY_FRAMES;
 	sc->max_evtframes = MPS_EVT_REPLY_FRAMES;
 
 	/*
 	 * Grab the global variables.
 	 */
 	bzero(mps_debug, 80);
 	if (TUNABLE_STR_FETCH("hw.mps.debug_level", mps_debug, 80) != 0)
 		mps_parse_debug(sc, mps_debug);
 	TUNABLE_INT_FETCH("hw.mps.disable_msix", &sc->disable_msix);
 	TUNABLE_INT_FETCH("hw.mps.disable_msi", &sc->disable_msi);
 	TUNABLE_INT_FETCH("hw.mps.max_msix", &sc->max_msix);
 	TUNABLE_INT_FETCH("hw.mps.max_chains", &sc->max_chains);
 	TUNABLE_INT_FETCH("hw.mps.max_io_pages", &sc->max_io_pages);
 	TUNABLE_INT_FETCH("hw.mps.enable_ssu", &sc->enable_ssu);
 	TUNABLE_INT_FETCH("hw.mps.spinup_wait_time", &sc->spinup_wait_time);
 	TUNABLE_INT_FETCH("hw.mps.use_phy_num", &sc->use_phynum);
 	TUNABLE_INT_FETCH("hw.mps.max_reqframes", &sc->max_reqframes);
 	TUNABLE_INT_FETCH("hw.mps.max_prireqframes", &sc->max_prireqframes);
 	TUNABLE_INT_FETCH("hw.mps.max_replyframes", &sc->max_replyframes);
 	TUNABLE_INT_FETCH("hw.mps.max_evtframes", &sc->max_evtframes);
 
 	/* Grab the unit-instance variables */
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.debug_level",
 	    device_get_unit(sc->mps_dev));
 	bzero(mps_debug, 80);
 	if (TUNABLE_STR_FETCH(tmpstr, mps_debug, 80) != 0)
 		mps_parse_debug(sc, mps_debug);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.disable_msix",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->disable_msix);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.disable_msi",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->disable_msi);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.max_msix",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_msix);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.max_chains",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_chains);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.max_io_pages",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_io_pages);
 
 	bzero(sc->exclude_ids, sizeof(sc->exclude_ids));
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.exclude_ids",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_STR_FETCH(tmpstr, sc->exclude_ids, sizeof(sc->exclude_ids));
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.enable_ssu",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->enable_ssu);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.spinup_wait_time",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->spinup_wait_time);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.use_phy_num",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->use_phynum);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.max_reqframes",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_reqframes);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.max_prireqframes",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_prireqframes);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.max_replyframes",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_replyframes);
 
 	snprintf(tmpstr, sizeof(tmpstr), "dev.mps.%d.max_evtframes",
 	    device_get_unit(sc->mps_dev));
 	TUNABLE_INT_FETCH(tmpstr, &sc->max_evtframes);
 
 }
 
 static void
 mps_setup_sysctl(struct mps_softc *sc)
 {
 	struct sysctl_ctx_list	*sysctl_ctx = NULL;
 	struct sysctl_oid	*sysctl_tree = NULL;
 	char tmpstr[80], tmpstr2[80];
 
 	/*
 	 * Setup the sysctl variable so the user can change the debug level
 	 * on the fly.
 	 */
 	snprintf(tmpstr, sizeof(tmpstr), "MPS controller %d",
 	    device_get_unit(sc->mps_dev));
 	snprintf(tmpstr2, sizeof(tmpstr2), "%d", device_get_unit(sc->mps_dev));
 
 	sysctl_ctx = device_get_sysctl_ctx(sc->mps_dev);
 	if (sysctl_ctx != NULL)
 		sysctl_tree = device_get_sysctl_tree(sc->mps_dev);
 
 	if (sysctl_tree == NULL) {
 		sysctl_ctx_init(&sc->sysctl_ctx);
 		sc->sysctl_tree = SYSCTL_ADD_NODE(&sc->sysctl_ctx,
 		    SYSCTL_STATIC_CHILDREN(_hw_mps), OID_AUTO, tmpstr2,
 		    CTLFLAG_RD | CTLFLAG_MPSAFE, 0, tmpstr);
 		if (sc->sysctl_tree == NULL)
 			return;
 		sysctl_ctx = &sc->sysctl_ctx;
 		sysctl_tree = sc->sysctl_tree;
 	}
 
 	SYSCTL_ADD_PROC(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "debug_level", CTLTYPE_STRING | CTLFLAG_RW |CTLFLAG_MPSAFE,
 	    sc, 0, mps_debug_sysctl, "A", "mps debug level");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "disable_msix", CTLFLAG_RD, &sc->disable_msix, 0,
 	    "Disable the use of MSI-X interrupts");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "disable_msi", CTLFLAG_RD, &sc->disable_msi, 0,
 	    "Disable the use of MSI interrupts");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_msix", CTLFLAG_RD, &sc->max_msix, 0,
 	    "User-defined maximum number of MSIX queues");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "msix_msgs", CTLFLAG_RD, &sc->msi_msgs, 0,
 	    "Negotiated number of MSIX queues");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_reqframes", CTLFLAG_RD, &sc->max_reqframes, 0,
 	    "Total number of allocated request frames");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_prireqframes", CTLFLAG_RD, &sc->max_prireqframes, 0,
 	    "Total number of allocated high priority request frames");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_replyframes", CTLFLAG_RD, &sc->max_replyframes, 0,
 	    "Total number of allocated reply frames");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_evtframes", CTLFLAG_RD, &sc->max_evtframes, 0,
 	    "Total number of event frames allocated");
 
 	SYSCTL_ADD_STRING(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "firmware_version", CTLFLAG_RD, sc->fw_version,
 	    strlen(sc->fw_version), "firmware version");
 
 	SYSCTL_ADD_STRING(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "driver_version", CTLFLAG_RD, MPS_DRIVER_VERSION,
 	    strlen(MPS_DRIVER_VERSION), "driver version");
 
 	SYSCTL_ADD_STRING(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "msg_version", CTLFLAG_RD, sc->msg_version,
 	    strlen(sc->msg_version), "message interface version");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "io_cmds_active", CTLFLAG_RD,
 	    &sc->io_cmds_active, 0, "number of currently active commands");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "io_cmds_highwater", CTLFLAG_RD,
 	    &sc->io_cmds_highwater, 0, "maximum active commands seen");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "chain_free", CTLFLAG_RD,
 	    &sc->chain_free, 0, "number of free chain elements");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "chain_free_lowwater", CTLFLAG_RD,
 	    &sc->chain_free_lowwater, 0,"lowest number of free chain elements");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_chains", CTLFLAG_RD,
 	    &sc->max_chains, 0,"maximum chain frames that will be allocated");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "max_io_pages", CTLFLAG_RD,
 	    &sc->max_io_pages, 0,"maximum pages to allow per I/O (if <1 use "
 	    "IOCFacts)");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "enable_ssu", CTLFLAG_RW, &sc->enable_ssu, 0,
 	    "enable SSU to SATA SSD/HDD at shutdown");
 
 	SYSCTL_ADD_UQUAD(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "chain_alloc_fail", CTLFLAG_RD,
 	    &sc->chain_alloc_fail, "chain allocation failures");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "spinup_wait_time", CTLFLAG_RD,
 	    &sc->spinup_wait_time, DEFAULT_SPINUP_WAIT, "seconds to wait for "
 	    "spinup after SATA ID error");
 
 	SYSCTL_ADD_PROC(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "mapping_table_dump",
 	    CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_NEEDGIANT, sc, 0,
 	    mps_mapping_dump, "A", "Mapping Table Dump");
 
 	SYSCTL_ADD_PROC(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "encl_table_dump",
 	    CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_NEEDGIANT, sc, 0,
 	    mps_mapping_encl_dump, "A", "Enclosure Table Dump");
 
 	SYSCTL_ADD_PROC(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "dump_reqs",
 	    CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_SKIP | CTLFLAG_NEEDGIANT,
 	    sc, 0, mps_dump_reqs, "I", "Dump Active Requests");
 
 	SYSCTL_ADD_INT(sysctl_ctx, SYSCTL_CHILDREN(sysctl_tree),
 	    OID_AUTO, "use_phy_num", CTLFLAG_RD, &sc->use_phynum, 0,
 	    "Use the phy number for enumeration");
 }
 
 static struct mps_debug_string {
 	char	*name;
 	int	flag;
 } mps_debug_strings[] = {
 	{"info", MPS_INFO},
 	{"fault", MPS_FAULT},
 	{"event", MPS_EVENT},
 	{"log", MPS_LOG},
 	{"recovery", MPS_RECOVERY},
 	{"error", MPS_ERROR},
 	{"init", MPS_INIT},
 	{"xinfo", MPS_XINFO},
 	{"user", MPS_USER},
 	{"mapping", MPS_MAPPING},
 	{"trace", MPS_TRACE}
 };
 
 enum mps_debug_level_combiner {
 	COMB_NONE,
 	COMB_ADD,
 	COMB_SUB
 };
 
 static int
 mps_debug_sysctl(SYSCTL_HANDLER_ARGS)
 {
 	struct mps_softc *sc;
 	struct mps_debug_string *string;
 	struct sbuf *sbuf;
 	char *buffer;
 	size_t sz;
 	int i, len, debug, error;
 
 	sc = (struct mps_softc *)arg1;
 
 	error = sysctl_wire_old_buffer(req, 0);
 	if (error != 0)
 		return (error);
 
 	sbuf = sbuf_new_for_sysctl(NULL, NULL, 128, req);
 	debug = sc->mps_debug;
 
 	sbuf_printf(sbuf, "%#x", debug);
 
 	sz = sizeof(mps_debug_strings) / sizeof(mps_debug_strings[0]);
 	for (i = 0; i < sz; i++) {
 		string = &mps_debug_strings[i];
 		if (debug & string->flag)
 			sbuf_printf(sbuf, ",%s", string->name);
 	}
 
 	error = sbuf_finish(sbuf);
 	sbuf_delete(sbuf);
 
 	if (error || req->newptr == NULL)
 		return (error);
 
 	len = req->newlen - req->newidx;
 	if (len == 0)
 		return (0);
 
 	buffer = malloc(len, M_MPT2, M_ZERO|M_WAITOK);
 	error = SYSCTL_IN(req, buffer, len);
 
 	mps_parse_debug(sc, buffer);
 
 	free(buffer, M_MPT2);
 	return (error);
 }
 
 static void
 mps_parse_debug(struct mps_softc *sc, char *list)
 {
 	struct mps_debug_string *string;
 	enum mps_debug_level_combiner op;
 	char *token, *endtoken;
 	size_t sz;
 	int flags, i;
 
 	if (list == NULL || *list == '\0')
 		return;
 
 	if (*list == '+') {
 		op = COMB_ADD;
 		list++;
 	} else if (*list == '-') {
 		op = COMB_SUB;
 		list++;
 	} else
 		op = COMB_NONE;
 	if (*list == '\0')
 		return;
 
 	flags = 0;
 	sz = sizeof(mps_debug_strings) / sizeof(mps_debug_strings[0]);
 	while ((token = strsep(&list, ":,")) != NULL) {
 		/* Handle integer flags */
 		flags |= strtol(token, &endtoken, 0);
 		if (token != endtoken)
 			continue;
 
 		/* Handle text flags */
 		for (i = 0; i < sz; i++) {
 			string = &mps_debug_strings[i];
 			if (strcasecmp(token, string->name) == 0) {
 				flags |= string->flag;
 				break;
 			}
 		}
 	}
 
 	switch (op) {
 	case COMB_NONE:
 		sc->mps_debug = flags;
 		break;
 	case COMB_ADD:
 		sc->mps_debug |= flags;
 		break;
 	case COMB_SUB:
 		sc->mps_debug &= (~flags);
 		break;
 	}
 
 	return;
 }
 
 struct mps_dumpreq_hdr {
 	uint32_t	smid;
 	uint32_t	state;
 	uint32_t	numframes;
 	uint32_t	deschi;
 	uint32_t	desclo;
 };
 
 static int
 mps_dump_reqs(SYSCTL_HANDLER_ARGS)
 {
 	struct mps_softc *sc;
 	struct mps_chain *chain, *chain1;
 	struct mps_command *cm;
 	struct mps_dumpreq_hdr hdr;
 	struct sbuf *sb;
 	uint32_t smid, state;
 	int i, numreqs, error = 0;
 
 	sc = (struct mps_softc *)arg1;
 
 	if ((error = priv_check(curthread, PRIV_DRIVER)) != 0) {
 		printf("priv check error %d\n", error);
 		return (error);
 	}
 
 	state = MPS_CM_STATE_INQUEUE;
 	smid = 1;
 	numreqs = sc->num_reqs;
 
 	if (req->newptr != NULL)
 		return (EINVAL);
 
 	if (smid == 0 || smid > sc->num_reqs)
 		return (EINVAL);
 	if (numreqs <= 0 || (numreqs + smid > sc->num_reqs))
 		numreqs = sc->num_reqs;
 	sb = sbuf_new_for_sysctl(NULL, NULL, 4096, req);
 
 	/* Best effort, no locking */
 	for (i = smid; i < numreqs; i++) {
 		cm = &sc->commands[i];
 		if (cm->cm_state != state)
 			continue;
 		hdr.smid = i;
 		hdr.state = cm->cm_state;
 		hdr.numframes = 1;
 		hdr.deschi = cm->cm_desc.Words.High;
 		hdr.desclo = cm->cm_desc.Words.Low;
 		TAILQ_FOREACH_SAFE(chain, &cm->cm_chain_list, chain_link,
 		   chain1)
 			hdr.numframes++;
 		sbuf_bcat(sb, &hdr, sizeof(hdr));
 		sbuf_bcat(sb, cm->cm_req, 128);
 		TAILQ_FOREACH_SAFE(chain, &cm->cm_chain_list, chain_link,
 		    chain1)
 			sbuf_bcat(sb, chain->chain, 128);
 	}
 
 	error = sbuf_finish(sb);
 	sbuf_delete(sb);
 	return (error);
 }
 
 int
 mps_attach(struct mps_softc *sc)
 {
 	int error;
 
 	MPS_FUNCTRACE(sc);
 	mps_dprint(sc, MPS_INIT, "%s entered\n", __func__);
 
 	mtx_init(&sc->mps_mtx, "MPT2SAS lock", NULL, MTX_DEF);
 	callout_init_mtx(&sc->periodic, &sc->mps_mtx, 0);
 	callout_init_mtx(&sc->device_check_callout, &sc->mps_mtx, 0);
 	TAILQ_INIT(&sc->event_list);
 	timevalclear(&sc->lastfail);
 
 	if ((error = mps_transition_ready(sc)) != 0) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT, "failed to transition "
 		    "ready\n");
 		return (error);
 	}
 
 	sc->facts = malloc(sizeof(MPI2_IOC_FACTS_REPLY), M_MPT2,
 	    M_ZERO|M_NOWAIT);
 	if(!sc->facts) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT, "Cannot allocate memory, "
 		    "exit\n");
 		return (ENOMEM);
 	}
 
 	/*
 	 * Get IOC Facts and allocate all structures based on this information.
 	 * A Diag Reset will also call mps_iocfacts_allocate and re-read the IOC
 	 * Facts. If relevant values have changed in IOC Facts, this function
 	 * will free all of the memory based on IOC Facts and reallocate that
 	 * memory.  If this fails, any allocated memory should already be freed.
 	 */
 	if ((error = mps_iocfacts_allocate(sc, TRUE)) != 0) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT, "IOC Facts based allocation "
 		    "failed with error %d, exit\n", error);
 		return (error);
 	}
 
 	/* Start the periodic watchdog check on the IOC Doorbell */
 	mps_periodic(sc);
 
 	/*
 	 * The portenable will kick off discovery events that will drive the
 	 * rest of the initialization process.  The CAM/SAS module will
 	 * hold up the boot sequence until discovery is complete.
 	 */
 	sc->mps_ich.ich_func = mps_startup;
 	sc->mps_ich.ich_arg = sc;
 	if (config_intrhook_establish(&sc->mps_ich) != 0) {
 		mps_dprint(sc, MPS_INIT|MPS_ERROR,
 		    "Cannot establish MPS config hook\n");
 		error = EINVAL;
 	}
 
 	/*
 	 * Allow IR to shutdown gracefully when shutdown occurs.
 	 */
 	sc->shutdown_eh = EVENTHANDLER_REGISTER(shutdown_final,
 	    mpssas_ir_shutdown, sc, SHUTDOWN_PRI_DEFAULT);
 
 	if (sc->shutdown_eh == NULL)
 		mps_dprint(sc, MPS_INIT|MPS_ERROR,
 		    "shutdown event registration failed\n");
 
 	mps_setup_sysctl(sc);
 
 	sc->mps_flags |= MPS_FLAGS_ATTACH_DONE;
 	mps_dprint(sc, MPS_INIT, "%s exit error= %d\n", __func__, error);
 
 	return (error);
 }
 
 /* Run through any late-start handlers. */
 static void
 mps_startup(void *arg)
 {
 	struct mps_softc *sc;
 
 	sc = (struct mps_softc *)arg;
 	mps_dprint(sc, MPS_INIT, "%s entered\n", __func__);
 
 	mps_lock(sc);
 	mps_unmask_intr(sc);
 
 	/* initialize device mapping tables */
 	mps_base_static_config_pages(sc);
 	mps_mapping_initialize(sc);
 	mpssas_startup(sc);
 	mps_unlock(sc);
 
 	mps_dprint(sc, MPS_INIT, "disestablish config intrhook\n");
 	config_intrhook_disestablish(&sc->mps_ich);
 	sc->mps_ich.ich_arg = NULL;
 
 	mps_dprint(sc, MPS_INIT, "%s exit\n", __func__);
 }
 
 /* Periodic watchdog.  Is called with the driver lock already held. */
 static void
 mps_periodic(void *arg)
 {
 	struct mps_softc *sc;
 	uint32_t db;
 
 	sc = (struct mps_softc *)arg;
 	if (sc->mps_flags & MPS_FLAGS_SHUTDOWN)
 		return;
 
 	db = mps_regread(sc, MPI2_DOORBELL_OFFSET);
 	if ((db & MPI2_IOC_STATE_MASK) == MPI2_IOC_STATE_FAULT) {
 		mps_dprint(sc, MPS_FAULT, "IOC Fault 0x%08x, Resetting\n", db);
 		mps_reinit(sc);
 	}
 
 	callout_reset(&sc->periodic, MPS_PERIODIC_DELAY * hz, mps_periodic, sc);
 }
 
 static void
 mps_log_evt_handler(struct mps_softc *sc, uintptr_t data,
     MPI2_EVENT_NOTIFICATION_REPLY *event)
 {
 	MPI2_EVENT_DATA_LOG_ENTRY_ADDED *entry;
 
 	MPS_DPRINT_EVENT(sc, generic, event);
 
 	switch (event->Event) {
 	case MPI2_EVENT_LOG_DATA:
 		mps_dprint(sc, MPS_EVENT, "MPI2_EVENT_LOG_DATA:\n");
 		if (sc->mps_debug & MPS_EVENT)
 			hexdump(event->EventData, event->EventDataLength, NULL, 0);
 		break;
 	case MPI2_EVENT_LOG_ENTRY_ADDED:
 		entry = (MPI2_EVENT_DATA_LOG_ENTRY_ADDED *)event->EventData;
 		mps_dprint(sc, MPS_EVENT, "MPI2_EVENT_LOG_ENTRY_ADDED event "
 		    "0x%x Sequence %d:\n", entry->LogEntryQualifier,
 		     entry->LogSequence);
 		break;
 	default:
 		break;
 	}
 	return;
 }
 
 static int
 mps_attach_log(struct mps_softc *sc)
 {
 	u32 events[MPI2_EVENT_NOTIFY_EVENTMASK_WORDS];
 
 	bzero(events, 16);
 	setbit(events, MPI2_EVENT_LOG_DATA);
 	setbit(events, MPI2_EVENT_LOG_ENTRY_ADDED);
 
 	mps_register_events(sc, events, mps_log_evt_handler, NULL,
 	    &sc->mps_log_eh);
 
 	return (0);
 }
 
 static int
 mps_detach_log(struct mps_softc *sc)
 {
 
 	if (sc->mps_log_eh != NULL)
 		mps_deregister_events(sc, sc->mps_log_eh);
 	return (0);
 }
 
 /*
  * Free all of the driver resources and detach submodules.  Should be called
  * without the lock held.
  */
 int
 mps_free(struct mps_softc *sc)
 {
 	int error;
 
 	mps_dprint(sc, MPS_INIT, "%s entered\n", __func__);
 	/* Turn off the watchdog */
 	mps_lock(sc);
 	sc->mps_flags |= MPS_FLAGS_SHUTDOWN;
 	mps_unlock(sc);
 	/* Lock must not be held for this */
 	callout_drain(&sc->periodic);
 	callout_drain(&sc->device_check_callout);
 
 	if (((error = mps_detach_log(sc)) != 0) ||
 	    ((error = mps_detach_sas(sc)) != 0)) {
 		mps_dprint(sc, MPS_INIT|MPS_FAULT, "failed to detach "
 		    "subsystems, exit\n");
 		return (error);
 	}
 
 	mps_detach_user(sc);
 
 	/* Put the IOC back in the READY state. */
 	mps_lock(sc);
 	if ((error = mps_transition_ready(sc)) != 0) {
 		mps_unlock(sc);
 		return (error);
 	}
 	mps_unlock(sc);
 
 	if (sc->facts != NULL)
 		free(sc->facts, M_MPT2);
 
 	/*
 	 * Free all buffers that are based on IOC Facts.  A Diag Reset may need
 	 * to free these buffers too.
 	 */
 	mps_iocfacts_free(sc);
 
 	if (sc->sysctl_tree != NULL)
 		sysctl_ctx_free(&sc->sysctl_ctx);
 
 	/* Deregister the shutdown function */
 	if (sc->shutdown_eh != NULL)
 		EVENTHANDLER_DEREGISTER(shutdown_final, sc->shutdown_eh);
 
 	mtx_destroy(&sc->mps_mtx);
 	mps_dprint(sc, MPS_INIT, "%s exit\n", __func__);
 
 	return (0);
 }
 
 static __inline void
 mps_complete_command(struct mps_softc *sc, struct mps_command *cm)
 {
 	MPS_FUNCTRACE(sc);
 
 	if (cm == NULL) {
 		mps_dprint(sc, MPS_ERROR, "Completing NULL command\n");
 		return;
 	}
 
 	if (cm->cm_flags & MPS_CM_FLAGS_POLLED)
 		cm->cm_flags |= MPS_CM_FLAGS_COMPLETE;
 
 	if (cm->cm_complete != NULL) {
 		mps_dprint(sc, MPS_TRACE,
 			   "%s cm %p calling cm_complete %p data %p reply %p\n",
 			   __func__, cm, cm->cm_complete, cm->cm_complete_data,
 			   cm->cm_reply);
 		cm->cm_complete(sc, cm);
 	}
 
 	if (cm->cm_flags & MPS_CM_FLAGS_WAKEUP) {
 		mps_dprint(sc, MPS_TRACE, "waking up %p\n", cm);
 		wakeup(cm);
 	}
 
 	if (cm->cm_sc->io_cmds_active != 0) {
 		cm->cm_sc->io_cmds_active--;
 	} else {
 		mps_dprint(sc, MPS_ERROR, "Warning: io_cmds_active is "
 		    "out of sync - resynching to 0\n");
 	}
 }
 
 static void
 mps_sas_log_info(struct mps_softc *sc , u32 log_info)
 {
 	union loginfo_type {
 		u32     loginfo;
 		struct {
 			u32     subcode:16;
 			u32     code:8;
 			u32     originator:4;
 			u32     bus_type:4;
 		} dw;
 	};
 	union loginfo_type sas_loginfo;
 	char *originator_str = NULL;
 
 	sas_loginfo.loginfo = log_info;
 	if (sas_loginfo.dw.bus_type != 3 /*SAS*/)
 		return;
 
 	/* each nexus loss loginfo */
 	if (log_info == 0x31170000)
 		return;
 
 	/* eat the loginfos associated with task aborts */
 	if ((log_info == 30050000 || log_info ==
 	    0x31140000 || log_info == 0x31130000))
 		return;
 
 	switch (sas_loginfo.dw.originator) {
 	case 0:
 		originator_str = "IOP";
 		break;
 	case 1:
 		originator_str = "PL";
 		break;
 	case 2:
 		originator_str = "IR";
 		break;
 }
 
 	mps_dprint(sc, MPS_LOG, "log_info(0x%08x): originator(%s), "
 	"code(0x%02x), sub_code(0x%04x)\n", log_info,
 	originator_str, sas_loginfo.dw.code,
 	sas_loginfo.dw.subcode);
 }
 
 static void
 mps_display_reply_info(struct mps_softc *sc, uint8_t *reply)
 {
 	MPI2DefaultReply_t *mpi_reply;
 	u16 sc_status;
 
 	mpi_reply = (MPI2DefaultReply_t*)reply;
 	sc_status = le16toh(mpi_reply->IOCStatus);
 	if (sc_status & MPI2_IOCSTATUS_FLAG_LOG_INFO_AVAILABLE)
 		mps_sas_log_info(sc, le32toh(mpi_reply->IOCLogInfo));
 }
 void
 mps_intr(void *data)
 {
 	struct mps_softc *sc;
 	uint32_t status;
 
 	sc = (struct mps_softc *)data;
 	mps_dprint(sc, MPS_TRACE, "%s\n", __func__);
 
 	/*
 	 * Check interrupt status register to flush the bus.  This is
 	 * needed for both INTx interrupts and driver-driven polling
 	 */
 	status = mps_regread(sc, MPI2_HOST_INTERRUPT_STATUS_OFFSET);
 	if ((status & MPI2_HIS_REPLY_DESCRIPTOR_INTERRUPT) == 0)
 		return;
 
 	mps_lock(sc);
 	mps_intr_locked(data);
 	mps_unlock(sc);
 	return;
 }
 
 /*
  * In theory, MSI/MSIX interrupts shouldn't need to read any registers on the
  * chip.  Hopefully this theory is correct.
  */
 void
 mps_intr_msi(void *data)
 {
 	struct mps_softc *sc;
 
 	sc = (struct mps_softc *)data;
 	mps_dprint(sc, MPS_TRACE, "%s\n", __func__);
 	mps_lock(sc);
 	mps_intr_locked(data);
 	mps_unlock(sc);
 	return;
 }
 
 /*
  * The locking is overly broad and simplistic, but easy to deal with for now.
  */
 void
 mps_intr_locked(void *data)
 {
 	MPI2_REPLY_DESCRIPTORS_UNION *desc;
 	MPI2_DIAG_RELEASE_REPLY *rel_rep;
 	mps_fw_diagnostic_buffer_t *pBuffer;
 	struct mps_softc *sc;
 	struct mps_command *cm = NULL;
 	uint64_t tdesc;
 	uint8_t flags;
 	u_int pq;
 
 	sc = (struct mps_softc *)data;
 
 	pq = sc->replypostindex;
 	mps_dprint(sc, MPS_TRACE,
 	    "%s sc %p starting with replypostindex %u\n", 
 	    __func__, sc, sc->replypostindex);
 
 	for ( ;; ) {
 		cm = NULL;
 		desc = &sc->post_queue[sc->replypostindex];
 
 		/*
 		 * Copy and clear out the descriptor so that any reentry will
 		 * immediately know that this descriptor has already been
 		 * looked at.  There is unfortunate casting magic because the
 		 * MPI API doesn't have a cardinal 64bit type.
 		 */
 		tdesc = 0xffffffffffffffff;
 		tdesc = atomic_swap_64((uint64_t *)desc, tdesc);
 		desc = (MPI2_REPLY_DESCRIPTORS_UNION *)&tdesc;
 
 		flags = desc->Default.ReplyFlags &
 		    MPI2_RPY_DESCRIPT_FLAGS_TYPE_MASK;
 		if ((flags == MPI2_RPY_DESCRIPT_FLAGS_UNUSED)
 		 || (le32toh(desc->Words.High) == 0xffffffff))
 			break;
 
 		/* increment the replypostindex now, so that event handlers
 		 * and cm completion handlers which decide to do a diag
 		 * reset can zero it without it getting incremented again
 		 * afterwards, and we break out of this loop on the next
 		 * iteration since the reply post queue has been cleared to
 		 * 0xFF and all descriptors look unused (which they are).
 		 */
 		if (++sc->replypostindex >= sc->pqdepth)
 			sc->replypostindex = 0;
 
 		switch (flags) {
 		case MPI2_RPY_DESCRIPT_FLAGS_SCSI_IO_SUCCESS:
 			cm = &sc->commands[le16toh(desc->SCSIIOSuccess.SMID)];
 			KASSERT(cm->cm_state == MPS_CM_STATE_INQUEUE,
 			    ("command not inqueue\n"));
 			cm->cm_state = MPS_CM_STATE_BUSY;
 			cm->cm_reply = NULL;
 			break;
 		case MPI2_RPY_DESCRIPT_FLAGS_ADDRESS_REPLY:
 		{
 			uint32_t baddr;
 			uint8_t *reply;
 
 			/*
 			 * Re-compose the reply address from the address
 			 * sent back from the chip.  The ReplyFrameAddress
 			 * is the lower 32 bits of the physical address of
 			 * particular reply frame.  Convert that address to
 			 * host format, and then use that to provide the
 			 * offset against the virtual address base
 			 * (sc->reply_frames).
 			 */
 			baddr = le32toh(desc->AddressReply.ReplyFrameAddress);
 			reply = sc->reply_frames +
 				(baddr - ((uint32_t)sc->reply_busaddr));
 			/*
 			 * Make sure the reply we got back is in a valid
 			 * range.  If not, go ahead and panic here, since
 			 * we'll probably panic as soon as we deference the
 			 * reply pointer anyway.
 			 */
 			if ((reply < sc->reply_frames)
 			 || (reply > (sc->reply_frames +
 			     (sc->fqdepth * sc->replyframesz)))) {
 				printf("%s: WARNING: reply %p out of range!\n",
 				       __func__, reply);
 				printf("%s: reply_frames %p, fqdepth %d, "
 				       "frame size %d\n", __func__,
 				       sc->reply_frames, sc->fqdepth,
 				       sc->replyframesz);
 				printf("%s: baddr %#x,\n", __func__, baddr);
 				/* LSI-TODO. See Linux Code for Graceful exit */
 				panic("Reply address out of range");
 			}
 			if (le16toh(desc->AddressReply.SMID) == 0) {
 				if (((MPI2_DEFAULT_REPLY *)reply)->Function ==
 				    MPI2_FUNCTION_DIAG_BUFFER_POST) {
 					/*
 					 * If SMID is 0 for Diag Buffer Post,
 					 * this implies that the reply is due to
 					 * a release function with a status that
 					 * the buffer has been released.  Set
 					 * the buffer flags accordingly.
 					 */
 					rel_rep =
 					    (MPI2_DIAG_RELEASE_REPLY *)reply;
 					if ((le16toh(rel_rep->IOCStatus) &
 					    MPI2_IOCSTATUS_MASK) ==
 					    MPI2_IOCSTATUS_DIAGNOSTIC_RELEASED)
 					{
 						pBuffer =
 						    &sc->fw_diag_buffer_list[
 						    rel_rep->BufferType];
 						pBuffer->valid_data = TRUE;
 						pBuffer->owned_by_firmware =
 						    FALSE;
 						pBuffer->immediate = FALSE;
 					}
 				} else
 					mps_dispatch_event(sc, baddr,
 					    (MPI2_EVENT_NOTIFICATION_REPLY *)
 					    reply);
 			} else {
 				/*
 				 * Ignore commands not in INQUEUE state
 				 * since they've already been completed
 				 * via another path.
 				 */
 				cm = &sc->commands[
 				    le16toh(desc->AddressReply.SMID)];
 				if (cm->cm_state == MPS_CM_STATE_INQUEUE) {
 					cm->cm_state = MPS_CM_STATE_BUSY;
 					cm->cm_reply = reply;
 					cm->cm_reply_data = le32toh(
 					    desc->AddressReply.ReplyFrameAddress);
 				} else {
 					mps_dprint(sc, MPS_RECOVERY,
 					    "Bad state for ADDRESS_REPLY status,"
 					    " ignoring state %d cm %p\n",
 					    cm->cm_state, cm);
 				}
 			}
 			break;
 		}
 		case MPI2_RPY_DESCRIPT_FLAGS_TARGETASSIST_SUCCESS:
 		case MPI2_RPY_DESCRIPT_FLAGS_TARGET_COMMAND_BUFFER:
 		case MPI2_RPY_DESCRIPT_FLAGS_RAID_ACCELERATOR_SUCCESS:
 		default:
 			/* Unhandled */
 			mps_dprint(sc, MPS_ERROR, "Unhandled reply 0x%x\n",
 			    desc->Default.ReplyFlags);
 			cm = NULL;
 			break;
 		}
 		
 
 		if (cm != NULL) {
 			// Print Error reply frame
 			if (cm->cm_reply)
 				mps_display_reply_info(sc,cm->cm_reply);
 			mps_complete_command(sc, cm);
 		}
 	}
 
 	if (pq != sc->replypostindex) {
 		mps_dprint(sc, MPS_TRACE, "%s sc %p writing postindex %d\n",
 		    __func__, sc, sc->replypostindex);
 		mps_regwrite(sc, MPI2_REPLY_POST_HOST_INDEX_OFFSET,
 		    sc->replypostindex);
 	}
 
 	return;
 }
 
 static void
 mps_dispatch_event(struct mps_softc *sc, uintptr_t data,
     MPI2_EVENT_NOTIFICATION_REPLY *reply)
 {
 	struct mps_event_handle *eh;
 	int event, handled = 0;
 
 	event = le16toh(reply->Event);
 	TAILQ_FOREACH(eh, &sc->event_list, eh_list) {
 		if (isset(eh->mask, event)) {
 			eh->callback(sc, data, reply);
 			handled++;
 		}
 	}
 
 	if (handled == 0)
 		mps_dprint(sc, MPS_EVENT, "Unhandled event 0x%x\n", le16toh(event));
 
 	/*
 	 * This is the only place that the event/reply should be freed.
 	 * Anything wanting to hold onto the event data should have
 	 * already copied it into their own storage.
 	 */
 	mps_free_reply(sc, data);
 }
 
 static void
 mps_reregister_events_complete(struct mps_softc *sc, struct mps_command *cm)
 {
 	mps_dprint(sc, MPS_TRACE, "%s\n", __func__);
 
 	if (cm->cm_reply)
 		MPS_DPRINT_EVENT(sc, generic,
 			(MPI2_EVENT_NOTIFICATION_REPLY *)cm->cm_reply);
 
 	mps_free_command(sc, cm);
 
 	/* next, send a port enable */
 	mpssas_startup(sc);
 }
 
 /*
  * For both register_events and update_events, the caller supplies a bitmap
  * of events that it _wants_.  These functions then turn that into a bitmask
  * suitable for the controller.
  */
 int
 mps_register_events(struct mps_softc *sc, u32 *mask,
     mps_evt_callback_t *cb, void *data, struct mps_event_handle **handle)
 {
 	struct mps_event_handle *eh;
 	int error = 0;
 
 	eh = malloc(sizeof(struct mps_event_handle), M_MPT2, M_WAITOK|M_ZERO);
 	eh->callback = cb;
 	eh->data = data;
 	TAILQ_INSERT_TAIL(&sc->event_list, eh, eh_list);
 	if (mask != NULL)
 		error = mps_update_events(sc, eh, mask);
 	*handle = eh;
 
 	return (error);
 }
 
 int
 mps_update_events(struct mps_softc *sc, struct mps_event_handle *handle,
     u32 *mask)
 {
 	MPI2_EVENT_NOTIFICATION_REQUEST *evtreq;
 	MPI2_EVENT_NOTIFICATION_REPLY *reply = NULL;
 	struct mps_command *cm;
 	int error, i;
 
 	mps_dprint(sc, MPS_TRACE, "%s\n", __func__);
 
 	if ((mask != NULL) && (handle != NULL))
 		bcopy(mask, &handle->mask[0], sizeof(u32) * 
 				MPI2_EVENT_NOTIFY_EVENTMASK_WORDS);
     
 	for (i = 0; i < MPI2_EVENT_NOTIFY_EVENTMASK_WORDS; i++)
 		sc->event_mask[i] = -1;
 
 	for (i = 0; i < MPI2_EVENT_NOTIFY_EVENTMASK_WORDS; i++)
 		sc->event_mask[i] &= ~handle->mask[i];
 
 	if ((cm = mps_alloc_command(sc)) == NULL)
 		return (EBUSY);
 	evtreq = (MPI2_EVENT_NOTIFICATION_REQUEST *)cm->cm_req;
 	evtreq->Function = MPI2_FUNCTION_EVENT_NOTIFICATION;
 	evtreq->MsgFlags = 0;
 	evtreq->SASBroadcastPrimitiveMasks = 0;
 #ifdef MPS_DEBUG_ALL_EVENTS
 	{
 		u_char fullmask[16];
 		memset(fullmask, 0x00, 16);
 		bcopy(fullmask, &evtreq->EventMasks[0], sizeof(u32) * 
 				MPI2_EVENT_NOTIFY_EVENTMASK_WORDS);
 	}
 #else
         for (i = 0; i < MPI2_EVENT_NOTIFY_EVENTMASK_WORDS; i++)
                 evtreq->EventMasks[i] =
                     htole32(sc->event_mask[i]);
 #endif
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_data = NULL;
 
 	error = mps_wait_command(sc, &cm, 60, 0);
 	if (cm != NULL)
 		reply = (MPI2_EVENT_NOTIFICATION_REPLY *)cm->cm_reply;
 	if ((reply == NULL) ||
 	    (reply->IOCStatus & MPI2_IOCSTATUS_MASK) != MPI2_IOCSTATUS_SUCCESS)
 		error = ENXIO;
 
 	if (reply)
 		MPS_DPRINT_EVENT(sc, generic, reply);
 
 	mps_dprint(sc, MPS_TRACE, "%s finished error %d\n", __func__, error);
 
 	if (cm != NULL)
 		mps_free_command(sc, cm);
 	return (error);
 }
 
 static int
 mps_reregister_events(struct mps_softc *sc)
 {
 	MPI2_EVENT_NOTIFICATION_REQUEST *evtreq;
 	struct mps_command *cm;
 	struct mps_event_handle *eh;
 	int error, i;
 
 	mps_dprint(sc, MPS_TRACE, "%s\n", __func__);
 
 	/* first, reregister events */
 
 	for (i = 0; i < MPI2_EVENT_NOTIFY_EVENTMASK_WORDS; i++)
 		sc->event_mask[i] = -1;
 
 	TAILQ_FOREACH(eh, &sc->event_list, eh_list) {
 		for (i = 0; i < MPI2_EVENT_NOTIFY_EVENTMASK_WORDS; i++)
 			sc->event_mask[i] &= ~eh->mask[i];
 	}
 
 	if ((cm = mps_alloc_command(sc)) == NULL)
 		return (EBUSY);
 	evtreq = (MPI2_EVENT_NOTIFICATION_REQUEST *)cm->cm_req;
 	evtreq->Function = MPI2_FUNCTION_EVENT_NOTIFICATION;
 	evtreq->MsgFlags = 0;
 	evtreq->SASBroadcastPrimitiveMasks = 0;
 #ifdef MPS_DEBUG_ALL_EVENTS
 	{
 		u_char fullmask[16];
 		memset(fullmask, 0x00, 16);
 		bcopy(fullmask, &evtreq->EventMasks[0], sizeof(u32) *
 			MPI2_EVENT_NOTIFY_EVENTMASK_WORDS);
 	}
 #else
         for (i = 0; i < MPI2_EVENT_NOTIFY_EVENTMASK_WORDS; i++)
                 evtreq->EventMasks[i] =
                     htole32(sc->event_mask[i]);
 #endif
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_data = NULL;
 	cm->cm_complete = mps_reregister_events_complete;
 
 	error = mps_map_command(sc, cm);
 
 	mps_dprint(sc, MPS_TRACE, "%s finished with error %d\n", __func__,
 	    error);
 	return (error);
 }
 
 void
 mps_deregister_events(struct mps_softc *sc, struct mps_event_handle *handle)
 {
 
 	TAILQ_REMOVE(&sc->event_list, handle, eh_list);
 	free(handle, M_MPT2);
 }
 
 /*
  * Add a chain element as the next SGE for the specified command.
  * Reset cm_sge and cm_sgesize to indicate all the available space.
  */
 static int
 mps_add_chain(struct mps_command *cm)
 {
 	MPI2_SGE_CHAIN32 *sgc;
 	struct mps_chain *chain;
 	u_int space;
 
 	if (cm->cm_sglsize < MPS_SGC_SIZE)
 		panic("MPS: Need SGE Error Code\n");
 
 	chain = mps_alloc_chain(cm->cm_sc);
 	if (chain == NULL)
 		return (ENOBUFS);
 
 	space = cm->cm_sc->reqframesz;
 
 	/*
 	 * Note: a double-linked list is used to make it easier to
 	 * walk for debugging.
 	 */
 	TAILQ_INSERT_TAIL(&cm->cm_chain_list, chain, chain_link);
 
 	sgc = (MPI2_SGE_CHAIN32 *)&cm->cm_sge->MpiChain;
 	sgc->Length = htole16(space);
 	sgc->NextChainOffset = 0;
 	/* TODO Looks like bug in Setting sgc->Flags. 
 	 *	sgc->Flags = ( MPI2_SGE_FLAGS_CHAIN_ELEMENT | MPI2_SGE_FLAGS_64_BIT_ADDRESSING |
 	 *	            MPI2_SGE_FLAGS_SYSTEM_ADDRESS) << MPI2_SGE_FLAGS_SHIFT
 	 *	This is fine.. because we are not using simple element. In case of 
 	 *	MPI2_SGE_CHAIN32, we have separate Length and Flags feild.
  	 */
 	sgc->Flags = MPI2_SGE_FLAGS_CHAIN_ELEMENT;
 	sgc->Address = htole32(chain->chain_busaddr);
 
 	cm->cm_sge = (MPI2_SGE_IO_UNION *)&chain->chain->MpiSimple;
 	cm->cm_sglsize = space;
 	return (0);
 }
 
 /*
  * Add one scatter-gather element (chain, simple, transaction context)
  * to the scatter-gather list for a command.  Maintain cm_sglsize and
  * cm_sge as the remaining size and pointer to the next SGE to fill
  * in, respectively.
  */
 int
 mps_push_sge(struct mps_command *cm, void *sgep, size_t len, int segsleft)
 {
 	MPI2_SGE_TRANSACTION_UNION *tc = sgep;
 	MPI2_SGE_SIMPLE64 *sge = sgep;
 	int error, type;
 	uint32_t saved_buf_len, saved_address_low, saved_address_high;
 
 	type = (tc->Flags & MPI2_SGE_FLAGS_ELEMENT_MASK);
 
 #ifdef INVARIANTS
 	switch (type) {
 	case MPI2_SGE_FLAGS_TRANSACTION_ELEMENT: {
 		if (len != tc->DetailsLength + 4)
 			panic("TC %p length %u or %zu?", tc,
 			    tc->DetailsLength + 4, len);
 		}
 		break;
 	case MPI2_SGE_FLAGS_CHAIN_ELEMENT:
 		/* Driver only uses 32-bit chain elements */
 		if (len != MPS_SGC_SIZE)
 			panic("CHAIN %p length %u or %zu?", sgep,
 			    MPS_SGC_SIZE, len);
 		break;
 	case MPI2_SGE_FLAGS_SIMPLE_ELEMENT:
 		/* Driver only uses 64-bit SGE simple elements */
 		if (len != MPS_SGE64_SIZE)
 			panic("SGE simple %p length %u or %zu?", sge,
 			    MPS_SGE64_SIZE, len);
 		if (((le32toh(sge->FlagsLength) >> MPI2_SGE_FLAGS_SHIFT) &
 		    MPI2_SGE_FLAGS_ADDRESS_SIZE) == 0)
 			panic("SGE simple %p not marked 64-bit?", sge);
 
 		break;
 	default:
 		panic("Unexpected SGE %p, flags %02x", tc, tc->Flags);
 	}
 #endif
 
 	/*
 	 * case 1: 1 more segment, enough room for it
 	 * case 2: 2 more segments, enough room for both
 	 * case 3: >=2 more segments, only enough room for 1 and a chain
 	 * case 4: >=1 more segment, enough room for only a chain
 	 * case 5: >=1 more segment, no room for anything (error)
          */
 
 	/*
 	 * There should be room for at least a chain element, or this
 	 * code is buggy.  Case (5).
 	 */
 	if (cm->cm_sglsize < MPS_SGC_SIZE)
 		panic("MPS: Need SGE Error Code\n");
 
 	if (segsleft >= 1 && cm->cm_sglsize < len + MPS_SGC_SIZE) {
 		/*
 		 * 1 or more segment, enough room for only a chain.
 		 * Hope the previous element wasn't a Simple entry
 		 * that needed to be marked with
 		 * MPI2_SGE_FLAGS_LAST_ELEMENT.  Case (4).
 		 */
 		if ((error = mps_add_chain(cm)) != 0)
 			return (error);
 	}
 
 	if (segsleft >= 2 &&
 	    cm->cm_sglsize < len + MPS_SGC_SIZE + MPS_SGE64_SIZE) {
 		/*
 		 * There are 2 or more segments left to add, and only
 		 * enough room for 1 and a chain.  Case (3).
 		 *
 		 * Mark as last element in this chain if necessary.
 		 */
 		if (type == MPI2_SGE_FLAGS_SIMPLE_ELEMENT) {
 			sge->FlagsLength |= htole32(
 			    MPI2_SGE_FLAGS_LAST_ELEMENT << MPI2_SGE_FLAGS_SHIFT);
 		}
 
 		/*
 		 * Add the item then a chain.  Do the chain now,
 		 * rather than on the next iteration, to simplify
 		 * understanding the code.
 		 */
 		cm->cm_sglsize -= len;
 		bcopy(sgep, cm->cm_sge, len);
 		cm->cm_sge = (MPI2_SGE_IO_UNION *)((uintptr_t)cm->cm_sge + len);
 		return (mps_add_chain(cm));
 	}
 
 #ifdef INVARIANTS
 	/* Case 1: 1 more segment, enough room for it. */
 	if (segsleft == 1 && cm->cm_sglsize < len)
 		panic("1 seg left and no room? %u versus %zu",
 		    cm->cm_sglsize, len);
 
 	/* Case 2: 2 more segments, enough room for both */
 	if (segsleft == 2 && cm->cm_sglsize < len + MPS_SGE64_SIZE)
 		panic("2 segs left and no room? %u versus %zu",
 		    cm->cm_sglsize, len);
 #endif
 
 	if (segsleft == 1 && type == MPI2_SGE_FLAGS_SIMPLE_ELEMENT) {
 		/*
 		 * If this is a bi-directional request, need to account for that
 		 * here.  Save the pre-filled sge values.  These will be used
 		 * either for the 2nd SGL or for a single direction SGL.  If
 		 * cm_out_len is non-zero, this is a bi-directional request, so
 		 * fill in the OUT SGL first, then the IN SGL, otherwise just
 		 * fill in the IN SGL.  Note that at this time, when filling in
 		 * 2 SGL's for a bi-directional request, they both use the same
 		 * DMA buffer (same cm command).
 		 */
 		saved_buf_len = le32toh(sge->FlagsLength) & 0x00FFFFFF;
 		saved_address_low = sge->Address.Low;
 		saved_address_high = sge->Address.High;
 		if (cm->cm_out_len) {
 			sge->FlagsLength = htole32(cm->cm_out_len |
 			    ((uint32_t)(MPI2_SGE_FLAGS_SIMPLE_ELEMENT |
 			    MPI2_SGE_FLAGS_END_OF_BUFFER |
 			    MPI2_SGE_FLAGS_HOST_TO_IOC |
 			    MPI2_SGE_FLAGS_64_BIT_ADDRESSING) <<
 			    MPI2_SGE_FLAGS_SHIFT));
 			cm->cm_sglsize -= len;
 			bcopy(sgep, cm->cm_sge, len);
 			cm->cm_sge = (MPI2_SGE_IO_UNION *)((uintptr_t)cm->cm_sge
 			    + len);
 		}
 		saved_buf_len |=
 		    ((uint32_t)(MPI2_SGE_FLAGS_SIMPLE_ELEMENT |
 		    MPI2_SGE_FLAGS_END_OF_BUFFER |
 		    MPI2_SGE_FLAGS_LAST_ELEMENT |
 		    MPI2_SGE_FLAGS_END_OF_LIST |
 		    MPI2_SGE_FLAGS_64_BIT_ADDRESSING) <<
 		    MPI2_SGE_FLAGS_SHIFT);
 		if (cm->cm_flags & MPS_CM_FLAGS_DATAIN) {
 			saved_buf_len |=
 			    ((uint32_t)(MPI2_SGE_FLAGS_IOC_TO_HOST) <<
 			    MPI2_SGE_FLAGS_SHIFT);
 		} else {
 			saved_buf_len |=
 			    ((uint32_t)(MPI2_SGE_FLAGS_HOST_TO_IOC) <<
 			    MPI2_SGE_FLAGS_SHIFT);
 		}
 		sge->FlagsLength = htole32(saved_buf_len);
 		sge->Address.Low = saved_address_low;
 		sge->Address.High = saved_address_high;
 	}
 
 	cm->cm_sglsize -= len;
 	bcopy(sgep, cm->cm_sge, len);
 	cm->cm_sge = (MPI2_SGE_IO_UNION *)((uintptr_t)cm->cm_sge + len);
 	return (0);
 }
 
 /*
  * Add one dma segment to the scatter-gather list for a command.
  */
 int
 mps_add_dmaseg(struct mps_command *cm, vm_paddr_t pa, size_t len, u_int flags,
     int segsleft)
 {
 	MPI2_SGE_SIMPLE64 sge;
 
 	/*
 	 * This driver always uses 64-bit address elements for simplicity.
 	 */
 	bzero(&sge, sizeof(sge));
 	flags |= MPI2_SGE_FLAGS_SIMPLE_ELEMENT |
 	    MPI2_SGE_FLAGS_64_BIT_ADDRESSING;
 	sge.FlagsLength = htole32(len | (flags << MPI2_SGE_FLAGS_SHIFT));
 	mps_from_u64(pa, &sge.Address);
 
 	return (mps_push_sge(cm, &sge, sizeof sge, segsleft));
 }
 
 static void
 mps_data_cb(void *arg, bus_dma_segment_t *segs, int nsegs, int error)
 {
 	struct mps_softc *sc;
 	struct mps_command *cm;
 	u_int i, dir, sflags;
 
 	cm = (struct mps_command *)arg;
 	sc = cm->cm_sc;
 
 	/*
 	 * In this case, just print out a warning and let the chip tell the
 	 * user they did the wrong thing.
 	 */
 	if ((cm->cm_max_segs != 0) && (nsegs > cm->cm_max_segs)) {
 		mps_dprint(sc, MPS_ERROR,
 			   "%s: warning: busdma returned %d segments, "
 			   "more than the %d allowed\n", __func__, nsegs,
 			   cm->cm_max_segs);
 	}
 
 	/*
 	 * Set up DMA direction flags.  Bi-directional requests are also handled
 	 * here.  In that case, both direction flags will be set.
 	 */
 	sflags = 0;
 	if (cm->cm_flags & MPS_CM_FLAGS_SMP_PASS) {
 		/*
 		 * We have to add a special case for SMP passthrough, there
 		 * is no easy way to generically handle it.  The first
 		 * S/G element is used for the command (therefore the
 		 * direction bit needs to be set).  The second one is used
 		 * for the reply.  We'll leave it to the caller to make
 		 * sure we only have two buffers.
 		 */
 		/*
 		 * Even though the busdma man page says it doesn't make
 		 * sense to have both direction flags, it does in this case.
 		 * We have one s/g element being accessed in each direction.
 		 */
 		dir = BUS_DMASYNC_PREWRITE | BUS_DMASYNC_PREREAD;
 
 		/*
 		 * Set the direction flag on the first buffer in the SMP
 		 * passthrough request.  We'll clear it for the second one.
 		 */
 		sflags |= MPI2_SGE_FLAGS_DIRECTION |
 			  MPI2_SGE_FLAGS_END_OF_BUFFER;
 	} else if (cm->cm_flags & MPS_CM_FLAGS_DATAOUT) {
 		sflags |= MPI2_SGE_FLAGS_HOST_TO_IOC;
 		dir = BUS_DMASYNC_PREWRITE;
 	} else
 		dir = BUS_DMASYNC_PREREAD;
 
 	for (i = 0; i < nsegs; i++) {
 		if ((cm->cm_flags & MPS_CM_FLAGS_SMP_PASS) && (i != 0)) {
 			sflags &= ~MPI2_SGE_FLAGS_DIRECTION;
 		}
 		error = mps_add_dmaseg(cm, segs[i].ds_addr, segs[i].ds_len,
 		    sflags, nsegs - i);
 		if (error != 0) {
 			/* Resource shortage, roll back! */
 			if (ratecheck(&sc->lastfail, &mps_chainfail_interval))
 				mps_dprint(sc, MPS_INFO, "Out of chain frames, "
 				    "consider increasing hw.mps.max_chains.\n");
 			cm->cm_flags |= MPS_CM_FLAGS_CHAIN_FAILED;
 			mps_complete_command(sc, cm);
 			return;
 		}
 	}
 
 	bus_dmamap_sync(sc->buffer_dmat, cm->cm_dmamap, dir);
 	mps_enqueue_request(sc, cm);
 
 	return;
 }
 
 static void
 mps_data_cb2(void *arg, bus_dma_segment_t *segs, int nsegs, bus_size_t mapsize,
 	     int error)
 {
 	mps_data_cb(arg, segs, nsegs, error);
 }
 
 /*
  * This is the routine to enqueue commands ansynchronously.
  * Note that the only error path here is from bus_dmamap_load(), which can
  * return EINPROGRESS if it is waiting for resources.  Other than this, it's
  * assumed that if you have a command in-hand, then you have enough credits
  * to use it.
  */
 int
 mps_map_command(struct mps_softc *sc, struct mps_command *cm)
 {
 	int error = 0;
 
 	if (cm->cm_flags & MPS_CM_FLAGS_USE_UIO) {
 		error = bus_dmamap_load_uio(sc->buffer_dmat, cm->cm_dmamap,
 		    &cm->cm_uio, mps_data_cb2, cm, 0);
 	} else if (cm->cm_flags & MPS_CM_FLAGS_USE_CCB) {
 		error = bus_dmamap_load_ccb(sc->buffer_dmat, cm->cm_dmamap,
 		    cm->cm_data, mps_data_cb, cm, 0);
 	} else if ((cm->cm_data != NULL) && (cm->cm_length != 0)) {
 		error = bus_dmamap_load(sc->buffer_dmat, cm->cm_dmamap,
 		    cm->cm_data, cm->cm_length, mps_data_cb, cm, 0);
 	} else {
 		/* Add a zero-length element as needed */
 		if (cm->cm_sge != NULL)
 			mps_add_dmaseg(cm, 0, 0, 0, 1);
 		mps_enqueue_request(sc, cm);	
 	}
 
 	return (error);
 }
 
 /*
  * This is the routine to enqueue commands synchronously.  An error of
  * EINPROGRESS from mps_map_command() is ignored since the command will
  * be executed and enqueued automatically.  Other errors come from msleep().
  */
 int
 mps_wait_command(struct mps_softc *sc, struct mps_command **cmp, int timeout,
     int sleep_flag)
 {
 	int error, rc;
 	struct timeval cur_time, start_time;
 	struct mps_command *cm = *cmp;
 
 	if (sc->mps_flags & MPS_FLAGS_DIAGRESET) 
 		return  EBUSY;
 
 	cm->cm_complete = NULL;
 	cm->cm_flags |= MPS_CM_FLAGS_POLLED;
 	error = mps_map_command(sc, cm);
 	if ((error != 0) && (error != EINPROGRESS))
 		return (error);
 
 	/*
 	 * Check for context and wait for 50 mSec at a time until time has
 	 * expired or the command has finished.  If msleep can't be used, need
 	 * to poll.
 	 */
 	if (curthread->td_no_sleeping != 0)
 		sleep_flag = NO_SLEEP;
 	getmicrouptime(&start_time);
 	if (mtx_owned(&sc->mps_mtx) && sleep_flag == CAN_SLEEP) {
 		cm->cm_flags |= MPS_CM_FLAGS_WAKEUP;
 		error = msleep(cm, &sc->mps_mtx, 0, "mpswait", timeout*hz);
 		if (error == EWOULDBLOCK) {
 			/*
 			 * Record the actual elapsed time in the case of a
 			 * timeout for the message below.
 			 */
 			getmicrouptime(&cur_time);
 			timevalsub(&cur_time, &start_time);
 		}
 	} else {
 		while ((cm->cm_flags & MPS_CM_FLAGS_COMPLETE) == 0) {
 			mps_intr_locked(sc);
 			if (sleep_flag == CAN_SLEEP)
 				pause("mpswait", hz/20);
 			else
 				DELAY(50000);
 		
 			getmicrouptime(&cur_time);
 			timevalsub(&cur_time, &start_time);
 			if (cur_time.tv_sec > timeout) {
 				error = EWOULDBLOCK;
 				break;
 			}
 		}
 	}
 
 	if (error == EWOULDBLOCK) {
 		if (cm->cm_timeout_handler == NULL) {
 			mps_dprint(sc, MPS_FAULT, "Calling Reinit from %s, timeout=%d,"
 			    " elapsed=%jd\n", __func__, timeout,
 			    (intmax_t)cur_time.tv_sec);
 			rc = mps_reinit(sc);
 			mps_dprint(sc, MPS_FAULT, "Reinit %s\n", (rc == 0) ? "success" :
 			    "failed");
 		} else
 			cm->cm_timeout_handler(sc, cm);
 		if (sc->mps_flags & MPS_FLAGS_REALLOCATED) {
 			/*
 			 * Tell the caller that we freed the command in a
 			 * reinit.
 			 */
 			*cmp = NULL;
 		}
 		error = ETIMEDOUT;
 	}
 	return (error);
 }
 
 /*
  * The MPT driver had a verbose interface for config pages.  In this driver,
  * reduce it to much simpler terms, similar to the Linux driver.
  */
 int
 mps_read_config_page(struct mps_softc *sc, struct mps_config_params *params)
 {
 	MPI2_CONFIG_REQUEST *req;
 	struct mps_command *cm;
 	int error;
 
 	if (sc->mps_flags & MPS_FLAGS_BUSY) {
 		return (EBUSY);
 	}
 
 	cm = mps_alloc_command(sc);
 	if (cm == NULL) {
 		return (EBUSY);
 	}
 
 	req = (MPI2_CONFIG_REQUEST *)cm->cm_req;
 	req->Function = MPI2_FUNCTION_CONFIG;
 	req->Action = params->action;
 	req->SGLFlags = 0;
 	req->ChainOffset = 0;
 	req->PageAddress = params->page_address;
 	if (params->hdr.Struct.PageType == MPI2_CONFIG_PAGETYPE_EXTENDED) {
 		MPI2_CONFIG_EXTENDED_PAGE_HEADER *hdr;
 
 		hdr = &params->hdr.Ext;
 		req->ExtPageType = hdr->ExtPageType;
 		req->ExtPageLength = hdr->ExtPageLength;
 		req->Header.PageType = MPI2_CONFIG_PAGETYPE_EXTENDED;
 		req->Header.PageLength = 0; /* Must be set to zero */
 		req->Header.PageNumber = hdr->PageNumber;
 		req->Header.PageVersion = hdr->PageVersion;
 	} else {
 		MPI2_CONFIG_PAGE_HEADER *hdr;
 
 		hdr = &params->hdr.Struct;
 		req->Header.PageType = hdr->PageType;
 		req->Header.PageNumber = hdr->PageNumber;
 		req->Header.PageLength = hdr->PageLength;
 		req->Header.PageVersion = hdr->PageVersion;
 	}
 
 	cm->cm_data = params->buffer;
 	cm->cm_length = params->length;
 	if (cm->cm_data != NULL) {
 		cm->cm_sge = &req->PageBufferSGE;
 		cm->cm_sglsize = sizeof(MPI2_SGE_IO_UNION);
 		cm->cm_flags = MPS_CM_FLAGS_SGE_SIMPLE | MPS_CM_FLAGS_DATAIN;
 	} else
 		cm->cm_sge = NULL;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 
 	cm->cm_complete_data = params;
 	if (params->callback != NULL) {
 		cm->cm_complete = mps_config_complete;
 		return (mps_map_command(sc, cm));
 	} else {
 		error = mps_wait_command(sc, &cm, 0, CAN_SLEEP);
 		if (error) {
 			mps_dprint(sc, MPS_FAULT,
 			    "Error %d reading config page\n", error);
 			if (cm != NULL)
 				mps_free_command(sc, cm);
 			return (error);
 		}
 		mps_config_complete(sc, cm);
 	}
 
 	return (0);
 }
 
 int
 mps_write_config_page(struct mps_softc *sc, struct mps_config_params *params)
 {
 	return (EINVAL);
 }
 
 static void
 mps_config_complete(struct mps_softc *sc, struct mps_command *cm)
 {
 	MPI2_CONFIG_REPLY *reply;
 	struct mps_config_params *params;
 
 	MPS_FUNCTRACE(sc);
 	params = cm->cm_complete_data;
 
 	if (cm->cm_data != NULL) {
 		bus_dmamap_sync(sc->buffer_dmat, cm->cm_dmamap,
 		    BUS_DMASYNC_POSTREAD);
 		bus_dmamap_unload(sc->buffer_dmat, cm->cm_dmamap);
 	}
 
 	/*
 	 * XXX KDM need to do more error recovery?  This results in the
 	 * device in question not getting probed.
 	 */
 	if ((cm->cm_flags & MPS_CM_FLAGS_ERROR_MASK) != 0) {
 		params->status = MPI2_IOCSTATUS_BUSY;
 		goto done;
 	}
 
 	reply = (MPI2_CONFIG_REPLY *)cm->cm_reply;
 	if (reply == NULL) {
 		params->status = MPI2_IOCSTATUS_BUSY;
 		goto done;
 	}
 	params->status = reply->IOCStatus;
 	if (params->hdr.Struct.PageType == MPI2_CONFIG_PAGETYPE_EXTENDED) {
 		params->hdr.Ext.ExtPageType = reply->ExtPageType;
 		params->hdr.Ext.ExtPageLength = reply->ExtPageLength;
 		params->hdr.Ext.PageType = reply->Header.PageType;
 		params->hdr.Ext.PageNumber = reply->Header.PageNumber;
 		params->hdr.Ext.PageVersion = reply->Header.PageVersion;
 	} else {
 		params->hdr.Struct.PageType = reply->Header.PageType;
 		params->hdr.Struct.PageNumber = reply->Header.PageNumber;
 		params->hdr.Struct.PageLength = reply->Header.PageLength;
 		params->hdr.Struct.PageVersion = reply->Header.PageVersion;
 	}
 
 done:
 	mps_free_command(sc, cm);
 	if (params->callback != NULL)
 		params->callback(sc, params);
 
 	return;
 }
Index: head/sys/dev/mps/mps_pci.c
===================================================================
--- head/sys/dev/mps/mps_pci.c	(revision 365705)
+++ head/sys/dev/mps/mps_pci.c	(revision 365706)
@@ -1,436 +1,436 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 2009 Yahoo! Inc.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 /* PCI/PCI-X/PCIe bus interface for the Avago Tech (LSI) MPT2 controllers */
 
 /* TODO Move headers to mpsvar */
 #include <sys/types.h>
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/module.h>
 #include <sys/bus.h>
 #include <sys/conf.h>
 #include <sys/malloc.h>
 #include <sys/sysctl.h>
 #include <sys/uio.h>
 
 #include <machine/bus.h>
 #include <machine/resource.h>
 #include <sys/rman.h>
 
 #include <dev/pci/pcireg.h>
 #include <dev/pci/pcivar.h>
 #include <dev/pci/pci_private.h>
 
 #include <dev/mps/mpi/mpi2_type.h>
 #include <dev/mps/mpi/mpi2.h>
 #include <dev/mps/mpi/mpi2_ioc.h>
 #include <dev/mps/mpi/mpi2_cnfg.h>
 #include <dev/mps/mpi/mpi2_tool.h>
 
 #include <sys/queue.h>
 #include <sys/kthread.h>
 #include <dev/mps/mps_ioctl.h>
 #include <dev/mps/mpsvar.h>
 
 static int	mps_pci_probe(device_t);
 static int	mps_pci_attach(device_t);
 static int	mps_pci_detach(device_t);
 static int	mps_pci_suspend(device_t);
 static int	mps_pci_resume(device_t);
 static void	mps_pci_free(struct mps_softc *);
 static int	mps_alloc_msix(struct mps_softc *sc, int msgs);
 static int	mps_alloc_msi(struct mps_softc *sc, int msgs);
 static int	mps_pci_alloc_interrupts(struct mps_softc *sc);
 
 static device_method_t mps_methods[] = {
 	DEVMETHOD(device_probe,		mps_pci_probe),
 	DEVMETHOD(device_attach,	mps_pci_attach),
 	DEVMETHOD(device_detach,	mps_pci_detach),
 	DEVMETHOD(device_suspend,	mps_pci_suspend),
 	DEVMETHOD(device_resume,	mps_pci_resume),
 
 	DEVMETHOD_END
 };
 
 static driver_t mps_pci_driver = {
 	"mps",
 	mps_methods,
 	sizeof(struct mps_softc)
 };
 
 struct mps_ident {
 	uint16_t	vendor;
 	uint16_t	device;
 	uint16_t	subvendor;
 	uint16_t	subdevice;
 	u_int		flags;
 	const char	*desc;
 } mps_identifiers[] = {
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2004,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2004" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2008,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2008" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2108_1,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2108" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2108_2,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2108" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2108_3,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2108" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2116_1,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2116" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2116_2,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2116" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2208_1,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2208" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2208_2,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2208" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2208_3,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2208" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2208_4,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2208" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2208_5,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2208" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2208_6,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2208" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2308_1,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2308" },
 	// Add Customer specific vender/subdevice id before generic
 	// (0xffff) vender/subdevice id.
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2308_2,
 	    0x8086, 0x3516, 0, "Intel(R) Integrated RAID Module RMS25JB080" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2308_2,
 	    0x8086, 0x3517, 0, "Intel(R) Integrated RAID Module RMS25JB040" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2308_2,
 	    0x8086, 0x3518, 0, "Intel(R) Integrated RAID Module RMS25KB080" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2308_2,
 	    0x8086, 0x3519, 0, "Intel(R) Integrated RAID Module RMS25KB040" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2308_2,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2308" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SAS2308_3,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SAS2308" },
 	{ MPI2_MFGPAGE_VENDORID_LSI, MPI2_MFGPAGE_DEVID_SSS6200,
 	    0xffff, 0xffff, 0, "Avago Technologies (LSI) SSS6200" },
 	{ 0, 0, 0, 0, 0, NULL }
 };
 
 static devclass_t	mps_devclass;
 DRIVER_MODULE(mps, pci, mps_pci_driver, mps_devclass, 0, 0);
 MODULE_DEPEND(mps, cam, 1, 1, 1);
 MODULE_PNP_INFO("U16:vendor;U16:device;U16:subvendor;U16:subdevice", pci, mps,
     mps_identifiers, nitems(mps_identifiers) - 1);
 static struct mps_ident *
 mps_find_ident(device_t dev)
 {
 	struct mps_ident *m;
 
 	for (m = mps_identifiers; m->vendor != 0; m++) {
 		if (m->vendor != pci_get_vendor(dev))
 			continue;
 		if (m->device != pci_get_device(dev))
 			continue;
 		if ((m->subvendor != 0xffff) &&
 		    (m->subvendor != pci_get_subvendor(dev)))
 			continue;
 		if ((m->subdevice != 0xffff) &&
 		    (m->subdevice != pci_get_subdevice(dev)))
 			continue;
 		return (m);
 	}
 
 	return (NULL);
 }
 
 static int
 mps_pci_probe(device_t dev)
 {
 	struct mps_ident *id;
 
 	if ((id = mps_find_ident(dev)) != NULL) {
 		device_set_desc(dev, id->desc);
 		return (BUS_PROBE_DEFAULT);
 	}
 	return (ENXIO);
 }
 
 static int
 mps_pci_attach(device_t dev)
 {
-	bus_dma_tag_template_t t;
+	bus_dma_template_t t;
 	struct mps_softc *sc;
 	struct mps_ident *m;
 	int error;
 
 	sc = device_get_softc(dev);
 	bzero(sc, sizeof(*sc));
 	sc->mps_dev = dev;
 	m = mps_find_ident(dev);
 	sc->mps_flags = m->flags;
 
 	mps_get_tunables(sc);
 
 	/* Twiddle basic PCI config bits for a sanity check */
 	pci_enable_busmaster(dev);
 
 	/* Allocate the System Interface Register Set */
 	sc->mps_regs_rid = PCIR_BAR(1);
 	if ((sc->mps_regs_resource = bus_alloc_resource_any(dev,
 	    SYS_RES_MEMORY, &sc->mps_regs_rid, RF_ACTIVE)) == NULL) {
 		mps_printf(sc, "Cannot allocate PCI registers\n");
 		return (ENXIO);
 	}
 	sc->mps_btag = rman_get_bustag(sc->mps_regs_resource);
 	sc->mps_bhandle = rman_get_bushandle(sc->mps_regs_resource);
 
 	/* Allocate the parent DMA tag */
 	bus_dma_template_init(&t, bus_get_dma_tag(dev));
 	if (bus_dma_template_tag(&t, &sc->mps_parent_dmat)) {
 		mps_printf(sc, "Cannot allocate parent DMA tag\n");
 		mps_pci_free(sc);
 		return (ENOMEM);
 	}
 
 	if (((error = mps_pci_alloc_interrupts(sc)) != 0) ||
 	    ((error = mps_attach(sc)) != 0))
 		mps_pci_free(sc);
 
 	return (error);
 }
 
 /*
  * Allocate, but don't assign interrupts early.  Doing it before requesting
  * the IOCFacts message informs the firmware that we want to do MSI-X
  * multiqueue.  We might not use all of the available messages, but there's
  * no reason to re-alloc if we don't.
  */
 static int
 mps_pci_alloc_interrupts(struct mps_softc *sc)
 {
 	device_t dev;
 	int error, msgs;
 
 	dev = sc->mps_dev;
 	error = 0;
 	msgs = 0;
 
 	if (sc->disable_msix == 0) {
 		msgs = pci_msix_count(dev);
 		mps_dprint(sc, MPS_INIT, "Counted %d MSI-X messages\n", msgs);
 		msgs = min(msgs, sc->max_msix);
 		msgs = min(msgs, MPS_MSIX_MAX);
 		msgs = min(msgs, 1);	/* XXX */
 		if (msgs != 0) {
 			mps_dprint(sc, MPS_INIT, "Attempting to allocate %d "
 			    "MSI-X messages\n", msgs);
 			error = mps_alloc_msix(sc, msgs);
 		}
 	}
 	if (((error != 0) || (msgs == 0)) && (sc->disable_msi == 0)) {
 		msgs = pci_msi_count(dev);
 		mps_dprint(sc, MPS_INIT, "Counted %d MSI messages\n", msgs);
 		msgs = min(msgs, MPS_MSI_MAX);
 		if (msgs != 0) {
 			mps_dprint(sc, MPS_INIT, "Attempting to allocate %d "
 			    "MSI messages\n", MPS_MSI_MAX);
 			error = mps_alloc_msi(sc, MPS_MSI_MAX);
 		}
 	}
 	if ((error != 0) || (msgs == 0)) {
 		/*
 		 * If neither MSI or MSI-X are avaiable, assume legacy INTx.
 		 * This also implies that there will be only 1 queue.
 		 */
 		mps_dprint(sc, MPS_INIT, "Falling back to legacy INTx\n");
 		sc->mps_flags |= MPS_FLAGS_INTX;
 		msgs = 1;
 	} else
 		sc->mps_flags |= MPS_FLAGS_MSI;
 
 	sc->msi_msgs = msgs;
 	mps_dprint(sc, MPS_INIT, "Allocated %d interrupts\n", msgs);
 
 	return (error);
 }
 
 int
 mps_pci_setup_interrupts(struct mps_softc *sc)
 {
 	device_t dev;
 	struct mps_queue *q;
 	void *ihandler;
 	int i, error, rid, initial_rid;
 
 	dev = sc->mps_dev;
 	error = ENXIO;
 
 	if (sc->mps_flags & MPS_FLAGS_INTX) {
 		initial_rid = 0;
 		ihandler = mps_intr;
 	} else if (sc->mps_flags & MPS_FLAGS_MSI) {
 		initial_rid = 1;
 		ihandler = mps_intr_msi;
 	} else {
 		mps_dprint(sc, MPS_ERROR|MPS_INIT,
 		    "Unable to set up interrupts\n");
 		return (EINVAL);
 	}
 
 	for (i = 0; i < sc->msi_msgs; i++) {
 		q = &sc->queues[i];
 		rid = i + initial_rid;
 		q->irq_rid = rid;
 		q->irq = bus_alloc_resource_any(dev, SYS_RES_IRQ,
 		    &q->irq_rid, RF_ACTIVE);
 		if (q->irq == NULL) {
 			mps_dprint(sc, MPS_ERROR|MPS_INIT,
 			    "Cannot allocate interrupt RID %d\n", rid);
 			sc->msi_msgs = i;
 			break;
 		}
 		error = bus_setup_intr(dev, q->irq,
 		    INTR_TYPE_BIO | INTR_MPSAFE, NULL, ihandler,
 		    sc, &q->intrhand);
 		if (error) {
 			mps_dprint(sc, MPS_ERROR|MPS_INIT,
 			    "Cannot setup interrupt RID %d\n", rid);
 			sc->msi_msgs = i;
 			break;
 		}
 	}
 
 	mps_dprint(sc, MPS_INIT, "Set up %d interrupts\n", sc->msi_msgs);
 
 	return (error);
 }
 
 static int
 mps_pci_detach(device_t dev)
 {
 	struct mps_softc *sc;
 	int error;
 
 	sc = device_get_softc(dev);
 
 	if ((error = mps_free(sc)) != 0)
 		return (error);
 
 	mps_pci_free(sc);
 	return (0);
 }
 
 void
 mps_pci_free_interrupts(struct mps_softc *sc)
 {
 	struct mps_queue *q;
 	int i;
 
 	if (sc->queues == NULL)
 		return;
 
 	for (i = 0; i < sc->msi_msgs; i++) {
 		q = &sc->queues[i];
 		if (q->irq != NULL) {
 			bus_teardown_intr(sc->mps_dev, q->irq,
 			    q->intrhand);
 			bus_release_resource(sc->mps_dev, SYS_RES_IRQ,
 			    q->irq_rid, q->irq);
 		}
 	}
 }
 
 static void
 mps_pci_free(struct mps_softc *sc)
 {
 
 	if (sc->mps_parent_dmat != NULL) {
 		bus_dma_tag_destroy(sc->mps_parent_dmat);
 	}
 
 	mps_pci_free_interrupts(sc);
 
 	if (sc->mps_flags & MPS_FLAGS_MSI)
 		pci_release_msi(sc->mps_dev);
 
 	if (sc->mps_regs_resource != NULL) {
 		bus_release_resource(sc->mps_dev, SYS_RES_MEMORY,
 		    sc->mps_regs_rid, sc->mps_regs_resource);
 	}
 
 	return;
 }
 
 static int
 mps_pci_suspend(device_t dev)
 {
 	return (EINVAL);
 }
 
 static int
 mps_pci_resume(device_t dev)
 {
 	return (EINVAL);
 }
 
 static int
 mps_alloc_msix(struct mps_softc *sc, int msgs)
 {
 	int error;
 
 	error = pci_alloc_msix(sc->mps_dev, &msgs);
 	return (error);
 }
 
 static int
 mps_alloc_msi(struct mps_softc *sc, int msgs)
 {
 	int error;
 
 	error = pci_alloc_msi(sc->mps_dev, &msgs);
 	return (error);
 }
 
 int
 mps_pci_restore(struct mps_softc *sc)
 {
 	struct pci_devinfo *dinfo;
 
 	mps_dprint(sc, MPS_TRACE, "%s\n", __func__);
 
 	dinfo = device_get_ivars(sc->mps_dev);
 	if (dinfo == NULL) {
 		mps_dprint(sc, MPS_FAULT, "%s: NULL dinfo\n", __func__);
 		return (EINVAL);
 	}
 
 	pci_cfg_restore(sc->mps_dev, dinfo);
 	return (0);
 }
Index: head/sys/dev/mps/mps_user.c
===================================================================
--- head/sys/dev/mps/mps_user.c	(revision 365705)
+++ head/sys/dev/mps/mps_user.c	(revision 365706)
@@ -1,2507 +1,2506 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 2008 Yahoo!, Inc.
  * All rights reserved.
  * Written by: John Baldwin <jhb@FreeBSD.org>
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the author nor the names of any co-contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * Avago Technologies (LSI) MPT-Fusion Host Adapter FreeBSD userland interface
  */
 /*-
  * Copyright (c) 2011-2015 LSI Corp.
  * Copyright (c) 2013-2015 Avago Technologies
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * Avago Technologies (LSI) MPT-Fusion Host Adapter FreeBSD
  *
  * $FreeBSD$
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 /* TODO Move headers to mpsvar */
 #include <sys/types.h>
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/selinfo.h>
 #include <sys/module.h>
 #include <sys/bus.h>
 #include <sys/conf.h>
 #include <sys/bio.h>
 #include <sys/abi_compat.h>
 #include <sys/malloc.h>
 #include <sys/uio.h>
 #include <sys/sysctl.h>
 #include <sys/ioccom.h>
 #include <sys/endian.h>
 #include <sys/queue.h>
 #include <sys/kthread.h>
 #include <sys/taskqueue.h>
 #include <sys/proc.h>
 #include <sys/sysent.h>
 
 #include <machine/bus.h>
 #include <machine/resource.h>
 #include <sys/rman.h>
 
 #include <cam/cam.h>
 #include <cam/cam_ccb.h>
 #include <cam/scsi/scsi_all.h>
 
 #include <dev/mps/mpi/mpi2_type.h>
 #include <dev/mps/mpi/mpi2.h>
 #include <dev/mps/mpi/mpi2_ioc.h>
 #include <dev/mps/mpi/mpi2_cnfg.h>
 #include <dev/mps/mpi/mpi2_init.h>
 #include <dev/mps/mpi/mpi2_tool.h>
 #include <dev/mps/mps_ioctl.h>
 #include <dev/mps/mpsvar.h>
 #include <dev/mps/mps_table.h>
 #include <dev/mps/mps_sas.h>
 #include <dev/pci/pcivar.h>
 #include <dev/pci/pcireg.h>
 
 static d_open_t		mps_open;
 static d_close_t	mps_close;
 static d_ioctl_t	mps_ioctl_devsw;
 
 static struct cdevsw mps_cdevsw = {
 	.d_version =	D_VERSION,
 	.d_flags =	0,
 	.d_open =	mps_open,
 	.d_close =	mps_close,
 	.d_ioctl =	mps_ioctl_devsw,
 	.d_name =	"mps",
 };
 
 typedef int (mps_user_f)(struct mps_command *, struct mps_usr_command *);
 static mps_user_f	mpi_pre_ioc_facts;
 static mps_user_f	mpi_pre_port_facts;
 static mps_user_f	mpi_pre_fw_download;
 static mps_user_f	mpi_pre_fw_upload;
 static mps_user_f	mpi_pre_sata_passthrough;
 static mps_user_f	mpi_pre_smp_passthrough;
 static mps_user_f	mpi_pre_config;
 static mps_user_f	mpi_pre_sas_io_unit_control;
 
 static int mps_user_read_cfg_header(struct mps_softc *,
 				    struct mps_cfg_page_req *);
 static int mps_user_read_cfg_page(struct mps_softc *,
 				  struct mps_cfg_page_req *, void *);
 static int mps_user_read_extcfg_header(struct mps_softc *,
 				     struct mps_ext_cfg_page_req *);
 static int mps_user_read_extcfg_page(struct mps_softc *,
 				     struct mps_ext_cfg_page_req *, void *);
 static int mps_user_write_cfg_page(struct mps_softc *,
 				   struct mps_cfg_page_req *, void *);
 static int mps_user_setup_request(struct mps_command *,
 				  struct mps_usr_command *);
 static int mps_user_command(struct mps_softc *, struct mps_usr_command *);
 
 static int mps_user_pass_thru(struct mps_softc *sc, mps_pass_thru_t *data);
 static void mps_user_get_adapter_data(struct mps_softc *sc,
     mps_adapter_data_t *data);
 static void mps_user_read_pci_info(struct mps_softc *sc,
     mps_pci_info_t *data);
 static uint8_t mps_get_fw_diag_buffer_number(struct mps_softc *sc,
     uint32_t unique_id);
 static int mps_post_fw_diag_buffer(struct mps_softc *sc,
     mps_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code);
 static int mps_release_fw_diag_buffer(struct mps_softc *sc,
     mps_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code,
     uint32_t diag_type);
 static int mps_diag_register(struct mps_softc *sc,
     mps_fw_diag_register_t *diag_register, uint32_t *return_code);
 static int mps_diag_unregister(struct mps_softc *sc,
     mps_fw_diag_unregister_t *diag_unregister, uint32_t *return_code);
 static int mps_diag_query(struct mps_softc *sc, mps_fw_diag_query_t *diag_query,
     uint32_t *return_code);
 static int mps_diag_read_buffer(struct mps_softc *sc,
     mps_diag_read_buffer_t *diag_read_buffer, uint8_t *ioctl_buf,
     uint32_t *return_code);
 static int mps_diag_release(struct mps_softc *sc,
     mps_fw_diag_release_t *diag_release, uint32_t *return_code);
 static int mps_do_diag_action(struct mps_softc *sc, uint32_t action,
     uint8_t *diag_action, uint32_t length, uint32_t *return_code);
 static int mps_user_diag_action(struct mps_softc *sc, mps_diag_action_t *data);
 static void mps_user_event_query(struct mps_softc *sc, mps_event_query_t *data);
 static void mps_user_event_enable(struct mps_softc *sc,
     mps_event_enable_t *data);
 static int mps_user_event_report(struct mps_softc *sc,
     mps_event_report_t *data);
 static int mps_user_reg_access(struct mps_softc *sc, mps_reg_access_t *data);
 static int mps_user_btdh(struct mps_softc *sc, mps_btdh_mapping_t *data);
 
 MALLOC_DEFINE(M_MPSUSER, "mps_user", "Buffers for mps(4) ioctls");
 
 int
 mps_attach_user(struct mps_softc *sc)
 {
 	int unit;
 
 	unit = device_get_unit(sc->mps_dev);
 	sc->mps_cdev = make_dev(&mps_cdevsw, unit, UID_ROOT, GID_OPERATOR, 0640,
 	    "mps%d", unit);
 	if (sc->mps_cdev == NULL) {
 		return (ENOMEM);
 	}
 	sc->mps_cdev->si_drv1 = sc;
 	return (0);
 }
 
 void
 mps_detach_user(struct mps_softc *sc)
 {
 
 	/* XXX: do a purge of pending requests? */
 	if (sc->mps_cdev != NULL)
 		destroy_dev(sc->mps_cdev);
 }
 
 static int
 mps_open(struct cdev *dev, int flags, int fmt, struct thread *td)
 {
 
 	return (0);
 }
 
 static int
 mps_close(struct cdev *dev, int flags, int fmt, struct thread *td)
 {
 
 	return (0);
 }
 
 static int
 mps_user_read_cfg_header(struct mps_softc *sc,
     struct mps_cfg_page_req *page_req)
 {
 	MPI2_CONFIG_PAGE_HEADER *hdr;
 	struct mps_config_params params;
 	int	    error;
 
 	hdr = &params.hdr.Struct;
 	params.action = MPI2_CONFIG_ACTION_PAGE_HEADER;
 	params.page_address = le32toh(page_req->page_address);
 	hdr->PageVersion = 0;
 	hdr->PageLength = 0;
 	hdr->PageNumber = page_req->header.PageNumber;
 	hdr->PageType = page_req->header.PageType;
 	params.buffer = NULL;
 	params.length = 0;
 	params.callback = NULL;
 
 	if ((error = mps_read_config_page(sc, &params)) != 0) {
 		/*
 		 * Leave the request. Without resetting the chip, it's
 		 * still owned by it and we'll just get into trouble
 		 * freeing it now. Mark it as abandoned so that if it
 		 * shows up later it can be freed.
 		 */
 		mps_printf(sc, "read_cfg_header timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	page_req->ioc_status = htole16(params.status);
 	if ((page_req->ioc_status & MPI2_IOCSTATUS_MASK) ==
 	    MPI2_IOCSTATUS_SUCCESS) {
 		bcopy(hdr, &page_req->header, sizeof(page_req->header));
 	}
 
 	return (0);
 }
 
 static int
 mps_user_read_cfg_page(struct mps_softc *sc, struct mps_cfg_page_req *page_req,
     void *buf)
 {
 	MPI2_CONFIG_PAGE_HEADER *reqhdr, *hdr;
 	struct mps_config_params params;
 	int	      error;
 
 	reqhdr = buf;
 	hdr = &params.hdr.Struct;
 	hdr->PageVersion = reqhdr->PageVersion;
 	hdr->PageLength = reqhdr->PageLength;
 	hdr->PageNumber = reqhdr->PageNumber;
 	hdr->PageType = reqhdr->PageType & MPI2_CONFIG_PAGETYPE_MASK;
 	params.action = MPI2_CONFIG_ACTION_PAGE_READ_CURRENT;
 	params.page_address = le32toh(page_req->page_address);
 	params.buffer = buf;
 	params.length = le32toh(page_req->len);
 	params.callback = NULL;
 
 	if ((error = mps_read_config_page(sc, &params)) != 0) {
 		mps_printf(sc, "mps_user_read_cfg_page timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	page_req->ioc_status = htole16(params.status);
 	return (0);
 }
 
 static int
 mps_user_read_extcfg_header(struct mps_softc *sc,
     struct mps_ext_cfg_page_req *ext_page_req)
 {
 	MPI2_CONFIG_EXTENDED_PAGE_HEADER *hdr;
 	struct mps_config_params params;
 	int	    error;
 
 	hdr = &params.hdr.Ext;
 	params.action = MPI2_CONFIG_ACTION_PAGE_HEADER;
 	hdr->PageVersion = ext_page_req->header.PageVersion;
 	hdr->PageType = MPI2_CONFIG_PAGETYPE_EXTENDED;
 	hdr->ExtPageLength = 0;
 	hdr->PageNumber = ext_page_req->header.PageNumber;
 	hdr->ExtPageType = ext_page_req->header.ExtPageType;
 	params.page_address = le32toh(ext_page_req->page_address);
 	params.buffer = NULL;
 	params.length = 0;
 	params.callback = NULL;
 
 	if ((error = mps_read_config_page(sc, &params)) != 0) {
 		/*
 		 * Leave the request. Without resetting the chip, it's
 		 * still owned by it and we'll just get into trouble
 		 * freeing it now. Mark it as abandoned so that if it
 		 * shows up later it can be freed.
 		 */
 		mps_printf(sc, "mps_user_read_extcfg_header timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	ext_page_req->ioc_status = htole16(params.status);
 	if ((ext_page_req->ioc_status & MPI2_IOCSTATUS_MASK) ==
 	    MPI2_IOCSTATUS_SUCCESS) {
 		ext_page_req->header.PageVersion = hdr->PageVersion;
 		ext_page_req->header.PageNumber = hdr->PageNumber;
 		ext_page_req->header.PageType = hdr->PageType;
 		ext_page_req->header.ExtPageLength = hdr->ExtPageLength;
 		ext_page_req->header.ExtPageType = hdr->ExtPageType;
 	}
 
 	return (0);
 }
 
 static int
 mps_user_read_extcfg_page(struct mps_softc *sc,
     struct mps_ext_cfg_page_req *ext_page_req, void *buf)
 {
 	MPI2_CONFIG_EXTENDED_PAGE_HEADER *reqhdr, *hdr;
 	struct mps_config_params params;
 	int error;
 
 	reqhdr = buf;
 	hdr = &params.hdr.Ext;
 	params.action = MPI2_CONFIG_ACTION_PAGE_READ_CURRENT;
 	params.page_address = le32toh(ext_page_req->page_address);
 	hdr->PageVersion = reqhdr->PageVersion;
 	hdr->PageType = MPI2_CONFIG_PAGETYPE_EXTENDED;
 	hdr->PageNumber = reqhdr->PageNumber;
 	hdr->ExtPageType = reqhdr->ExtPageType;
 	hdr->ExtPageLength = reqhdr->ExtPageLength;
 	params.buffer = buf;
 	params.length = le32toh(ext_page_req->len);
 	params.callback = NULL;
 
 	if ((error = mps_read_config_page(sc, &params)) != 0) {
 		mps_printf(sc, "mps_user_read_extcfg_page timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	ext_page_req->ioc_status = htole16(params.status);
 	return (0);
 }
 
 static int
 mps_user_write_cfg_page(struct mps_softc *sc,
     struct mps_cfg_page_req *page_req, void *buf)
 {
 	MPI2_CONFIG_PAGE_HEADER *reqhdr, *hdr;
 	struct mps_config_params params;
 	u_int	      hdr_attr;
 	int	      error;
 
 	reqhdr = buf;
 	hdr = &params.hdr.Struct;
 	hdr_attr = reqhdr->PageType & MPI2_CONFIG_PAGEATTR_MASK;
 	if (hdr_attr != MPI2_CONFIG_PAGEATTR_CHANGEABLE &&
 	    hdr_attr != MPI2_CONFIG_PAGEATTR_PERSISTENT) {
 		mps_printf(sc, "page type 0x%x not changeable\n",
 			reqhdr->PageType & MPI2_CONFIG_PAGETYPE_MASK);
 		return (EINVAL);
 	}
 
 	/*
 	 * There isn't any point in restoring stripped out attributes
 	 * if you then mask them going down to issue the request.
 	 */
 
 	hdr->PageVersion = reqhdr->PageVersion;
 	hdr->PageLength = reqhdr->PageLength;
 	hdr->PageNumber = reqhdr->PageNumber;
 	hdr->PageType = reqhdr->PageType;
 	params.action = MPI2_CONFIG_ACTION_PAGE_WRITE_CURRENT;
 	params.page_address = le32toh(page_req->page_address);
 	params.buffer = buf;
 	params.length = le32toh(page_req->len);
 	params.callback = NULL;
 
 	if ((error = mps_write_config_page(sc, &params)) != 0) {
 		mps_printf(sc, "mps_write_cfg_page timed out\n");
 		return (ETIMEDOUT);
 	}
 
 	page_req->ioc_status = htole16(params.status);
 	return (0);
 }
 
 void
 mpi_init_sge(struct mps_command *cm, void *req, void *sge)
 {
 	int off, space;
 
 	space = (int)cm->cm_sc->reqframesz;
 	off = (uintptr_t)sge - (uintptr_t)req;
 
 	KASSERT(off < space, ("bad pointers %p %p, off %d, space %d",
             req, sge, off, space));
 
 	cm->cm_sge = sge;
 	cm->cm_sglsize = space - off;
 }
 
 /*
  * Prepare the mps_command for an IOC_FACTS request.
  */
 static int
 mpi_pre_ioc_facts(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_IOC_FACTS_REQUEST *req = (void *)cm->cm_req;
 	MPI2_IOC_FACTS_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	cm->cm_sge = NULL;
 	cm->cm_sglsize = 0;
 	return (0);
 }
 
 /*
  * Prepare the mps_command for a PORT_FACTS request.
  */
 static int
 mpi_pre_port_facts(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_PORT_FACTS_REQUEST *req = (void *)cm->cm_req;
 	MPI2_PORT_FACTS_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	cm->cm_sge = NULL;
 	cm->cm_sglsize = 0;
 	return (0);
 }
 
 /*
  * Prepare the mps_command for a FW_DOWNLOAD request.
  */
 static int
 mpi_pre_fw_download(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_FW_DOWNLOAD_REQUEST *req = (void *)cm->cm_req;
 	MPI2_FW_DOWNLOAD_REPLY *rpl;
 	MPI2_FW_DOWNLOAD_TCSGE tc;
 	int error;
 
 	/*
 	 * This code assumes there is room in the request's SGL for
 	 * the TransactionContext plus at least a SGL chain element.
 	 */
 	CTASSERT(sizeof req->SGL >= sizeof tc + MPS_SGC_SIZE);
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	if (cmd->len == 0)
 		return (EINVAL);
 
 	error = copyin(cmd->buf, cm->cm_data, cmd->len);
 	if (error != 0)
 		return (error);
 
 	mpi_init_sge(cm, req, &req->SGL);
 	bzero(&tc, sizeof tc);
 
 	/*
 	 * For now, the F/W image must be provided in a single request.
 	 */
 	if ((req->MsgFlags & MPI2_FW_DOWNLOAD_MSGFLGS_LAST_SEGMENT) == 0)
 		return (EINVAL);
 	if (req->TotalImageSize != cmd->len)
 		return (EINVAL);
 
 	/*
 	 * The value of the first two elements is specified in the
 	 * Fusion-MPT Message Passing Interface document.
 	 */
 	tc.ContextSize = 0;
 	tc.DetailsLength = 12;
 	tc.ImageOffset = 0;
 	tc.ImageSize = cmd->len;
 
 	cm->cm_flags |= MPS_CM_FLAGS_DATAOUT;
 
 	return (mps_push_sge(cm, &tc, sizeof tc, 0));
 }
 
 /*
  * Prepare the mps_command for a FW_UPLOAD request.
  */
 static int
 mpi_pre_fw_upload(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_FW_UPLOAD_REQUEST *req = (void *)cm->cm_req;
 	MPI2_FW_UPLOAD_REPLY *rpl;
 	MPI2_FW_UPLOAD_TCSGE tc;
 
 	/*
 	 * This code assumes there is room in the request's SGL for
 	 * the TransactionContext plus at least a SGL chain element.
 	 */
 	CTASSERT(sizeof req->SGL >= sizeof tc + MPS_SGC_SIZE);
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpi_init_sge(cm, req, &req->SGL);
 	bzero(&tc, sizeof tc);
 
 	/*
 	 * The value of the first two elements is specified in the
 	 * Fusion-MPT Message Passing Interface document.
 	 */
 	tc.ContextSize = 0;
 	tc.DetailsLength = 12;
 	/*
 	 * XXX Is there any reason to fetch a partial image?  I.e. to
 	 * set ImageOffset to something other than 0?
 	 */
 	tc.ImageOffset = 0;
 	tc.ImageSize = cmd->len;
 
 	cm->cm_flags |= MPS_CM_FLAGS_DATAIN;
 
 	return (mps_push_sge(cm, &tc, sizeof tc, 0));
 }
 
 /*
  * Prepare the mps_command for a SATA_PASSTHROUGH request.
  */
 static int
 mpi_pre_sata_passthrough(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_SATA_PASSTHROUGH_REQUEST *req = (void *)cm->cm_req;
 	MPI2_SATA_PASSTHROUGH_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpi_init_sge(cm, req, &req->SGL);
 	return (0);
 }
 
 /*
  * Prepare the mps_command for a SMP_PASSTHROUGH request.
  */
 static int
 mpi_pre_smp_passthrough(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_SMP_PASSTHROUGH_REQUEST *req = (void *)cm->cm_req;
 	MPI2_SMP_PASSTHROUGH_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpi_init_sge(cm, req, &req->SGL);
 	return (0);
 }
 
 /*
  * Prepare the mps_command for a CONFIG request.
  */
 static int
 mpi_pre_config(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_CONFIG_REQUEST *req = (void *)cm->cm_req;
 	MPI2_CONFIG_REPLY *rpl;
 
 	if (cmd->req_len != sizeof *req)
 		return (EINVAL);
 	if (cmd->rpl_len != sizeof *rpl)
 		return (EINVAL);
 
 	mpi_init_sge(cm, req, &req->PageBufferSGE);
 	return (0);
 }
 
 /*
  * Prepare the mps_command for a SAS_IO_UNIT_CONTROL request.
  */
 static int
 mpi_pre_sas_io_unit_control(struct mps_command *cm,
 			     struct mps_usr_command *cmd)
 {
 
 	cm->cm_sge = NULL;
 	cm->cm_sglsize = 0;
 	return (0);
 }
 
 /*
  * A set of functions to prepare an mps_command for the various
  * supported requests.
  */
 struct mps_user_func {
 	U8		Function;
 	mps_user_f	*f_pre;
 } mps_user_func_list[] = {
 	{ MPI2_FUNCTION_IOC_FACTS,		mpi_pre_ioc_facts },
 	{ MPI2_FUNCTION_PORT_FACTS,		mpi_pre_port_facts },
 	{ MPI2_FUNCTION_FW_DOWNLOAD, 		mpi_pre_fw_download },
 	{ MPI2_FUNCTION_FW_UPLOAD,		mpi_pre_fw_upload },
 	{ MPI2_FUNCTION_SATA_PASSTHROUGH,	mpi_pre_sata_passthrough },
 	{ MPI2_FUNCTION_SMP_PASSTHROUGH,	mpi_pre_smp_passthrough},
 	{ MPI2_FUNCTION_CONFIG,			mpi_pre_config},
 	{ MPI2_FUNCTION_SAS_IO_UNIT_CONTROL,	mpi_pre_sas_io_unit_control },
 	{ 0xFF,					NULL } /* list end */
 };
 
 static int
 mps_user_setup_request(struct mps_command *cm, struct mps_usr_command *cmd)
 {
 	MPI2_REQUEST_HEADER *hdr = (MPI2_REQUEST_HEADER *)cm->cm_req;	
 	struct mps_user_func *f;
 
 	for (f = mps_user_func_list; f->f_pre != NULL; f++) {
 		if (hdr->Function == f->Function)
 			return (f->f_pre(cm, cmd));
 	}
 	return (EINVAL);
 }	
 
 static int
 mps_user_command(struct mps_softc *sc, struct mps_usr_command *cmd)
 {
 	MPI2_REQUEST_HEADER *hdr;	
 	MPI2_DEFAULT_REPLY *rpl;
 	void *buf = NULL;
 	struct mps_command *cm = NULL;
 	int err = 0;
 	int sz;
 
 	mps_lock(sc);
 	cm = mps_alloc_command(sc);
 
 	if (cm == NULL) {
 		mps_printf(sc, "%s: no mps requests\n", __func__);
 		err = ENOMEM;
 		goto RetFree;
 	}
 	mps_unlock(sc);
 
 	hdr = (MPI2_REQUEST_HEADER *)cm->cm_req;
 
 	mps_dprint(sc, MPS_USER, "%s: req %p %d  rpl %p %d\n", __func__,
 	    cmd->req, cmd->req_len, cmd->rpl, cmd->rpl_len);
 
 	if (cmd->req_len > (int)sc->reqframesz) {
 		err = EINVAL;
 		goto RetFreeUnlocked;
 	}
 	err = copyin(cmd->req, hdr, cmd->req_len);
 	if (err != 0)
 		goto RetFreeUnlocked;
 
 	mps_dprint(sc, MPS_USER, "%s: Function %02X MsgFlags %02X\n", __func__,
 	    hdr->Function, hdr->MsgFlags);
 
 	if (cmd->len > 0) {
 		buf = malloc(cmd->len, M_MPSUSER, M_WAITOK|M_ZERO);
 		cm->cm_data = buf;
 		cm->cm_length = cmd->len;
 	} else {
 		cm->cm_data = NULL;
 		cm->cm_length = 0;
 	}
 
 	cm->cm_flags = MPS_CM_FLAGS_SGE_SIMPLE;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 
 	err = mps_user_setup_request(cm, cmd);
 	if (err == EINVAL) {
 		mps_printf(sc, "%s: unsupported parameter or unsupported "
 		    "function in request (function = 0x%X)\n", __func__,
 		    hdr->Function);
 	}
 	if (err != 0)
 		goto RetFreeUnlocked;
 
 	mps_lock(sc);
 	err = mps_wait_command(sc, &cm, 60, CAN_SLEEP);
 
 	if (err || (cm == NULL)) {
 		mps_printf(sc, "%s: invalid request: error %d\n",
 		    __func__, err);
 		goto RetFree;
 	}
 
 	rpl = (MPI2_DEFAULT_REPLY *)cm->cm_reply;
 	if (rpl != NULL)
 		sz = rpl->MsgLength * 4;
 	else
 		sz = 0;
 
 	if (sz > cmd->rpl_len) {
 		mps_printf(sc, "%s: user reply buffer (%d) smaller than "
 		    "returned buffer (%d)\n", __func__, cmd->rpl_len, sz);
 		sz = cmd->rpl_len;
 	}	
 
 	mps_unlock(sc);
 	copyout(rpl, cmd->rpl, sz);
 	if (buf != NULL)
 		copyout(buf, cmd->buf, cmd->len);
 	mps_dprint(sc, MPS_USER, "%s: reply size %d\n", __func__, sz);
 
 RetFreeUnlocked:
 	mps_lock(sc);
 RetFree:
 	if (cm != NULL)
 		mps_free_command(sc, cm);
 	mps_unlock(sc);
 	if (buf != NULL)
 		free(buf, M_MPSUSER);
 	return (err);
 }
 
 static int
 mps_user_pass_thru(struct mps_softc *sc, mps_pass_thru_t *data)
 {
 	MPI2_REQUEST_HEADER	*hdr, tmphdr;	
 	MPI2_DEFAULT_REPLY	*rpl = NULL;
 	struct mps_command	*cm = NULL;
 	int			err = 0, dir = 0, sz;
 	uint8_t			function = 0;
 	u_int			sense_len;
 	struct mpssas_target	*targ = NULL;
 
 	/*
 	 * Only allow one passthru command at a time.  Use the MPS_FLAGS_BUSY
 	 * bit to denote that a passthru is being processed.
 	 */
 	mps_lock(sc);
 	if (sc->mps_flags & MPS_FLAGS_BUSY) {
 		mps_dprint(sc, MPS_USER, "%s: Only one passthru command "
 		    "allowed at a single time.", __func__);
 		mps_unlock(sc);
 		return (EBUSY);
 	}
 	sc->mps_flags |= MPS_FLAGS_BUSY;
 	mps_unlock(sc);
 
 	/*
 	 * Do some validation on data direction.  Valid cases are:
 	 *    1) DataSize is 0 and direction is NONE
 	 *    2) DataSize is non-zero and one of:
 	 *        a) direction is READ or
 	 *        b) direction is WRITE or
 	 *        c) direction is BOTH and DataOutSize is non-zero
 	 * If valid and the direction is BOTH, change the direction to READ.
 	 * if valid and the direction is not BOTH, make sure DataOutSize is 0.
 	 */
 	if (((data->DataSize == 0) &&
 	    (data->DataDirection == MPS_PASS_THRU_DIRECTION_NONE)) ||
 	    ((data->DataSize != 0) &&
 	    ((data->DataDirection == MPS_PASS_THRU_DIRECTION_READ) ||
 	    (data->DataDirection == MPS_PASS_THRU_DIRECTION_WRITE) ||
 	    ((data->DataDirection == MPS_PASS_THRU_DIRECTION_BOTH) &&
 	    (data->DataOutSize != 0))))) {
 		if (data->DataDirection == MPS_PASS_THRU_DIRECTION_BOTH)
 			data->DataDirection = MPS_PASS_THRU_DIRECTION_READ;
 		else
 			data->DataOutSize = 0;
 	} else {
 		err = EINVAL;
 		goto RetFreeUnlocked;
 	}
 
 	mps_dprint(sc, MPS_USER, "%s: req 0x%jx %d  rpl 0x%jx %d "
 	    "data in 0x%jx %d data out 0x%jx %d data dir %d\n", __func__,
 	    data->PtrRequest, data->RequestSize, data->PtrReply,
 	    data->ReplySize, data->PtrData, data->DataSize,
 	    data->PtrDataOut, data->DataOutSize, data->DataDirection);
 
 	/*
 	 * copy in the header so we know what we're dealing with before we
 	 * commit to allocating a command for it.
 	 */
 	err = copyin(PTRIN(data->PtrRequest), &tmphdr, data->RequestSize);
 	if (err != 0)
 		goto RetFreeUnlocked;
 
 	if (data->RequestSize > (int)sc->reqframesz) {
 		err = EINVAL;
 		goto RetFreeUnlocked;
 	}
 
 	function = tmphdr.Function;
 	mps_dprint(sc, MPS_USER, "%s: Function %02X MsgFlags %02X\n", __func__,
 	    function, tmphdr.MsgFlags);
 
 	/*
 	 * Handle a passthru TM request.
 	 */
 	if (function == MPI2_FUNCTION_SCSI_TASK_MGMT) {
 		MPI2_SCSI_TASK_MANAGE_REQUEST	*task;
 
 		mps_lock(sc);
 		cm = mpssas_alloc_tm(sc);
 		if (cm == NULL) {
 			err = EINVAL;
 			goto Ret;
 		}
 
 		/* Copy the header in.  Only a small fixup is needed. */
 		task = (MPI2_SCSI_TASK_MANAGE_REQUEST *)cm->cm_req;
 		bcopy(&tmphdr, task, data->RequestSize);
 		task->TaskMID = cm->cm_desc.Default.SMID;
 
 		cm->cm_data = NULL;
 		cm->cm_complete = NULL;
 		cm->cm_complete_data = NULL;
 
 		targ = mpssas_find_target_by_handle(sc->sassc, 0,
 		    task->DevHandle);
 		if (targ == NULL) {
 			mps_dprint(sc, MPS_INFO,
 			   "%s %d : invalid handle for requested TM 0x%x \n",
 			   __func__, __LINE__, task->DevHandle);
 			err = 1;
 		} else {
 			mpssas_prepare_for_tm(sc, cm, targ, CAM_LUN_WILDCARD);
 			err = mps_wait_command(sc, &cm, 30, CAN_SLEEP);
 		}
 
 		if (err != 0) {
 			err = EIO;
 			mps_dprint(sc, MPS_FAULT, "%s: task management failed",
 			    __func__);
 		}
 		/*
 		 * Copy the reply data and sense data to user space.
 		 */
 		if ((cm != NULL) && (cm->cm_reply != NULL)) {
 			rpl = (MPI2_DEFAULT_REPLY *)cm->cm_reply;
 			sz = rpl->MsgLength * 4;
 
 			if (sz > data->ReplySize) {
 				mps_printf(sc, "%s: user reply buffer (%d) "
 				    "smaller than returned buffer (%d)\n",
 				    __func__, data->ReplySize, sz);
 			}
 			mps_unlock(sc);
 			copyout(cm->cm_reply, PTRIN(data->PtrReply),
 			    data->ReplySize);
 			mps_lock(sc);
 		}
 		mpssas_free_tm(sc, cm);
 		goto Ret;
 	}
 
 	mps_lock(sc);
 	cm = mps_alloc_command(sc);
 
 	if (cm == NULL) {
 		mps_printf(sc, "%s: no mps requests\n", __func__);
 		err = ENOMEM;
 		goto Ret;
 	}
 	mps_unlock(sc);
 
 	hdr = (MPI2_REQUEST_HEADER *)cm->cm_req;
 	bcopy(&tmphdr, hdr, data->RequestSize);
 
 	/*
 	 * Do some checking to make sure the IOCTL request contains a valid
 	 * request.  Then set the SGL info.
 	 */
 	mpi_init_sge(cm, hdr, (void *)((uint8_t *)hdr + data->RequestSize));
 
 	/*
 	 * Set up for read, write or both.  From check above, DataOutSize will
 	 * be 0 if direction is READ or WRITE, but it will have some non-zero
 	 * value if the direction is BOTH.  So, just use the biggest size to get
 	 * the cm_data buffer size.  If direction is BOTH, 2 SGLs need to be set
 	 * up; the first is for the request and the second will contain the
 	 * response data. cm_out_len needs to be set here and this will be used
 	 * when the SGLs are set up.
 	 */
 	cm->cm_data = NULL;
 	cm->cm_length = MAX(data->DataSize, data->DataOutSize);
 	cm->cm_out_len = data->DataOutSize;
 	cm->cm_flags = 0;
 	if (cm->cm_length != 0) {
 		cm->cm_data = malloc(cm->cm_length, M_MPSUSER, M_WAITOK |
 		    M_ZERO);
 		cm->cm_flags = MPS_CM_FLAGS_DATAIN;
 		if (data->DataOutSize) {
 			cm->cm_flags |= MPS_CM_FLAGS_DATAOUT;
 			err = copyin(PTRIN(data->PtrDataOut),
 			    cm->cm_data, data->DataOutSize);
 		} else if (data->DataDirection ==
 		    MPS_PASS_THRU_DIRECTION_WRITE) {
 			cm->cm_flags = MPS_CM_FLAGS_DATAOUT;
 			err = copyin(PTRIN(data->PtrData),
 			    cm->cm_data, data->DataSize);
 		}
 		if (err != 0)
 			mps_dprint(sc, MPS_FAULT, "%s: failed to copy "
 			    "IOCTL data from user space\n", __func__);
 	}
 	cm->cm_flags |= MPS_CM_FLAGS_SGE_SIMPLE;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 
 	/*
 	 * Set up Sense buffer and SGL offset for IO passthru.  SCSI IO request
 	 * uses SCSI IO descriptor.
 	 */
 	if ((function == MPI2_FUNCTION_SCSI_IO_REQUEST) ||
 	    (function == MPI2_FUNCTION_RAID_SCSI_IO_PASSTHROUGH)) {
 		MPI2_SCSI_IO_REQUEST	*scsi_io_req;
 
 		scsi_io_req = (MPI2_SCSI_IO_REQUEST *)hdr;
 		/*
 		 * Put SGE for data and data_out buffer at the end of
 		 * scsi_io_request message header (64 bytes in total).
 		 * Following above SGEs, the residual space will be used by
 		 * sense data.
 		 */
 		scsi_io_req->SenseBufferLength = (uint8_t)(data->RequestSize -
 		    64);
 		scsi_io_req->SenseBufferLowAddress = htole32(cm->cm_sense_busaddr);
 
 		/*
 		 * Set SGLOffset0 value.  This is the number of dwords that SGL
 		 * is offset from the beginning of MPI2_SCSI_IO_REQUEST struct.
 		 */
 		scsi_io_req->SGLOffset0 = 24;
 
 		/*
 		 * Setup descriptor info.  RAID passthrough must use the
 		 * default request descriptor which is already set, so if this
 		 * is a SCSI IO request, change the descriptor to SCSI IO.
 		 * Also, if this is a SCSI IO request, handle the reply in the
 		 * mpssas_scsio_complete function.
 		 */
 		if (function == MPI2_FUNCTION_SCSI_IO_REQUEST) {
 			cm->cm_desc.SCSIIO.RequestFlags =
 			    MPI2_REQ_DESCRIPT_FLAGS_SCSI_IO;
 			cm->cm_desc.SCSIIO.DevHandle = scsi_io_req->DevHandle;
 
 			/*
 			 * Make sure the DevHandle is not 0 because this is a
 			 * likely error.
 			 */
 			if (scsi_io_req->DevHandle == 0) {
 				err = EINVAL;
 				goto RetFreeUnlocked;
 			}
 		}
 	}
 
 	mps_lock(sc);
 
 	err = mps_wait_command(sc, &cm, 30, CAN_SLEEP);
 
 	if (err || (cm == NULL)) {
 		mps_printf(sc, "%s: invalid request: error %d\n", __func__,
 		    err);
 		mps_unlock(sc);
 		goto RetFreeUnlocked;
 	}
 
 	/*
 	 * Sync the DMA data, if any.  Then copy the data to user space.
 	 */
 	if (cm->cm_data != NULL) {
 		if (cm->cm_flags & MPS_CM_FLAGS_DATAIN)
 			dir = BUS_DMASYNC_POSTREAD;
 		else if (cm->cm_flags & MPS_CM_FLAGS_DATAOUT)
 			dir = BUS_DMASYNC_POSTWRITE;
 		bus_dmamap_sync(sc->buffer_dmat, cm->cm_dmamap, dir);
 		bus_dmamap_unload(sc->buffer_dmat, cm->cm_dmamap);
 
 		if (cm->cm_flags & MPS_CM_FLAGS_DATAIN) {
 			mps_unlock(sc);
 			err = copyout(cm->cm_data,
 			    PTRIN(data->PtrData), data->DataSize);
 			mps_lock(sc);
 			if (err != 0)
 				mps_dprint(sc, MPS_FAULT, "%s: failed to copy "
 				    "IOCTL data to user space\n", __func__);
 		}
 	}
 
 	/*
 	 * Copy the reply data and sense data to user space.
 	 */
 	if (cm->cm_reply != NULL) {
 		rpl = (MPI2_DEFAULT_REPLY *)cm->cm_reply;
 		sz = rpl->MsgLength * 4;
 
 		if (sz > data->ReplySize) {
 			mps_printf(sc, "%s: user reply buffer (%d) smaller "
 			    "than returned buffer (%d)\n", __func__,
 			    data->ReplySize, sz);
 		}
 		mps_unlock(sc);
 		copyout(cm->cm_reply, PTRIN(data->PtrReply), data->ReplySize);
 		mps_lock(sc);
 
 		if ((function == MPI2_FUNCTION_SCSI_IO_REQUEST) ||
 		    (function == MPI2_FUNCTION_RAID_SCSI_IO_PASSTHROUGH)) {
 			if (((MPI2_SCSI_IO_REPLY *)rpl)->SCSIState &
 			    MPI2_SCSI_STATE_AUTOSENSE_VALID) {
 				sense_len =
 				    MIN((le32toh(((MPI2_SCSI_IO_REPLY *)rpl)->
 				    SenseCount)), sizeof(struct
 				    scsi_sense_data));
 				mps_unlock(sc);
 				copyout(cm->cm_sense, (PTRIN(data->PtrReply +
 				    sizeof(MPI2_SCSI_IO_REPLY))), sense_len);
 				mps_lock(sc);
 			}
 		}
 	}
 	mps_unlock(sc);
 
 RetFreeUnlocked:
 	mps_lock(sc);
 
 	if (cm != NULL) {
 		if (cm->cm_data)
 			free(cm->cm_data, M_MPSUSER);
 		mps_free_command(sc, cm);
 	}
 Ret:
 	sc->mps_flags &= ~MPS_FLAGS_BUSY;
 	mps_unlock(sc);
 
 	return (err);
 }
 
 static void
 mps_user_get_adapter_data(struct mps_softc *sc, mps_adapter_data_t *data)
 {
 	Mpi2ConfigReply_t	mpi_reply;
 	Mpi2BiosPage3_t		config_page;
 
 	/*
 	 * Use the PCI interface functions to get the Bus, Device, and Function
 	 * information.
 	 */
 	data->PciInformation.u.bits.BusNumber = pci_get_bus(sc->mps_dev);
 	data->PciInformation.u.bits.DeviceNumber = pci_get_slot(sc->mps_dev);
 	data->PciInformation.u.bits.FunctionNumber =
 	    pci_get_function(sc->mps_dev);
 
 	/*
 	 * Get the FW version that should already be saved in IOC Facts.
 	 */
 	data->MpiFirmwareVersion = sc->facts->FWVersion.Word;
 
 	/*
 	 * General device info.
 	 */
 	data->AdapterType = MPSIOCTL_ADAPTER_TYPE_SAS2;
 	if (sc->mps_flags & MPS_FLAGS_WD_AVAILABLE)
 		data->AdapterType = MPSIOCTL_ADAPTER_TYPE_SAS2_SSS6200;
 	data->PCIDeviceHwId = pci_get_device(sc->mps_dev);
 	data->PCIDeviceHwRev = pci_read_config(sc->mps_dev, PCIR_REVID, 1);
 	data->SubSystemId = pci_get_subdevice(sc->mps_dev);
 	data->SubsystemVendorId = pci_get_subvendor(sc->mps_dev);
 
 	/*
 	 * Get the driver version.
 	 */
 	strcpy((char *)&data->DriverVersion[0], MPS_DRIVER_VERSION);
 
 	/*
 	 * Need to get BIOS Config Page 3 for the BIOS Version.
 	 */
 	data->BiosVersion = 0;
 	mps_lock(sc);
 	if (mps_config_get_bios_pg3(sc, &mpi_reply, &config_page))
 		printf("%s: Error while retrieving BIOS Version\n", __func__);
 	else
 		data->BiosVersion = config_page.BiosVersion;
 	mps_unlock(sc);
 }
 
 static void
 mps_user_read_pci_info(struct mps_softc *sc, mps_pci_info_t *data)
 {
 	int	i;
 
 	/*
 	 * Use the PCI interface functions to get the Bus, Device, and Function
 	 * information.
 	 */
 	data->BusNumber = pci_get_bus(sc->mps_dev);
 	data->DeviceNumber = pci_get_slot(sc->mps_dev);
 	data->FunctionNumber = pci_get_function(sc->mps_dev);
 
 	/*
 	 * Now get the interrupt vector and the pci header.  The vector can
 	 * only be 0 right now.  The header is the first 256 bytes of config
 	 * space.
 	 */
 	data->InterruptVector = 0;
 	for (i = 0; i < sizeof (data->PciHeader); i++) {
 		data->PciHeader[i] = pci_read_config(sc->mps_dev, i, 1);
 	}
 }
 
 static uint8_t
 mps_get_fw_diag_buffer_number(struct mps_softc *sc, uint32_t unique_id)
 {
 	uint8_t	index;
 
 	for (index = 0; index < MPI2_DIAG_BUF_TYPE_COUNT; index++) {
 		if (sc->fw_diag_buffer_list[index].unique_id == unique_id) {
 			return (index);
 		}
 	}
 
 	return (MPS_FW_DIAGNOSTIC_UID_NOT_FOUND);
 }
 
 static int
 mps_post_fw_diag_buffer(struct mps_softc *sc,
     mps_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code)
 {
 	MPI2_DIAG_BUFFER_POST_REQUEST	*req;
 	MPI2_DIAG_BUFFER_POST_REPLY	*reply = NULL;
 	struct mps_command		*cm = NULL;
 	int				i, status;
 
 	/*
 	 * If buffer is not enabled, just leave.
 	 */
 	*return_code = MPS_FW_DIAG_ERROR_POST_FAILED;
 	if (!pBuffer->enabled) {
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * Clear some flags initially.
 	 */
 	pBuffer->force_release = FALSE;
 	pBuffer->valid_data = FALSE;
 	pBuffer->owned_by_firmware = FALSE;
 
 	/*
 	 * Get a command.
 	 */
 	cm = mps_alloc_command(sc);
 	if (cm == NULL) {
 		mps_printf(sc, "%s: no mps requests\n", __func__);
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * Build the request for releasing the FW Diag Buffer and send it.
 	 */
 	req = (MPI2_DIAG_BUFFER_POST_REQUEST *)cm->cm_req;
 	req->Function = MPI2_FUNCTION_DIAG_BUFFER_POST;
 	req->BufferType = pBuffer->buffer_type;
 	req->ExtendedType = pBuffer->extended_type;
 	req->BufferLength = pBuffer->size;
 	for (i = 0; i < (sizeof(req->ProductSpecific) / 4); i++)
 		req->ProductSpecific[i] = pBuffer->product_specific[i];
 	mps_from_u64(sc->fw_diag_busaddr, &req->BufferAddress);
 	cm->cm_data = NULL;
 	cm->cm_length = 0;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_complete_data = NULL;
 
 	/*
 	 * Send command synchronously.
 	 */
 	status = mps_wait_command(sc, &cm, 30, CAN_SLEEP);
 	if (status || (cm == NULL)) {
 		mps_printf(sc, "%s: invalid request: error %d\n", __func__,
 		    status);
 		status = MPS_DIAG_FAILURE;
 		goto done;
 	}
 
 	/*
 	 * Process POST reply.
 	 */
 	reply = (MPI2_DIAG_BUFFER_POST_REPLY *)cm->cm_reply;
 	if (reply == NULL) {
 		mps_printf(sc, "%s: reply is NULL, probably due to "
 		    "reinitialization\n", __func__);
 		status = MPS_DIAG_FAILURE;
 		goto done;
 	}
 	if ((le16toh(reply->IOCStatus) & MPI2_IOCSTATUS_MASK) !=
 	    MPI2_IOCSTATUS_SUCCESS) {
 		status = MPS_DIAG_FAILURE;
 		mps_dprint(sc, MPS_FAULT, "%s: post of FW  Diag Buffer failed "
 		    "with IOCStatus = 0x%x, IOCLogInfo = 0x%x and "
 		    "TransferLength = 0x%x\n", __func__,
 		    le16toh(reply->IOCStatus), le32toh(reply->IOCLogInfo),
 		    le32toh(reply->TransferLength));
 		goto done;
 	}
 
 	/*
 	 * Post was successful.
 	 */
 	pBuffer->valid_data = TRUE;
 	pBuffer->owned_by_firmware = TRUE;
 	*return_code = MPS_FW_DIAG_ERROR_SUCCESS;
 	status = MPS_DIAG_SUCCESS;
 
 done:
 	if (cm != NULL)
 		mps_free_command(sc, cm);
 	return (status);
 }
 
 static int
 mps_release_fw_diag_buffer(struct mps_softc *sc,
     mps_fw_diagnostic_buffer_t *pBuffer, uint32_t *return_code,
     uint32_t diag_type)
 {
 	MPI2_DIAG_RELEASE_REQUEST	*req;
 	MPI2_DIAG_RELEASE_REPLY		*reply = NULL;
 	struct mps_command		*cm = NULL;
 	int				status;
 
 	/*
 	 * If buffer is not enabled, just leave.
 	 */
 	*return_code = MPS_FW_DIAG_ERROR_RELEASE_FAILED;
 	if (!pBuffer->enabled) {
 		mps_dprint(sc, MPS_USER, "%s: This buffer type is not "
 		    "supported by the IOC", __func__);
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * Clear some flags initially.
 	 */
 	pBuffer->force_release = FALSE;
 	pBuffer->valid_data = FALSE;
 	pBuffer->owned_by_firmware = FALSE;
 
 	/*
 	 * Get a command.
 	 */
 	cm = mps_alloc_command(sc);
 	if (cm == NULL) {
 		mps_printf(sc, "%s: no mps requests\n", __func__);
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * Build the request for releasing the FW Diag Buffer and send it.
 	 */
 	req = (MPI2_DIAG_RELEASE_REQUEST *)cm->cm_req;
 	req->Function = MPI2_FUNCTION_DIAG_RELEASE;
 	req->BufferType = pBuffer->buffer_type;
 	cm->cm_data = NULL;
 	cm->cm_length = 0;
 	cm->cm_desc.Default.RequestFlags = MPI2_REQ_DESCRIPT_FLAGS_DEFAULT_TYPE;
 	cm->cm_complete_data = NULL;
 
 	/*
 	 * Send command synchronously.
 	 */
 	status = mps_wait_command(sc, &cm, 30, CAN_SLEEP);
 	if (status || (cm == NULL)) {
 		mps_printf(sc, "%s: invalid request: error %d\n", __func__,
 		    status);
 		status = MPS_DIAG_FAILURE;
 		goto done;
 	}
 
 	/*
 	 * Process RELEASE reply.
 	 */
 	reply = (MPI2_DIAG_RELEASE_REPLY *)cm->cm_reply;
 	if (reply == NULL) {
 		mps_printf(sc, "%s: reply is NULL, probably due to "
 		    "reinitialization\n", __func__);
 		status = MPS_DIAG_FAILURE;
 		goto done;
 	}
 	if (((le16toh(reply->IOCStatus) & MPI2_IOCSTATUS_MASK) !=
 	    MPI2_IOCSTATUS_SUCCESS) || pBuffer->owned_by_firmware) {
 		status = MPS_DIAG_FAILURE;
 		mps_dprint(sc, MPS_FAULT, "%s: release of FW Diag Buffer "
 		    "failed with IOCStatus = 0x%x and IOCLogInfo = 0x%x\n",
 		    __func__, le16toh(reply->IOCStatus),
 		    le32toh(reply->IOCLogInfo));
 		goto done;
 	}
 
 	/*
 	 * Release was successful.
 	 */
 	*return_code = MPS_FW_DIAG_ERROR_SUCCESS;
 	status = MPS_DIAG_SUCCESS;
 
 	/*
 	 * If this was for an UNREGISTER diag type command, clear the unique ID.
 	 */
 	if (diag_type == MPS_FW_DIAG_TYPE_UNREGISTER) {
 		pBuffer->unique_id = MPS_FW_DIAG_INVALID_UID;
 	}
 
 done:
 	if (cm != NULL)
 		mps_free_command(sc, cm);
 
 	return (status);
 }
 
 static int
 mps_diag_register(struct mps_softc *sc, mps_fw_diag_register_t *diag_register,
     uint32_t *return_code)
 {
-	bus_dma_tag_template_t		t;
+	bus_dma_template_t		t;
 	mps_fw_diagnostic_buffer_t	*pBuffer;
 	struct mps_busdma_context	*ctx;
 	uint8_t				extended_type, buffer_type, i;
 	uint32_t			buffer_size;
 	uint32_t			unique_id;
 	int				status;
 	int				error;
 
 	extended_type = diag_register->ExtendedType;
 	buffer_type = diag_register->BufferType;
 	buffer_size = diag_register->RequestedBufferSize;
 	unique_id = diag_register->UniqueId;
 	ctx = NULL;
 	error = 0;
 
 	/*
 	 * Check for valid buffer type
 	 */
 	if (buffer_type >= MPI2_DIAG_BUF_TYPE_COUNT) {
 		*return_code = MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should not be found.  If it is, the ID is already in use.
 	 */
 	i = mps_get_fw_diag_buffer_number(sc, unique_id);
 	pBuffer = &sc->fw_diag_buffer_list[buffer_type];
 	if (i != MPS_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPS_FW_DIAG_ERROR_INVALID_UID;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * The buffer's unique ID should not be registered yet, and the given
 	 * unique ID cannot be 0.
 	 */
 	if ((pBuffer->unique_id != MPS_FW_DIAG_INVALID_UID) ||
 	    (unique_id == MPS_FW_DIAG_INVALID_UID)) {
 		*return_code = MPS_FW_DIAG_ERROR_INVALID_UID;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * If this buffer is already posted as immediate, just change owner.
 	 */
 	if (pBuffer->immediate && pBuffer->owned_by_firmware &&
 	    (pBuffer->unique_id == MPS_FW_DIAG_INVALID_UID)) {
 		pBuffer->immediate = FALSE;
 		pBuffer->unique_id = unique_id;
 		return (MPS_DIAG_SUCCESS);
 	}
 
 	/*
 	 * Post a new buffer after checking if it's enabled.  The DMA buffer
 	 * that is allocated will be contiguous (nsegments = 1).
 	 */
 	if (!pBuffer->enabled) {
 		*return_code = MPS_FW_DIAG_ERROR_NO_BUFFER;
 		return (MPS_DIAG_FAILURE);
 	}
 	bus_dma_template_init(&t, sc->mps_parent_dmat);
-	t.lowaddr = BUS_SPACE_MAXADDR_32BIT;
-	t.maxsize = t.maxsegsize = buffer_size;
-	t.nsegments = 1;
+	BUS_DMA_TEMPLATE_FILL(&t, BD_NSEGMENTS(1), BD_MAXSIZE(buffer_size),
+	    BD_MAXSEGSIZE(buffer_size), BD_LOWADDR(BUS_SPACE_MAXADDR_32BIT));
 	if (bus_dma_template_tag(&t, &sc->fw_diag_dmat)) {
 		mps_dprint(sc, MPS_ERROR,
 		    "Cannot allocate FW diag buffer DMA tag\n");
 		*return_code = MPS_FW_DIAG_ERROR_NO_BUFFER;
 		status = MPS_DIAG_FAILURE;
 		goto bailout;
 	}
 	if (bus_dmamem_alloc(sc->fw_diag_dmat, (void **)&sc->fw_diag_buffer,
 	    BUS_DMA_NOWAIT, &sc->fw_diag_map)) {
 		mps_dprint(sc, MPS_ERROR,
 		    "Cannot allocate FW diag buffer memory\n");
 		*return_code = MPS_FW_DIAG_ERROR_NO_BUFFER;
 		status = MPS_DIAG_FAILURE;
 		goto bailout;
         }
         bzero(sc->fw_diag_buffer, buffer_size);
 
 	ctx = malloc(sizeof(*ctx), M_MPSUSER, M_WAITOK | M_ZERO);
 	ctx->addr = &sc->fw_diag_busaddr;
 	ctx->buffer_dmat = sc->fw_diag_dmat;
 	ctx->buffer_dmamap = sc->fw_diag_map;
 	ctx->softc = sc;
         error = bus_dmamap_load(sc->fw_diag_dmat, sc->fw_diag_map,
 	    sc->fw_diag_buffer, buffer_size, mps_memaddr_wait_cb,
 	    ctx, 0);
 
 	if (error == EINPROGRESS) {
 		/* XXX KDM */
 		device_printf(sc->mps_dev, "%s: Deferred bus_dmamap_load\n",
 		    __func__);
 		/*
 		 * Wait for the load to complete.  If we're interrupted,
 		 * bail out.
 		 */
 		mps_lock(sc);
 		if (ctx->completed == 0) {
 			error = msleep(ctx, &sc->mps_mtx, PCATCH, "mpswait", 0);
 			if (error != 0) {
 				/*
 				 * We got an error from msleep(9).  This is
 				 * most likely due to a signal.  Tell
 				 * mpr_memaddr_wait_cb() that we've abandoned
 				 * the context, so it needs to clean up when
 				 * it is called.
 				 */
 				ctx->abandoned = 1;
 
 				/* The callback will free this memory */
 				ctx = NULL;
 				mps_unlock(sc);
 
 				device_printf(sc->mps_dev, "Cannot "
 				    "bus_dmamap_load FW diag buffer, error = "
 				    "%d returned from msleep\n", error);
 				*return_code = MPS_FW_DIAG_ERROR_NO_BUFFER;
 				status = MPS_DIAG_FAILURE;
 				goto bailout;
 			}
 		}
 		mps_unlock(sc);
 	} 
 
 	if ((error != 0) || (ctx->error != 0)) {
 		device_printf(sc->mps_dev, "Cannot bus_dmamap_load FW diag "
 		    "buffer, %serror = %d\n", error ? "" : "callback ",
 		    error ? error : ctx->error);
 		*return_code = MPS_FW_DIAG_ERROR_NO_BUFFER;
 		status = MPS_DIAG_FAILURE;
 		goto bailout;
 	}
 
 	bus_dmamap_sync(sc->fw_diag_dmat, sc->fw_diag_map, BUS_DMASYNC_PREREAD);
 
 	pBuffer->size = buffer_size;
 
 	/*
 	 * Copy the given info to the diag buffer and post the buffer.
 	 */
 	pBuffer->buffer_type = buffer_type;
 	pBuffer->immediate = FALSE;
 	if (buffer_type == MPI2_DIAG_BUF_TYPE_TRACE) {
 		for (i = 0; i < (sizeof (pBuffer->product_specific) / 4);
 		    i++) {
 			pBuffer->product_specific[i] =
 			    diag_register->ProductSpecific[i];
 		}
 	}
 	pBuffer->extended_type = extended_type;
 	pBuffer->unique_id = unique_id;
 	status = mps_post_fw_diag_buffer(sc, pBuffer, return_code);
 
 bailout:
 	/*
 	 * In case there was a failure, free the DMA buffer.
 	 */
 	if (status == MPS_DIAG_FAILURE) {
 		if (sc->fw_diag_busaddr != 0) {
 			bus_dmamap_unload(sc->fw_diag_dmat, sc->fw_diag_map);
 			sc->fw_diag_busaddr = 0;
 		}
 		if (sc->fw_diag_buffer != NULL) {
 			bus_dmamem_free(sc->fw_diag_dmat, sc->fw_diag_buffer,
 			    sc->fw_diag_map);
 			sc->fw_diag_buffer = NULL;
 		}
 		if (sc->fw_diag_dmat != NULL) {
 			bus_dma_tag_destroy(sc->fw_diag_dmat);
 			sc->fw_diag_dmat = NULL;
 		}
 	}
 
 	if (ctx != NULL)
 		free(ctx, M_MPSUSER);
 
 	return (status);
 }
 
 static int
 mps_diag_unregister(struct mps_softc *sc,
     mps_fw_diag_unregister_t *diag_unregister, uint32_t *return_code)
 {
 	mps_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i;
 	uint32_t			unique_id;
 	int				status;
 
 	unique_id = diag_unregister->UniqueId;
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should be there.
 	 */
 	i = mps_get_fw_diag_buffer_number(sc, unique_id);
 	if (i == MPS_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPS_FW_DIAG_ERROR_INVALID_UID;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	pBuffer = &sc->fw_diag_buffer_list[i];
 
 	/*
 	 * Try to release the buffer from FW before freeing it.  If release
 	 * fails, don't free the DMA buffer in case FW tries to access it
 	 * later.  If buffer is not owned by firmware, can't release it.
 	 */
 	if (!pBuffer->owned_by_firmware) {
 		status = MPS_DIAG_SUCCESS;
 	} else {
 		status = mps_release_fw_diag_buffer(sc, pBuffer, return_code,
 		    MPS_FW_DIAG_TYPE_UNREGISTER);
 	}
 
 	/*
 	 * At this point, return the current status no matter what happens with
 	 * the DMA buffer.
 	 */
 	pBuffer->unique_id = MPS_FW_DIAG_INVALID_UID;
 	if (status == MPS_DIAG_SUCCESS) {
 		if (sc->fw_diag_busaddr != 0) {
 			bus_dmamap_unload(sc->fw_diag_dmat, sc->fw_diag_map);
 			sc->fw_diag_busaddr = 0;
 		}
 		if (sc->fw_diag_buffer != NULL) {
 			bus_dmamem_free(sc->fw_diag_dmat, sc->fw_diag_buffer,
 			    sc->fw_diag_map);
 			sc->fw_diag_buffer = NULL;
 		}
 		if (sc->fw_diag_dmat != NULL) {
 			bus_dma_tag_destroy(sc->fw_diag_dmat);
 			sc->fw_diag_dmat = NULL;
 		}
 	}
 
 	return (status);
 }
 
 static int
 mps_diag_query(struct mps_softc *sc, mps_fw_diag_query_t *diag_query,
     uint32_t *return_code)
 {
 	mps_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i;
 	uint32_t			unique_id;
 
 	unique_id = diag_query->UniqueId;
 
 	/*
 	 * If ID is valid, query on ID.
 	 * If ID is invalid, query on buffer type.
 	 */
 	if (unique_id == MPS_FW_DIAG_INVALID_UID) {
 		i = diag_query->BufferType;
 		if (i >= MPI2_DIAG_BUF_TYPE_COUNT) {
 			*return_code = MPS_FW_DIAG_ERROR_INVALID_UID;
 			return (MPS_DIAG_FAILURE);
 		}
 	} else {
 		i = mps_get_fw_diag_buffer_number(sc, unique_id);
 		if (i == MPS_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 			*return_code = MPS_FW_DIAG_ERROR_INVALID_UID;
 			return (MPS_DIAG_FAILURE);
 		}
 	}
 
 	/*
 	 * Fill query structure with the diag buffer info.
 	 */
 	pBuffer = &sc->fw_diag_buffer_list[i];
 	diag_query->BufferType = pBuffer->buffer_type;
 	diag_query->ExtendedType = pBuffer->extended_type;
 	if (diag_query->BufferType == MPI2_DIAG_BUF_TYPE_TRACE) {
 		for (i = 0; i < (sizeof(diag_query->ProductSpecific) / 4);
 		    i++) {
 			diag_query->ProductSpecific[i] =
 			    pBuffer->product_specific[i];
 		}
 	}
 	diag_query->TotalBufferSize = pBuffer->size;
 	diag_query->DriverAddedBufferSize = 0;
 	diag_query->UniqueId = pBuffer->unique_id;
 	diag_query->ApplicationFlags = 0;
 	diag_query->DiagnosticFlags = 0;
 
 	/*
 	 * Set/Clear application flags
 	 */
 	if (pBuffer->immediate) {
 		diag_query->ApplicationFlags &= ~MPS_FW_DIAG_FLAG_APP_OWNED;
 	} else {
 		diag_query->ApplicationFlags |= MPS_FW_DIAG_FLAG_APP_OWNED;
 	}
 	if (pBuffer->valid_data || pBuffer->owned_by_firmware) {
 		diag_query->ApplicationFlags |= MPS_FW_DIAG_FLAG_BUFFER_VALID;
 	} else {
 		diag_query->ApplicationFlags &= ~MPS_FW_DIAG_FLAG_BUFFER_VALID;
 	}
 	if (pBuffer->owned_by_firmware) {
 		diag_query->ApplicationFlags |=
 		    MPS_FW_DIAG_FLAG_FW_BUFFER_ACCESS;
 	} else {
 		diag_query->ApplicationFlags &=
 		    ~MPS_FW_DIAG_FLAG_FW_BUFFER_ACCESS;
 	}
 
 	return (MPS_DIAG_SUCCESS);
 }
 
 static int
 mps_diag_read_buffer(struct mps_softc *sc,
     mps_diag_read_buffer_t *diag_read_buffer, uint8_t *ioctl_buf,
     uint32_t *return_code)
 {
 	mps_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i, *pData;
 	uint32_t			unique_id;
 	int				status;
 
 	unique_id = diag_read_buffer->UniqueId;
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should be there.
 	 */
 	i = mps_get_fw_diag_buffer_number(sc, unique_id);
 	if (i == MPS_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPS_FW_DIAG_ERROR_INVALID_UID;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	pBuffer = &sc->fw_diag_buffer_list[i];
 
 	/*
 	 * Make sure requested read is within limits
 	 */
 	if (diag_read_buffer->StartingOffset + diag_read_buffer->BytesToRead >
 	    pBuffer->size) {
 		*return_code = MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/* Sync the DMA map before we copy to userland. */
 	bus_dmamap_sync(sc->fw_diag_dmat, sc->fw_diag_map,
 	    BUS_DMASYNC_POSTREAD);
 
 	/*
 	 * Copy the requested data from DMA to the diag_read_buffer.  The DMA
 	 * buffer that was allocated is one contiguous buffer.
 	 */
 	pData = (uint8_t *)(sc->fw_diag_buffer +
 	    diag_read_buffer->StartingOffset);
 	if (copyout(pData, ioctl_buf, diag_read_buffer->BytesToRead) != 0)
 		return (MPS_DIAG_FAILURE);
 	diag_read_buffer->Status = 0;
 
 	/*
 	 * Set or clear the Force Release flag.
 	 */
 	if (pBuffer->force_release) {
 		diag_read_buffer->Flags |= MPS_FW_DIAG_FLAG_FORCE_RELEASE;
 	} else {
 		diag_read_buffer->Flags &= ~MPS_FW_DIAG_FLAG_FORCE_RELEASE;
 	}
 
 	/*
 	 * If buffer is to be reregistered, make sure it's not already owned by
 	 * firmware first.
 	 */
 	status = MPS_DIAG_SUCCESS;
 	if (!pBuffer->owned_by_firmware) {
 		if (diag_read_buffer->Flags & MPS_FW_DIAG_FLAG_REREGISTER) {
 			status = mps_post_fw_diag_buffer(sc, pBuffer,
 			    return_code);
 		}
 	}
 
 	return (status);
 }
 
 static int
 mps_diag_release(struct mps_softc *sc, mps_fw_diag_release_t *diag_release,
     uint32_t *return_code)
 {
 	mps_fw_diagnostic_buffer_t	*pBuffer;
 	uint8_t				i;
 	uint32_t			unique_id;
 	int				status;
 
 	unique_id = diag_release->UniqueId;
 
 	/*
 	 * Get the current buffer and look up the unique ID.  The unique ID
 	 * should be there.
 	 */
 	i = mps_get_fw_diag_buffer_number(sc, unique_id);
 	if (i == MPS_FW_DIAGNOSTIC_UID_NOT_FOUND) {
 		*return_code = MPS_FW_DIAG_ERROR_INVALID_UID;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	pBuffer = &sc->fw_diag_buffer_list[i];
 
 	/*
 	 * If buffer is not owned by firmware, it's already been released.
 	 */
 	if (!pBuffer->owned_by_firmware) {
 		*return_code = MPS_FW_DIAG_ERROR_ALREADY_RELEASED;
 		return (MPS_DIAG_FAILURE);
 	}
 
 	/*
 	 * Release the buffer.
 	 */
 	status = mps_release_fw_diag_buffer(sc, pBuffer, return_code,
 	    MPS_FW_DIAG_TYPE_RELEASE);
 	return (status);
 }
 
 static int
 mps_do_diag_action(struct mps_softc *sc, uint32_t action, uint8_t *diag_action,
     uint32_t length, uint32_t *return_code)
 {
 	mps_fw_diag_register_t		diag_register;
 	mps_fw_diag_unregister_t	diag_unregister;
 	mps_fw_diag_query_t		diag_query;
 	mps_diag_read_buffer_t		diag_read_buffer;
 	mps_fw_diag_release_t		diag_release;
 	int				status = MPS_DIAG_SUCCESS;
 	uint32_t			original_return_code;
 
 	original_return_code = *return_code;
 	*return_code = MPS_FW_DIAG_ERROR_SUCCESS;
 
 	switch (action) {
 		case MPS_FW_DIAG_TYPE_REGISTER:
 			if (!length) {
 				*return_code =
 				    MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPS_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_register,
 			    sizeof(diag_register)) != 0)
 				return (MPS_DIAG_FAILURE);
 			status = mps_diag_register(sc, &diag_register,
 			    return_code);
 			break;
 
 		case MPS_FW_DIAG_TYPE_UNREGISTER:
 			if (length < sizeof(diag_unregister)) {
 				*return_code =
 				    MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPS_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_unregister,
 			    sizeof(diag_unregister)) != 0)
 				return (MPS_DIAG_FAILURE);
 			status = mps_diag_unregister(sc, &diag_unregister,
 			    return_code);
 			break;
 
 		case MPS_FW_DIAG_TYPE_QUERY:
 			if (length < sizeof (diag_query)) {
 				*return_code =
 				    MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPS_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_query, sizeof(diag_query))
 			    != 0)
 				return (MPS_DIAG_FAILURE);
 			status = mps_diag_query(sc, &diag_query, return_code);
 			if (status == MPS_DIAG_SUCCESS)
 				if (copyout(&diag_query, diag_action,
 				    sizeof (diag_query)) != 0)
 					return (MPS_DIAG_FAILURE);
 			break;
 
 		case MPS_FW_DIAG_TYPE_READ_BUFFER:
 			if (copyin(diag_action, &diag_read_buffer,
 			    sizeof(diag_read_buffer)) != 0)
 				return (MPS_DIAG_FAILURE);
 			if (length < diag_read_buffer.BytesToRead) {
 				*return_code =
 				    MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPS_DIAG_FAILURE;
 				break;
 			}
 			status = mps_diag_read_buffer(sc, &diag_read_buffer,
 			    PTRIN(diag_read_buffer.PtrDataBuffer),
 			    return_code);
 			if (status == MPS_DIAG_SUCCESS) {
 				if (copyout(&diag_read_buffer, diag_action,
 				    sizeof(diag_read_buffer) -
 				    sizeof(diag_read_buffer.PtrDataBuffer)) !=
 				    0)
 					return (MPS_DIAG_FAILURE);
 			}
 			break;
 
 		case MPS_FW_DIAG_TYPE_RELEASE:
 			if (length < sizeof(diag_release)) {
 				*return_code =
 				    MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 				status = MPS_DIAG_FAILURE;
 				break;
 			}
 			if (copyin(diag_action, &diag_release,
 			    sizeof(diag_release)) != 0)
 				return (MPS_DIAG_FAILURE);
 			status = mps_diag_release(sc, &diag_release,
 			    return_code);
 			break;
 
 		default:
 			*return_code = MPS_FW_DIAG_ERROR_INVALID_PARAMETER;
 			status = MPS_DIAG_FAILURE;
 			break;
 	}
 
 	if ((status == MPS_DIAG_FAILURE) &&
 	    (original_return_code == MPS_FW_DIAG_NEW) &&
 	    (*return_code != MPS_FW_DIAG_ERROR_SUCCESS))
 		status = MPS_DIAG_SUCCESS;
 
 	return (status);
 }
 
 static int
 mps_user_diag_action(struct mps_softc *sc, mps_diag_action_t *data)
 {
 	int			status;
 
 	/*
 	 * Only allow one diag action at one time.
 	 */
 	if (sc->mps_flags & MPS_FLAGS_BUSY) {
 		mps_dprint(sc, MPS_USER, "%s: Only one FW diag command "
 		    "allowed at a single time.", __func__);
 		return (EBUSY);
 	}
 	sc->mps_flags |= MPS_FLAGS_BUSY;
 
 	/*
 	 * Send diag action request
 	 */
 	if (data->Action == MPS_FW_DIAG_TYPE_REGISTER ||
 	    data->Action == MPS_FW_DIAG_TYPE_UNREGISTER ||
 	    data->Action == MPS_FW_DIAG_TYPE_QUERY ||
 	    data->Action == MPS_FW_DIAG_TYPE_READ_BUFFER ||
 	    data->Action == MPS_FW_DIAG_TYPE_RELEASE) {
 		status = mps_do_diag_action(sc, data->Action,
 		    PTRIN(data->PtrDiagAction), data->Length,
 		    &data->ReturnCode);
 	} else
 		status = EINVAL;
 
 	sc->mps_flags &= ~MPS_FLAGS_BUSY;
 	return (status);
 }
 
 /*
  * Copy the event recording mask and the event queue size out.  For
  * clarification, the event recording mask (events_to_record) is not the same
  * thing as the event mask (event_mask).  events_to_record has a bit set for
  * every event type that is to be recorded by the driver, and event_mask has a
  * bit cleared for every event that is allowed into the driver from the IOC.
  * They really have nothing to do with each other.
  */
 static void
 mps_user_event_query(struct mps_softc *sc, mps_event_query_t *data)
 {
 	uint8_t	i;
 
 	mps_lock(sc);
 	data->Entries = MPS_EVENT_QUEUE_SIZE;
 
 	for (i = 0; i < 4; i++) {
 		data->Types[i] = sc->events_to_record[i];
 	}
 	mps_unlock(sc);
 }
 
 /*
  * Set the driver's event mask according to what's been given.  See
  * mps_user_event_query for explanation of the event recording mask and the IOC
  * event mask.  It's the app's responsibility to enable event logging by setting
  * the bits in events_to_record.  Initially, no events will be logged.
  */
 static void
 mps_user_event_enable(struct mps_softc *sc, mps_event_enable_t *data)
 {
 	uint8_t	i;
 
 	mps_lock(sc);
 	for (i = 0; i < 4; i++) {
 		sc->events_to_record[i] = data->Types[i];
 	}
 	mps_unlock(sc);
 }
 
 /*
  * Copy out the events that have been recorded, up to the max events allowed.
  */
 static int
 mps_user_event_report(struct mps_softc *sc, mps_event_report_t *data)
 {
 	int		status = 0;
 	uint32_t	size;
 
 	mps_lock(sc);
 	size = data->Size;
 	if ((size >= sizeof(sc->recorded_events)) && (status == 0)) {
 		mps_unlock(sc);
 		if (copyout((void *)sc->recorded_events,
 		    PTRIN(data->PtrEvents), size) != 0)
 			status = EFAULT;
 		mps_lock(sc);
 	} else {
 		/*
 		 * data->Size value is not large enough to copy event data.
 		 */
 		status = EFAULT;
 	}
 
 	/*
 	 * Change size value to match the number of bytes that were copied.
 	 */
 	if (status == 0)
 		data->Size = sizeof(sc->recorded_events);
 	mps_unlock(sc);
 
 	return (status);
 }
 
 /*
  * Record events into the driver from the IOC if they are not masked.
  */
 void
 mpssas_record_event(struct mps_softc *sc,
     MPI2_EVENT_NOTIFICATION_REPLY *event_reply)
 {
 	uint32_t	event;
 	int		i, j;
 	uint16_t	event_data_len;
 	boolean_t	sendAEN = FALSE;
 
 	event = event_reply->Event;
 
 	/*
 	 * Generate a system event to let anyone who cares know that a
 	 * LOG_ENTRY_ADDED event has occurred.  This is sent no matter what the
 	 * event mask is set to.
 	 */
 	if (event == MPI2_EVENT_LOG_ENTRY_ADDED) {
 		sendAEN = TRUE;
 	}
 
 	/*
 	 * Record the event only if its corresponding bit is set in
 	 * events_to_record.  event_index is the index into recorded_events and
 	 * event_number is the overall number of an event being recorded since
 	 * start-of-day.  event_index will roll over; event_number will never
 	 * roll over.
 	 */
 	i = (uint8_t)(event / 32);
 	j = (uint8_t)(event % 32);
 	if ((i < 4) && ((1 << j) & sc->events_to_record[i])) {
 		i = sc->event_index;
 		sc->recorded_events[i].Type = event;
 		sc->recorded_events[i].Number = ++sc->event_number;
 		bzero(sc->recorded_events[i].Data, MPS_MAX_EVENT_DATA_LENGTH *
 		    4);
 		event_data_len = event_reply->EventDataLength;
 
 		if (event_data_len > 0) {
 			/*
 			 * Limit data to size in m_event entry
 			 */
 			if (event_data_len > MPS_MAX_EVENT_DATA_LENGTH) {
 				event_data_len = MPS_MAX_EVENT_DATA_LENGTH;
 			}
 			for (j = 0; j < event_data_len; j++) {
 				sc->recorded_events[i].Data[j] =
 				    event_reply->EventData[j];
 			}
 
 			/*
 			 * check for index wrap-around
 			 */
 			if (++i == MPS_EVENT_QUEUE_SIZE) {
 				i = 0;
 			}
 			sc->event_index = (uint8_t)i;
 
 			/*
 			 * Set flag to send the event.
 			 */
 			sendAEN = TRUE;
 		}
 	}
 
 	/*
 	 * Generate a system event if flag is set to let anyone who cares know
 	 * that an event has occurred.
 	 */
 	if (sendAEN) {
 //SLM-how to send a system event (see kqueue, kevent)
 //		(void) ddi_log_sysevent(mpt->m_dip, DDI_VENDOR_LSI, "MPT_SAS",
 //		    "SAS", NULL, NULL, DDI_NOSLEEP);
 	}
 }
 
 static int
 mps_user_reg_access(struct mps_softc *sc, mps_reg_access_t *data)
 {
 	int	status = 0;
 
 	switch (data->Command) {
 		/*
 		 * IO access is not supported.
 		 */
 		case REG_IO_READ:
 		case REG_IO_WRITE:
 			mps_dprint(sc, MPS_USER, "IO access is not supported. "
 			    "Use memory access.");
 			status = EINVAL;
 			break;
 
 		case REG_MEM_READ:
 			data->RegData = mps_regread(sc, data->RegOffset);
 			break;
 
 		case REG_MEM_WRITE:
 			mps_regwrite(sc, data->RegOffset, data->RegData);
 			break;
 
 		default:
 			status = EINVAL;
 			break;
 	}
 
 	return (status);
 }
 
 static int
 mps_user_btdh(struct mps_softc *sc, mps_btdh_mapping_t *data)
 {
 	uint8_t		bt2dh = FALSE;
 	uint8_t		dh2bt = FALSE;
 	uint16_t	dev_handle, bus, target;
 
 	bus = data->Bus;
 	target = data->TargetID;
 	dev_handle = data->DevHandle;
 
 	/*
 	 * When DevHandle is 0xFFFF and Bus/Target are not 0xFFFF, use Bus/
 	 * Target to get DevHandle.  When Bus/Target are 0xFFFF and DevHandle is
 	 * not 0xFFFF, use DevHandle to get Bus/Target.  Anything else is
 	 * invalid.
 	 */
 	if ((bus == 0xFFFF) && (target == 0xFFFF) && (dev_handle != 0xFFFF))
 		dh2bt = TRUE;
 	if ((dev_handle == 0xFFFF) && (bus != 0xFFFF) && (target != 0xFFFF))
 		bt2dh = TRUE;
 	if (!dh2bt && !bt2dh)
 		return (EINVAL);
 
 	/*
 	 * Only handle bus of 0.  Make sure target is within range.
 	 */
 	if (bt2dh) {
 		if (bus != 0)
 			return (EINVAL);
 
 		if (target > sc->max_devices) {
 			mps_dprint(sc, MPS_FAULT, "Target ID is out of range "
 			   "for Bus/Target to DevHandle mapping.");
 			return (EINVAL);
 		}
 		dev_handle = sc->mapping_table[target].dev_handle;
 		if (dev_handle)
 			data->DevHandle = dev_handle;
 	} else {
 		bus = 0;
 		target = mps_mapping_get_tid_from_handle(sc, dev_handle);
 		data->Bus = bus;
 		data->TargetID = target;
 	}
 
 	return (0);
 }
 
 static int
 mps_ioctl(struct cdev *dev, u_long cmd, void *arg, int flag,
     struct thread *td)
 {
 	struct mps_softc *sc;
 	struct mps_cfg_page_req *page_req;
 	struct mps_ext_cfg_page_req *ext_page_req;
 	void *mps_page;
 	int error, msleep_ret;
 
 	mps_page = NULL;
 	sc = dev->si_drv1;
 	page_req = (void *)arg;
 	ext_page_req = (void *)arg;
 
 	switch (cmd) {
 	case MPSIO_READ_CFG_HEADER:
 		mps_lock(sc);
 		error = mps_user_read_cfg_header(sc, page_req);
 		mps_unlock(sc);
 		break;
 	case MPSIO_READ_CFG_PAGE:
 		mps_page = malloc(page_req->len, M_MPSUSER, M_WAITOK | M_ZERO);
 		error = copyin(page_req->buf, mps_page,
 		    sizeof(MPI2_CONFIG_PAGE_HEADER));
 		if (error)
 			break;
 		mps_lock(sc);
 		error = mps_user_read_cfg_page(sc, page_req, mps_page);
 		mps_unlock(sc);
 		if (error)
 			break;
 		error = copyout(mps_page, page_req->buf, page_req->len);
 		break;
 	case MPSIO_READ_EXT_CFG_HEADER:
 		mps_lock(sc);
 		error = mps_user_read_extcfg_header(sc, ext_page_req);
 		mps_unlock(sc);
 		break;
 	case MPSIO_READ_EXT_CFG_PAGE:
 		mps_page = malloc(ext_page_req->len, M_MPSUSER, M_WAITOK|M_ZERO);
 		error = copyin(ext_page_req->buf, mps_page,
 		    sizeof(MPI2_CONFIG_EXTENDED_PAGE_HEADER));
 		if (error)
 			break;
 		mps_lock(sc);
 		error = mps_user_read_extcfg_page(sc, ext_page_req, mps_page);
 		mps_unlock(sc);
 		if (error)
 			break;
 		error = copyout(mps_page, ext_page_req->buf, ext_page_req->len);
 		break;
 	case MPSIO_WRITE_CFG_PAGE:
 		mps_page = malloc(page_req->len, M_MPSUSER, M_WAITOK|M_ZERO);
 		error = copyin(page_req->buf, mps_page, page_req->len);
 		if (error)
 			break;
 		mps_lock(sc);
 		error = mps_user_write_cfg_page(sc, page_req, mps_page);
 		mps_unlock(sc);
 		break;
 	case MPSIO_MPS_COMMAND:
 		error = mps_user_command(sc, (struct mps_usr_command *)arg);
 		break;
 	case MPTIOCTL_PASS_THRU:
 		/*
 		 * The user has requested to pass through a command to be
 		 * executed by the MPT firmware.  Call our routine which does
 		 * this.  Only allow one passthru IOCTL at one time.
 		 */
 		error = mps_user_pass_thru(sc, (mps_pass_thru_t *)arg);
 		break;
 	case MPTIOCTL_GET_ADAPTER_DATA:
 		/*
 		 * The user has requested to read adapter data.  Call our
 		 * routine which does this.
 		 */
 		error = 0;
 		mps_user_get_adapter_data(sc, (mps_adapter_data_t *)arg);
 		break;
 	case MPTIOCTL_GET_PCI_INFO:
 		/*
 		 * The user has requested to read pci info.  Call
 		 * our routine which does this.
 		 */
 		mps_lock(sc);
 		error = 0;
 		mps_user_read_pci_info(sc, (mps_pci_info_t *)arg);
 		mps_unlock(sc);
 		break;
 	case MPTIOCTL_RESET_ADAPTER:
 		mps_lock(sc);
 		sc->port_enable_complete = 0;
 		uint32_t reinit_start = time_uptime;
 		error = mps_reinit(sc);
 		/* Sleep for 300 second. */
 		msleep_ret = msleep(&sc->port_enable_complete, &sc->mps_mtx, PRIBIO,
 		       "mps_porten", 300 * hz);
 		mps_unlock(sc);
 		if (msleep_ret)
 			printf("Port Enable did not complete after Diag "
 			    "Reset msleep error %d.\n", msleep_ret);
 		else
 			mps_dprint(sc, MPS_USER,
 				"Hard Reset with Port Enable completed in %d seconds.\n",
 				 (uint32_t) (time_uptime - reinit_start));
 		break;
 	case MPTIOCTL_DIAG_ACTION:
 		/*
 		 * The user has done a diag buffer action.  Call our routine
 		 * which does this.  Only allow one diag action at one time.
 		 */
 		mps_lock(sc);
 		error = mps_user_diag_action(sc, (mps_diag_action_t *)arg);
 		mps_unlock(sc);
 		break;
 	case MPTIOCTL_EVENT_QUERY:
 		/*
 		 * The user has done an event query. Call our routine which does
 		 * this.
 		 */
 		error = 0;
 		mps_user_event_query(sc, (mps_event_query_t *)arg);
 		break;
 	case MPTIOCTL_EVENT_ENABLE:
 		/*
 		 * The user has done an event enable. Call our routine which
 		 * does this.
 		 */
 		error = 0;
 		mps_user_event_enable(sc, (mps_event_enable_t *)arg);
 		break;
 	case MPTIOCTL_EVENT_REPORT:
 		/*
 		 * The user has done an event report. Call our routine which
 		 * does this.
 		 */
 		error = mps_user_event_report(sc, (mps_event_report_t *)arg);
 		break;
 	case MPTIOCTL_REG_ACCESS:
 		/*
 		 * The user has requested register access.  Call our routine
 		 * which does this.
 		 */
 		mps_lock(sc);
 		error = mps_user_reg_access(sc, (mps_reg_access_t *)arg);
 		mps_unlock(sc);
 		break;
 	case MPTIOCTL_BTDH_MAPPING:
 		/*
 		 * The user has requested to translate a bus/target to a
 		 * DevHandle or a DevHandle to a bus/target.  Call our routine
 		 * which does this.
 		 */
 		error = mps_user_btdh(sc, (mps_btdh_mapping_t *)arg);
 		break;
 	default:
 		error = ENOIOCTL;
 		break;
 	}
 
 	if (mps_page != NULL)
 		free(mps_page, M_MPSUSER);
 
 	return (error);
 }
 
 #ifdef COMPAT_FREEBSD32
 
 struct mps_cfg_page_req32 {
 	MPI2_CONFIG_PAGE_HEADER header;
 	uint32_t page_address;
 	uint32_t buf;
 	int	len;	
 	uint16_t ioc_status;
 };
 
 struct mps_ext_cfg_page_req32 {
 	MPI2_CONFIG_EXTENDED_PAGE_HEADER header;
 	uint32_t page_address;
 	uint32_t buf;
 	int	len;
 	uint16_t ioc_status;
 };
 
 struct mps_raid_action32 {
 	uint8_t action;
 	uint8_t volume_bus;
 	uint8_t volume_id;
 	uint8_t phys_disk_num;
 	uint32_t action_data_word;
 	uint32_t buf;
 	int len;
 	uint32_t volume_status;
 	uint32_t action_data[4];
 	uint16_t action_status;
 	uint16_t ioc_status;
 	uint8_t write;
 };
 
 struct mps_usr_command32 {
 	uint32_t req;
 	uint32_t req_len;
 	uint32_t rpl;
 	uint32_t rpl_len;
 	uint32_t buf;
 	int len;
 	uint32_t flags;
 };
 
 #define	MPSIO_READ_CFG_HEADER32	_IOWR('M', 200, struct mps_cfg_page_req32)
 #define	MPSIO_READ_CFG_PAGE32	_IOWR('M', 201, struct mps_cfg_page_req32)
 #define	MPSIO_READ_EXT_CFG_HEADER32 _IOWR('M', 202, struct mps_ext_cfg_page_req32)
 #define	MPSIO_READ_EXT_CFG_PAGE32 _IOWR('M', 203, struct mps_ext_cfg_page_req32)
 #define	MPSIO_WRITE_CFG_PAGE32	_IOWR('M', 204, struct mps_cfg_page_req32)
 #define	MPSIO_RAID_ACTION32	_IOWR('M', 205, struct mps_raid_action32)
 #define	MPSIO_MPS_COMMAND32	_IOWR('M', 210, struct mps_usr_command32)
 
 static int
 mps_ioctl32(struct cdev *dev, u_long cmd32, void *_arg, int flag,
     struct thread *td)
 {
 	struct mps_cfg_page_req32 *page32 = _arg;
 	struct mps_ext_cfg_page_req32 *ext32 = _arg;
 	struct mps_raid_action32 *raid32 = _arg;
 	struct mps_usr_command32 *user32 = _arg;
 	union {
 		struct mps_cfg_page_req page;
 		struct mps_ext_cfg_page_req ext;
 		struct mps_raid_action raid;
 		struct mps_usr_command user;
 	} arg;
 	u_long cmd;
 	int error;
 
 	switch (cmd32) {
 	case MPSIO_READ_CFG_HEADER32:
 	case MPSIO_READ_CFG_PAGE32:
 	case MPSIO_WRITE_CFG_PAGE32:
 		if (cmd32 == MPSIO_READ_CFG_HEADER32)
 			cmd = MPSIO_READ_CFG_HEADER;
 		else if (cmd32 == MPSIO_READ_CFG_PAGE32)
 			cmd = MPSIO_READ_CFG_PAGE;
 		else
 			cmd = MPSIO_WRITE_CFG_PAGE;
 		CP(*page32, arg.page, header);
 		CP(*page32, arg.page, page_address);
 		PTRIN_CP(*page32, arg.page, buf);
 		CP(*page32, arg.page, len);
 		CP(*page32, arg.page, ioc_status);
 		break;
 
 	case MPSIO_READ_EXT_CFG_HEADER32:
 	case MPSIO_READ_EXT_CFG_PAGE32:
 		if (cmd32 == MPSIO_READ_EXT_CFG_HEADER32)
 			cmd = MPSIO_READ_EXT_CFG_HEADER;
 		else
 			cmd = MPSIO_READ_EXT_CFG_PAGE;
 		CP(*ext32, arg.ext, header);
 		CP(*ext32, arg.ext, page_address);
 		PTRIN_CP(*ext32, arg.ext, buf);
 		CP(*ext32, arg.ext, len);
 		CP(*ext32, arg.ext, ioc_status);
 		break;
 
 	case MPSIO_RAID_ACTION32:
 		cmd = MPSIO_RAID_ACTION;
 		CP(*raid32, arg.raid, action);
 		CP(*raid32, arg.raid, volume_bus);
 		CP(*raid32, arg.raid, volume_id);
 		CP(*raid32, arg.raid, phys_disk_num);
 		CP(*raid32, arg.raid, action_data_word);
 		PTRIN_CP(*raid32, arg.raid, buf);
 		CP(*raid32, arg.raid, len);
 		CP(*raid32, arg.raid, volume_status);
 		bcopy(raid32->action_data, arg.raid.action_data,
 		    sizeof arg.raid.action_data);
 		CP(*raid32, arg.raid, ioc_status);
 		CP(*raid32, arg.raid, write);
 		break;
 
 	case MPSIO_MPS_COMMAND32:
 		cmd = MPSIO_MPS_COMMAND;
 		PTRIN_CP(*user32, arg.user, req);
 		CP(*user32, arg.user, req_len);
 		PTRIN_CP(*user32, arg.user, rpl);
 		CP(*user32, arg.user, rpl_len);
 		PTRIN_CP(*user32, arg.user, buf);
 		CP(*user32, arg.user, len);
 		CP(*user32, arg.user, flags);
 		break;
 	default:
 		return (ENOIOCTL);
 	}
 
 	error = mps_ioctl(dev, cmd, &arg, flag, td);
 	if (error == 0 && (cmd32 & IOC_OUT) != 0) {
 		switch (cmd32) {
 		case MPSIO_READ_CFG_HEADER32:
 		case MPSIO_READ_CFG_PAGE32:
 		case MPSIO_WRITE_CFG_PAGE32:
 			CP(arg.page, *page32, header);
 			CP(arg.page, *page32, page_address);
 			PTROUT_CP(arg.page, *page32, buf);
 			CP(arg.page, *page32, len);
 			CP(arg.page, *page32, ioc_status);
 			break;
 
 		case MPSIO_READ_EXT_CFG_HEADER32:
 		case MPSIO_READ_EXT_CFG_PAGE32:
 			CP(arg.ext, *ext32, header);
 			CP(arg.ext, *ext32, page_address);
 			PTROUT_CP(arg.ext, *ext32, buf);
 			CP(arg.ext, *ext32, len);
 			CP(arg.ext, *ext32, ioc_status);
 			break;
 
 		case MPSIO_RAID_ACTION32:
 			CP(arg.raid, *raid32, action);
 			CP(arg.raid, *raid32, volume_bus);
 			CP(arg.raid, *raid32, volume_id);
 			CP(arg.raid, *raid32, phys_disk_num);
 			CP(arg.raid, *raid32, action_data_word);
 			PTROUT_CP(arg.raid, *raid32, buf);
 			CP(arg.raid, *raid32, len);
 			CP(arg.raid, *raid32, volume_status);
 			bcopy(arg.raid.action_data, raid32->action_data,
 			    sizeof arg.raid.action_data);
 			CP(arg.raid, *raid32, ioc_status);
 			CP(arg.raid, *raid32, write);
 			break;
 
 		case MPSIO_MPS_COMMAND32:
 			PTROUT_CP(arg.user, *user32, req);
 			CP(arg.user, *user32, req_len);
 			PTROUT_CP(arg.user, *user32, rpl);
 			CP(arg.user, *user32, rpl_len);
 			PTROUT_CP(arg.user, *user32, buf);
 			CP(arg.user, *user32, len);
 			CP(arg.user, *user32, flags);
 			break;
 		}
 	}
 
 	return (error);
 }
 #endif /* COMPAT_FREEBSD32 */
 
 static int
 mps_ioctl_devsw(struct cdev *dev, u_long com, caddr_t arg, int flag,
     struct thread *td)
 {
 #ifdef COMPAT_FREEBSD32
 	if (SV_CURPROC_FLAG(SV_ILP32))
 		return (mps_ioctl32(dev, com, arg, flag, td));
 #endif
 	return (mps_ioctl(dev, com, arg, flag, td));
 }
Index: head/sys/kern/subr_bus_dma.c
===================================================================
--- head/sys/kern/subr_bus_dma.c	(revision 365705)
+++ head/sys/kern/subr_bus_dma.c	(revision 365706)
@@ -1,702 +1,787 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 2012 EMC Corp.
  * All rights reserved.
  *
  * Copyright (c) 1997, 1998 Justin T. Gibbs.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include "opt_bus.h"
 
 #include <sys/param.h>
 #include <sys/conf.h>
 #include <sys/systm.h>
 #include <sys/bio.h>
 #include <sys/bus.h>
 #include <sys/callout.h>
 #include <sys/ktr.h>
 #include <sys/mbuf.h>
 #include <sys/memdesc.h>
 #include <sys/proc.h>
 #include <sys/uio.h>
 
 #include <vm/vm.h>
 #include <vm/vm_page.h>
 #include <vm/vm_map.h>
 #include <vm/pmap.h>
 
 #include <cam/cam.h>
 #include <cam/cam_ccb.h>
 
 #include <opencrypto/cryptodev.h>
 
 #include <machine/bus.h>
 
 /*
  * Load up data starting at offset within a region specified by a
  * list of virtual address ranges until either length or the region
  * are exhausted.
  */
 static int
 _bus_dmamap_load_vlist(bus_dma_tag_t dmat, bus_dmamap_t map,
     bus_dma_segment_t *list, int sglist_cnt, struct pmap *pmap, int *nsegs,
     int flags, size_t offset, size_t length)
 {
 	int error;
 
 	error = 0;
 	for (; sglist_cnt > 0 && length != 0; sglist_cnt--, list++) {
 		char *addr;
 		size_t ds_len;
 
 		KASSERT((offset < list->ds_len),
 		    ("Invalid mid-segment offset"));
 		addr = (char *)(uintptr_t)list->ds_addr + offset;
 		ds_len = list->ds_len - offset;
 		offset = 0;
 		if (ds_len > length)
 			ds_len = length;
 		length -= ds_len;
 		KASSERT((ds_len != 0), ("Segment length is zero"));
 		error = _bus_dmamap_load_buffer(dmat, map, addr, ds_len, pmap,
 		    flags, NULL, nsegs);
 		if (error)
 			break;
 	}
 	return (error);
 }
 
 /*
  * Load a list of physical addresses.
  */
 static int
 _bus_dmamap_load_plist(bus_dma_tag_t dmat, bus_dmamap_t map,
     bus_dma_segment_t *list, int sglist_cnt, int *nsegs, int flags)
 {
 	int error;
 
 	error = 0;
 	for (; sglist_cnt > 0; sglist_cnt--, list++) {
 		error = _bus_dmamap_load_phys(dmat, map,
 		    (vm_paddr_t)list->ds_addr, list->ds_len, flags, NULL,
 		    nsegs);
 		if (error)
 			break;
 	}
 	return (error);
 }
 
 /*
  * Load an unmapped mbuf
  */
 static int
 _bus_dmamap_load_mbuf_epg(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct mbuf *m, bus_dma_segment_t *segs, int *nsegs, int flags)
 {
 	int error, i, off, len, pglen, pgoff, seglen, segoff;
 
 	M_ASSERTEXTPG(m);
 
 	len = m->m_len;
 	error = 0;
 
 	/* Skip over any data removed from the front. */
 	off = mtod(m, vm_offset_t);
 
 	if (m->m_epg_hdrlen != 0) {
 		if (off >= m->m_epg_hdrlen) {
 			off -= m->m_epg_hdrlen;
 		} else {
 			seglen = m->m_epg_hdrlen - off;
 			segoff = off;
 			seglen = min(seglen, len);
 			off = 0;
 			len -= seglen;
 			error = _bus_dmamap_load_buffer(dmat, map,
 			    &m->m_epg_hdr[segoff], seglen, kernel_pmap,
 			    flags, segs, nsegs);
 		}
 	}
 	pgoff = m->m_epg_1st_off;
 	for (i = 0; i < m->m_epg_npgs && error == 0 && len > 0; i++) {
 		pglen = m_epg_pagelen(m, i, pgoff);
 		if (off >= pglen) {
 			off -= pglen;
 			pgoff = 0;
 			continue;
 		}
 		seglen = pglen - off;
 		segoff = pgoff + off;
 		off = 0;
 		seglen = min(seglen, len);
 		len -= seglen;
 		error = _bus_dmamap_load_phys(dmat, map,
 		    m->m_epg_pa[i] + segoff, seglen, flags, segs, nsegs);
 		pgoff = 0;
 	};
 	if (len != 0 && error == 0) {
 		KASSERT((off + len) <= m->m_epg_trllen,
 		    ("off + len > trail (%d + %d > %d)", off, len,
 		    m->m_epg_trllen));
 		error = _bus_dmamap_load_buffer(dmat, map,
 		    &m->m_epg_trail[off], len, kernel_pmap, flags, segs,
 		    nsegs);
 	}
 	return (error);
 }
 
 /*
  * Load an mbuf chain.
  */
 static int
 _bus_dmamap_load_mbuf_sg(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct mbuf *m0, bus_dma_segment_t *segs, int *nsegs, int flags)
 {
 	struct mbuf *m;
 	int error;
 
 	error = 0;
 	for (m = m0; m != NULL && error == 0; m = m->m_next) {
 		if (m->m_len > 0) {
 			if ((m->m_flags & M_EXTPG) != 0)
 				error = _bus_dmamap_load_mbuf_epg(dmat,
 				    map, m, segs, nsegs, flags);
 			else
 				error = _bus_dmamap_load_buffer(dmat, map,
 				    m->m_data, m->m_len, kernel_pmap,
 				    flags | BUS_DMA_LOAD_MBUF, segs, nsegs);
 		}
 	}
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, *nsegs);
 	return (error);
 }
 
 /*
  * Load from block io.
  */
 static int
 _bus_dmamap_load_bio(bus_dma_tag_t dmat, bus_dmamap_t map, struct bio *bio,
     int *nsegs, int flags)
 {
 
 	if ((bio->bio_flags & BIO_VLIST) != 0) {
 		bus_dma_segment_t *segs = (bus_dma_segment_t *)bio->bio_data;
 		return (_bus_dmamap_load_vlist(dmat, map, segs, bio->bio_ma_n,
 		    kernel_pmap, nsegs, flags, bio->bio_ma_offset,
 		    bio->bio_bcount));
 	}
 
 	if ((bio->bio_flags & BIO_UNMAPPED) != 0)
 		return (_bus_dmamap_load_ma(dmat, map, bio->bio_ma,
 		    bio->bio_bcount, bio->bio_ma_offset, flags, NULL, nsegs));
 
 	return (_bus_dmamap_load_buffer(dmat, map, bio->bio_data,
 	    bio->bio_bcount, kernel_pmap, flags, NULL, nsegs));
 }
 
 int
 bus_dmamap_load_ma_triv(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct vm_page **ma, bus_size_t tlen, int ma_offs, int flags,
     bus_dma_segment_t *segs, int *segp)
 {
 	vm_paddr_t paddr;
 	bus_size_t len;
 	int error, i;
 
 	error = 0;
 	for (i = 0; tlen > 0; i++, tlen -= len) {
 		len = min(PAGE_SIZE - ma_offs, tlen);
 		paddr = VM_PAGE_TO_PHYS(ma[i]) + ma_offs;
 		error = _bus_dmamap_load_phys(dmat, map, paddr, len,
 		    flags, segs, segp);
 		if (error != 0)
 			break;
 		ma_offs = 0;
 	}
 	return (error);
 }
 
 /*
  * Load a cam control block.
  */
 static int
 _bus_dmamap_load_ccb(bus_dma_tag_t dmat, bus_dmamap_t map, union ccb *ccb,
 		    int *nsegs, int flags)
 {
 	struct ccb_hdr *ccb_h;
 	void *data_ptr;
 	int error;
 	uint32_t dxfer_len;
 	uint16_t sglist_cnt;
 
 	error = 0;
 	ccb_h = &ccb->ccb_h;
 	switch (ccb_h->func_code) {
 	case XPT_SCSI_IO: {
 		struct ccb_scsiio *csio;
 
 		csio = &ccb->csio;
 		data_ptr = csio->data_ptr;
 		dxfer_len = csio->dxfer_len;
 		sglist_cnt = csio->sglist_cnt;
 		break;
 	}
 	case XPT_CONT_TARGET_IO: {
 		struct ccb_scsiio *ctio;
 
 		ctio = &ccb->ctio;
 		data_ptr = ctio->data_ptr;
 		dxfer_len = ctio->dxfer_len;
 		sglist_cnt = ctio->sglist_cnt;
 		break;
 	}
 	case XPT_ATA_IO: {
 		struct ccb_ataio *ataio;
 
 		ataio = &ccb->ataio;
 		data_ptr = ataio->data_ptr;
 		dxfer_len = ataio->dxfer_len;
 		sglist_cnt = 0;
 		break;
 	}
 	case XPT_NVME_IO:
 	case XPT_NVME_ADMIN: {
 		struct ccb_nvmeio *nvmeio;
 
 		nvmeio = &ccb->nvmeio;
 		data_ptr = nvmeio->data_ptr;
 		dxfer_len = nvmeio->dxfer_len;
 		sglist_cnt = nvmeio->sglist_cnt;
 		break;
 	}
 	default:
 		panic("_bus_dmamap_load_ccb: Unsupported func code %d",
 		    ccb_h->func_code);
 	}
 
 	switch ((ccb_h->flags & CAM_DATA_MASK)) {
 	case CAM_DATA_VADDR:
 		error = _bus_dmamap_load_buffer(dmat, map, data_ptr, dxfer_len,
 		    kernel_pmap, flags, NULL, nsegs);
 		break;
 	case CAM_DATA_PADDR:
 		error = _bus_dmamap_load_phys(dmat, map,
 		    (vm_paddr_t)(uintptr_t)data_ptr, dxfer_len, flags, NULL,
 		    nsegs);
 		break;
 	case CAM_DATA_SG:
 		error = _bus_dmamap_load_vlist(dmat, map,
 		    (bus_dma_segment_t *)data_ptr, sglist_cnt, kernel_pmap,
 		    nsegs, flags, 0, dxfer_len);
 		break;
 	case CAM_DATA_SG_PADDR:
 		error = _bus_dmamap_load_plist(dmat, map,
 		    (bus_dma_segment_t *)data_ptr, sglist_cnt, nsegs, flags);
 		break;
 	case CAM_DATA_BIO:
 		error = _bus_dmamap_load_bio(dmat, map, (struct bio *)data_ptr,
 		    nsegs, flags);
 		break;
 	default:
 		panic("_bus_dmamap_load_ccb: flags 0x%X unimplemented",
 		    ccb_h->flags);
 	}
 	return (error);
 }
 
 /*
  * Load a uio.
  */
 static int
 _bus_dmamap_load_uio(bus_dma_tag_t dmat, bus_dmamap_t map, struct uio *uio,
     int *nsegs, int flags)
 {
 	bus_size_t resid;
 	bus_size_t minlen;
 	struct iovec *iov;
 	pmap_t pmap;
 	caddr_t addr;
 	int error, i;
 
 	if (uio->uio_segflg == UIO_USERSPACE) {
 		KASSERT(uio->uio_td != NULL,
 			("bus_dmamap_load_uio: USERSPACE but no proc"));
 		pmap = vmspace_pmap(uio->uio_td->td_proc->p_vmspace);
 	} else
 		pmap = kernel_pmap;
 	resid = uio->uio_resid;
 	iov = uio->uio_iov;
 	error = 0;
 
 	for (i = 0; i < uio->uio_iovcnt && resid != 0 && !error; i++) {
 		/*
 		 * Now at the first iovec to load.  Load each iovec
 		 * until we have exhausted the residual count.
 		 */
 
 		addr = (caddr_t) iov[i].iov_base;
 		minlen = resid < iov[i].iov_len ? resid : iov[i].iov_len;
 		if (minlen > 0) {
 			error = _bus_dmamap_load_buffer(dmat, map, addr,
 			    minlen, pmap, flags, NULL, nsegs);
 			resid -= minlen;
 		}
 	}
 
 	return (error);
 }
 
 /*
  * Map the buffer buf into bus space using the dmamap map.
  */
 int
 bus_dmamap_load(bus_dma_tag_t dmat, bus_dmamap_t map, void *buf,
     bus_size_t buflen, bus_dmamap_callback_t *callback,
     void *callback_arg, int flags)
 {
 	bus_dma_segment_t *segs;
 	struct memdesc mem;
 	int error;
 	int nsegs;
 
 	if ((flags & BUS_DMA_NOWAIT) == 0) {
 		mem = memdesc_vaddr(buf, buflen);
 		_bus_dmamap_waitok(dmat, map, &mem, callback, callback_arg);
 	}
 
 	nsegs = -1;
 	error = _bus_dmamap_load_buffer(dmat, map, buf, buflen, kernel_pmap,
 	    flags, NULL, &nsegs);
 	nsegs++;
 
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, nsegs);
 
 	if (error == EINPROGRESS)
 		return (error);
 
 	segs = _bus_dmamap_complete(dmat, map, NULL, nsegs, error);
 	if (error)
 		(*callback)(callback_arg, segs, 0, error);
 	else
 		(*callback)(callback_arg, segs, nsegs, 0);
 
 	/*
 	 * Return ENOMEM to the caller so that it can pass it up the stack.
 	 * This error only happens when NOWAIT is set, so deferral is disabled.
 	 */
 	if (error == ENOMEM)
 		return (error);
 
 	return (0);
 }
 
 int
 bus_dmamap_load_mbuf(bus_dma_tag_t dmat, bus_dmamap_t map, struct mbuf *m0,
     bus_dmamap_callback2_t *callback, void *callback_arg, int flags)
 {
 	bus_dma_segment_t *segs;
 	int nsegs, error;
 
 	M_ASSERTPKTHDR(m0);
 
 	flags |= BUS_DMA_NOWAIT;
 	nsegs = -1;
 	error = _bus_dmamap_load_mbuf_sg(dmat, map, m0, NULL, &nsegs, flags);
 	++nsegs;
 
 	segs = _bus_dmamap_complete(dmat, map, NULL, nsegs, error);
 	if (error)
 		(*callback)(callback_arg, segs, 0, 0, error);
 	else
 		(*callback)(callback_arg, segs, nsegs, m0->m_pkthdr.len, error);
 
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, nsegs);
 	return (error);
 }
 
 int
 bus_dmamap_load_mbuf_sg(bus_dma_tag_t dmat, bus_dmamap_t map, struct mbuf *m0,
     bus_dma_segment_t *segs, int *nsegs, int flags)
 {
 	int error;
 
 	flags |= BUS_DMA_NOWAIT;
 	*nsegs = -1;
 	error = _bus_dmamap_load_mbuf_sg(dmat, map, m0, segs, nsegs, flags);
 	++*nsegs;
 	_bus_dmamap_complete(dmat, map, segs, *nsegs, error);
 	return (error);
 }
 
 int
 bus_dmamap_load_uio(bus_dma_tag_t dmat, bus_dmamap_t map, struct uio *uio,
     bus_dmamap_callback2_t *callback, void *callback_arg, int flags)
 {
 	bus_dma_segment_t *segs;
 	int nsegs, error;
 
 	flags |= BUS_DMA_NOWAIT;
 	nsegs = -1;
 	error = _bus_dmamap_load_uio(dmat, map, uio, &nsegs, flags);
 	nsegs++;
 
 	segs = _bus_dmamap_complete(dmat, map, NULL, nsegs, error);
 	if (error)
 		(*callback)(callback_arg, segs, 0, 0, error);
 	else
 		(*callback)(callback_arg, segs, nsegs, uio->uio_resid, error);
 
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, nsegs);
 	return (error);
 }
 
 int
 bus_dmamap_load_ccb(bus_dma_tag_t dmat, bus_dmamap_t map, union ccb *ccb,
 		    bus_dmamap_callback_t *callback, void *callback_arg,
 		    int flags)
 {
 	bus_dma_segment_t *segs;
 	struct ccb_hdr *ccb_h;
 	struct memdesc mem;
 	int error;
 	int nsegs;
 
 	ccb_h = &ccb->ccb_h;
 	if ((ccb_h->flags & CAM_DIR_MASK) == CAM_DIR_NONE) {
 		callback(callback_arg, NULL, 0, 0);
 		return (0);
 	}
 	if ((flags & BUS_DMA_NOWAIT) == 0) {
 		mem = memdesc_ccb(ccb);
 		_bus_dmamap_waitok(dmat, map, &mem, callback, callback_arg);
 	}
 	nsegs = -1;
 	error = _bus_dmamap_load_ccb(dmat, map, ccb, &nsegs, flags);
 	nsegs++;
 
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, nsegs);
 
 	if (error == EINPROGRESS)
 		return (error);
 
 	segs = _bus_dmamap_complete(dmat, map, NULL, nsegs, error);
 	if (error)
 		(*callback)(callback_arg, segs, 0, error);
 	else
 		(*callback)(callback_arg, segs, nsegs, error);
 	/*
 	 * Return ENOMEM to the caller so that it can pass it up the stack.
 	 * This error only happens when NOWAIT is set, so deferral is disabled.
 	 */
 	if (error == ENOMEM)
 		return (error);
 
 	return (0);
 }
 
 int
 bus_dmamap_load_bio(bus_dma_tag_t dmat, bus_dmamap_t map, struct bio *bio,
 		    bus_dmamap_callback_t *callback, void *callback_arg,
 		    int flags)
 {
 	bus_dma_segment_t *segs;
 	struct memdesc mem;
 	int error;
 	int nsegs;
 
 	if ((flags & BUS_DMA_NOWAIT) == 0) {
 		mem = memdesc_bio(bio);
 		_bus_dmamap_waitok(dmat, map, &mem, callback, callback_arg);
 	}
 	nsegs = -1;
 	error = _bus_dmamap_load_bio(dmat, map, bio, &nsegs, flags);
 	nsegs++;
 
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, nsegs);
 
 	if (error == EINPROGRESS)
 		return (error);
 
 	segs = _bus_dmamap_complete(dmat, map, NULL, nsegs, error);
 	if (error)
 		(*callback)(callback_arg, segs, 0, error);
 	else
 		(*callback)(callback_arg, segs, nsegs, error);
 	/*
 	 * Return ENOMEM to the caller so that it can pass it up the stack.
 	 * This error only happens when NOWAIT is set, so deferral is disabled.
 	 */
 	if (error == ENOMEM)
 		return (error);
 
 	return (0);
 }
 
 int
 bus_dmamap_load_mem(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct memdesc *mem, bus_dmamap_callback_t *callback,
     void *callback_arg, int flags)
 {
 	bus_dma_segment_t *segs;
 	int error;
 	int nsegs;
 
 	if ((flags & BUS_DMA_NOWAIT) == 0)
 		_bus_dmamap_waitok(dmat, map, mem, callback, callback_arg);
 
 	nsegs = -1;
 	error = 0;
 	switch (mem->md_type) {
 	case MEMDESC_VADDR:
 		error = _bus_dmamap_load_buffer(dmat, map, mem->u.md_vaddr,
 		    mem->md_opaque, kernel_pmap, flags, NULL, &nsegs);
 		break;
 	case MEMDESC_PADDR:
 		error = _bus_dmamap_load_phys(dmat, map, mem->u.md_paddr,
 		    mem->md_opaque, flags, NULL, &nsegs);
 		break;
 	case MEMDESC_VLIST:
 		error = _bus_dmamap_load_vlist(dmat, map, mem->u.md_list,
 		    mem->md_opaque, kernel_pmap, &nsegs, flags, 0, SIZE_T_MAX);
 		break;
 	case MEMDESC_PLIST:
 		error = _bus_dmamap_load_plist(dmat, map, mem->u.md_list,
 		    mem->md_opaque, &nsegs, flags);
 		break;
 	case MEMDESC_BIO:
 		error = _bus_dmamap_load_bio(dmat, map, mem->u.md_bio,
 		    &nsegs, flags);
 		break;
 	case MEMDESC_UIO:
 		error = _bus_dmamap_load_uio(dmat, map, mem->u.md_uio,
 		    &nsegs, flags);
 		break;
 	case MEMDESC_MBUF:
 		error = _bus_dmamap_load_mbuf_sg(dmat, map, mem->u.md_mbuf,
 		    NULL, &nsegs, flags);
 		break;
 	case MEMDESC_CCB:
 		error = _bus_dmamap_load_ccb(dmat, map, mem->u.md_ccb, &nsegs,
 		    flags);
 		break;
 	}
 	nsegs++;
 
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, nsegs);
 
 	if (error == EINPROGRESS)
 		return (error);
 
 	segs = _bus_dmamap_complete(dmat, map, NULL, nsegs, error);
 	if (error)
 		(*callback)(callback_arg, segs, 0, error);
 	else
 		(*callback)(callback_arg, segs, nsegs, 0);
 
 	/*
 	 * Return ENOMEM to the caller so that it can pass it up the stack.
 	 * This error only happens when NOWAIT is set, so deferral is disabled.
 	 */
 	if (error == ENOMEM)
 		return (error);
 
 	return (0);
 }
 
 int
 bus_dmamap_load_crp_buffer(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct crypto_buffer *cb, bus_dmamap_callback_t *callback,
     void *callback_arg, int flags)
 {
 	bus_dma_segment_t *segs;
 	int error;
 	int nsegs;
 
 	flags |= BUS_DMA_NOWAIT;
 	nsegs = -1;
 	error = 0;
 	switch (cb->cb_type) {
 	case CRYPTO_BUF_CONTIG:
 		error = _bus_dmamap_load_buffer(dmat, map, cb->cb_buf,
 		    cb->cb_buf_len, kernel_pmap, flags, NULL, &nsegs);
 		break;
 	case CRYPTO_BUF_MBUF:
 		error = _bus_dmamap_load_mbuf_sg(dmat, map, cb->cb_mbuf,
 		    NULL, &nsegs, flags);
 		break;
 	case CRYPTO_BUF_UIO:
 		error = _bus_dmamap_load_uio(dmat, map, cb->cb_uio, &nsegs,
 		    flags);
 		break;
 	case CRYPTO_BUF_VMPAGE:
 		error = _bus_dmamap_load_ma(dmat, map, cb->cb_vm_page,
 		    cb->cb_vm_page_len, cb->cb_vm_page_offset, flags, NULL,
 		    &nsegs);
 		break;
 	default:
 		error = EINVAL;
 	}
 	nsegs++;
 
 	CTR5(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d nsegs %d",
 	    __func__, dmat, flags, error, nsegs);
 
 	if (error == EINPROGRESS)
 		return (error);
 
 	segs = _bus_dmamap_complete(dmat, map, NULL, nsegs, error);
 	if (error)
 		(*callback)(callback_arg, segs, 0, error);
 	else
 		(*callback)(callback_arg, segs, nsegs, 0);
 
 	/*
 	 * Return ENOMEM to the caller so that it can pass it up the stack.
 	 * This error only happens when NOWAIT is set, so deferral is disabled.
 	 */
 	if (error == ENOMEM)
 		return (error);
 
 	return (0);
 }
 
 int
 bus_dmamap_load_crp(bus_dma_tag_t dmat, bus_dmamap_t map, struct cryptop *crp,
     bus_dmamap_callback_t *callback, void *callback_arg, int flags)
 {
 	return (bus_dmamap_load_crp_buffer(dmat, map, &crp->crp_buf, callback,
 	    callback_arg, flags));
 }
+
+void
+bus_dma_template_init(bus_dma_template_t *t, bus_dma_tag_t parent)
+{
+
+	if (t == NULL)
+		return;
+
+	t->parent = parent;
+	t->alignment = 1;
+	t->boundary = 0;
+	t->lowaddr = t->highaddr = BUS_SPACE_MAXADDR;
+	t->maxsize = t->maxsegsize = BUS_SPACE_MAXSIZE;
+	t->nsegments = BUS_SPACE_UNRESTRICTED;
+	t->lockfunc = NULL;
+	t->lockfuncarg = NULL;
+	t->flags = 0;
+}
+
+int
+bus_dma_template_tag(bus_dma_template_t *t, bus_dma_tag_t *dmat)
+{
+
+	if (t == NULL || dmat == NULL)
+		return (EINVAL);
+
+	return (bus_dma_tag_create(t->parent, t->alignment, t->boundary,
+	    t->lowaddr, t->highaddr, NULL, NULL, t->maxsize,
+	    t->nsegments, t->maxsegsize, t->flags, t->lockfunc, t->lockfuncarg,
+	    dmat));
+}
+
+void
+bus_dma_template_fill(bus_dma_template_t *t, bus_dma_param_t *kv, u_int count)
+{
+	bus_dma_param_t *pkv;
+
+	while (count) {
+		pkv = &kv[--count];
+		switch (pkv->key) {
+		case BD_PARAM_PARENT:
+			t->parent = pkv->ptr;
+			break;
+		case BD_PARAM_ALIGNMENT:
+			t->alignment = pkv->num;
+			break;
+		case BD_PARAM_BOUNDARY:
+			t->boundary = pkv->num;
+			break;
+		case BD_PARAM_LOWADDR:
+			t->lowaddr = pkv->pa;
+			break;
+		case BD_PARAM_HIGHADDR:
+			t->highaddr = pkv->pa;
+			break;
+		case BD_PARAM_MAXSIZE:
+			t->maxsize = pkv->num;
+			break;
+		case BD_PARAM_NSEGMENTS:
+			t->nsegments = pkv->num;
+			break;
+		case BD_PARAM_MAXSEGSIZE:
+			t->maxsegsize = pkv->num;
+			break;
+		case BD_PARAM_FLAGS:
+			t->flags = pkv->num;
+			break;
+		case BD_PARAM_LOCKFUNC:
+			t->lockfunc = pkv->ptr;
+			break;
+		case BD_PARAM_LOCKFUNCARG:
+			t->lockfuncarg = pkv->ptr;
+			break;
+		case BD_PARAM_NAME:
+			t->name = pkv->ptr;
+			break;
+		case BD_PARAM_INVALID:
+		default:
+			KASSERT(0, ("Invalid key %d\n", pkv->key));
+			break;
+		}
+	}
+	return;
+}
+
Index: head/sys/mips/mips/busdma_machdep.c
===================================================================
--- head/sys/mips/mips/busdma_machdep.c	(revision 365705)
+++ head/sys/mips/mips/busdma_machdep.c	(revision 365706)
@@ -1,1570 +1,1539 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 2006 Oleksandr Tymoshenko
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions, and the following disclaimer,
  *    without modification, immediately at the beginning of the file.
  * 2. The name of the author may not be used to endorse or promote products
  *    derived from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  *  From i386/busdma_machdep.c,v 1.26 2002/04/19 22:58:09 alfred
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 /*
  * MIPS bus dma support routines
  */
 
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/malloc.h>
 #include <sys/bus.h>
 #include <sys/busdma_bufalloc.h>
 #include <sys/interrupt.h>
 #include <sys/lock.h>
 #include <sys/proc.h>
 #include <sys/memdesc.h>
 #include <sys/mutex.h>
 #include <sys/ktr.h>
 #include <sys/kernel.h>
 #include <sys/sysctl.h>
 #include <sys/uio.h>
 
 #include <vm/uma.h>
 #include <vm/vm.h>
 #include <vm/vm_extern.h>
 #include <vm/vm_kern.h>
 #include <vm/vm_page.h>
 #include <vm/vm_phys.h>
 #include <vm/vm_map.h>
 
 #include <machine/atomic.h>
 #include <machine/bus.h>
 #include <machine/cache.h>
 #include <machine/cpufunc.h>
 #include <machine/cpuinfo.h>
 #include <machine/md_var.h>
 
 #define MAX_BPAGES 64
 #define BUS_DMA_COULD_BOUNCE	BUS_DMA_BUS3
 #define BUS_DMA_MIN_ALLOC_COMP	BUS_DMA_BUS4
 
 /*
  * On XBurst cores from Ingenic, cache-line writeback is local
  * only, unless accompanied by invalidation. Invalidations force
  * dirty line writeout and invalidation requests forwarded to
  * other cores if other cores have the cache line dirty.
  */
 #if defined(SMP) && defined(CPU_XBURST)
 #define	BUS_DMA_FORCE_WBINV
 #endif
 
 struct bounce_zone;
 
 struct bus_dma_tag {
 	bus_dma_tag_t		parent;
 	bus_size_t		alignment;
 	bus_addr_t		boundary;
 	bus_addr_t		lowaddr;
 	bus_addr_t		highaddr;
 	bus_dma_filter_t	*filter;
 	void			*filterarg;
 	bus_size_t		maxsize;
 	u_int			nsegments;
 	bus_size_t		maxsegsz;
 	int			flags;
 	int			ref_count;
 	int			map_count;
 	bus_dma_lock_t		*lockfunc;
 	void			*lockfuncarg;
 	bus_dma_segment_t	*segments;
 	struct bounce_zone *bounce_zone;
 };
 
 struct bounce_page {
 	vm_offset_t	vaddr;		/* kva of bounce buffer */
 	vm_offset_t	vaddr_nocache;	/* kva of bounce buffer uncached */
 	bus_addr_t	busaddr;	/* Physical address */
 	vm_offset_t	datavaddr;	/* kva of client data */
 	bus_addr_t	dataaddr;	/* client physical address */
 	bus_size_t	datacount;	/* client data count */
 	STAILQ_ENTRY(bounce_page) links;
 };
 
 struct sync_list {
 	vm_offset_t	vaddr;		/* kva of bounce buffer */
 	bus_addr_t	busaddr;	/* Physical address */
 	bus_size_t	datacount;	/* client data count */
 };
 
 int busdma_swi_pending;
 
 struct bounce_zone {
 	STAILQ_ENTRY(bounce_zone) links;
 	STAILQ_HEAD(bp_list, bounce_page) bounce_page_list;
 	int		total_bpages;
 	int		free_bpages;
 	int		reserved_bpages;
 	int		active_bpages;
 	int		total_bounced;
 	int		total_deferred;
 	int		map_count;
 	bus_size_t	alignment;
 	bus_addr_t	lowaddr;
 	char		zoneid[8];
 	char		lowaddrid[20];
 	struct sysctl_ctx_list sysctl_tree;
 	struct sysctl_oid *sysctl_tree_top;
 };
 
 static struct mtx bounce_lock;
 static int total_bpages;
 static int busdma_zonecount;
 static STAILQ_HEAD(, bounce_zone) bounce_zone_list;
 
 static SYSCTL_NODE(_hw, OID_AUTO, busdma, CTLFLAG_RD, 0,
     "Busdma parameters");
 SYSCTL_INT(_hw_busdma, OID_AUTO, total_bpages, CTLFLAG_RD, &total_bpages, 0,
 	   "Total bounce pages");
 
 #define DMAMAP_UNCACHEABLE	0x08
 #define DMAMAP_CACHE_ALIGNED	0x10
 
 struct bus_dmamap {
 	struct bp_list	bpages;
 	int		pagesneeded;
 	int		pagesreserved;
 	bus_dma_tag_t	dmat;
 	struct memdesc	mem;
 	int		flags;
 	TAILQ_ENTRY(bus_dmamap)	freelist;
 	STAILQ_ENTRY(bus_dmamap) links;
 	bus_dmamap_callback_t *callback;
 	void		*callback_arg;
 	int		sync_count;
 	struct sync_list *slist;
 };
 
 static STAILQ_HEAD(, bus_dmamap) bounce_map_waitinglist;
 static STAILQ_HEAD(, bus_dmamap) bounce_map_callbacklist;
 
 static void init_bounce_pages(void *dummy);
 static int alloc_bounce_zone(bus_dma_tag_t dmat);
 static int alloc_bounce_pages(bus_dma_tag_t dmat, u_int numpages);
 static int reserve_bounce_pages(bus_dma_tag_t dmat, bus_dmamap_t map,
 				int commit);
 static bus_addr_t add_bounce_page(bus_dma_tag_t dmat, bus_dmamap_t map,
 				  vm_offset_t vaddr, bus_addr_t addr,
 				  bus_size_t size);
 static void free_bounce_page(bus_dma_tag_t dmat, struct bounce_page *bpage);
 
 /* Default tag, as most drivers provide no parent tag. */
 bus_dma_tag_t mips_root_dma_tag;
 
 static uma_zone_t dmamap_zone;	/* Cache of struct bus_dmamap items */
 
 static busdma_bufalloc_t coherent_allocator;	/* Cache of coherent buffers */
 static busdma_bufalloc_t standard_allocator;	/* Cache of standard buffers */
 
 MALLOC_DEFINE(M_BUSDMA, "busdma", "busdma metadata");
 MALLOC_DEFINE(M_BOUNCE, "bounce", "busdma bounce pages");
 
 /*
  * This is the ctor function passed to uma_zcreate() for the pool of dma maps.
  * It'll need platform-specific changes if this code is copied.
  */
 static int
 dmamap_ctor(void *mem, int size, void *arg, int flags)
 {
 	bus_dmamap_t map;
 	bus_dma_tag_t dmat;
 
 	map = (bus_dmamap_t)mem;
 	dmat = (bus_dma_tag_t)arg;
 
 	dmat->map_count++;
 
 	bzero(map, sizeof(*map));
 	map->dmat = dmat;
 	STAILQ_INIT(&map->bpages);
 
 	return (0);
 }
 
 /*
  * This is the dtor function passed to uma_zcreate() for the pool of dma maps.
  * It may need platform-specific changes if this code is copied              .
  */
 static void
 dmamap_dtor(void *mem, int size, void *arg)
 {
 	bus_dmamap_t map;
 
 	map = (bus_dmamap_t)mem;
 
 	map->dmat->map_count--;
 }
 
 static void
 busdma_init(void *dummy)
 {
 
 	/* Create a cache of maps for bus_dmamap_create(). */
 	dmamap_zone = uma_zcreate("dma maps", sizeof(struct bus_dmamap),
 	    dmamap_ctor, dmamap_dtor, NULL, NULL, UMA_ALIGN_PTR, 0);
 
 	/* Create a cache of buffers in standard (cacheable) memory. */
 	standard_allocator = busdma_bufalloc_create("buffer",
 	    mips_dcache_max_linesize,	/* minimum_alignment */
 	    NULL,			/* uma_alloc func */
 	    NULL,			/* uma_free func */
 	    0);				/* uma_zcreate_flags */
 
 	/*
 	 * Create a cache of buffers in uncacheable memory, to implement the
 	 * BUS_DMA_COHERENT flag.
 	 */
 	coherent_allocator = busdma_bufalloc_create("coherent",
 	    mips_dcache_max_linesize,	/* minimum_alignment */
 	    busdma_bufalloc_alloc_uncacheable,
 	    busdma_bufalloc_free_uncacheable,
 	    0);				/* uma_zcreate_flags */
 }
 SYSINIT(busdma, SI_SUB_KMEM, SI_ORDER_FOURTH, busdma_init, NULL);
 
 /*
  * Return true if a match is made.
  *
  * To find a match walk the chain of bus_dma_tag_t's looking for 'paddr'.
  *
  * If paddr is within the bounds of the dma tag then call the filter callback
  * to check for a match, if there is no filter callback then assume a match.
  */
 static int
 run_filter(bus_dma_tag_t dmat, bus_addr_t paddr)
 {
 	int retval;
 
 	retval = 0;
 
 	do {
 		if (((paddr > dmat->lowaddr && paddr <= dmat->highaddr)
 		 || ((paddr & (dmat->alignment - 1)) != 0))
 		 && (dmat->filter == NULL
 		  || (*dmat->filter)(dmat->filterarg, paddr) != 0))
 			retval = 1;
 
 		dmat = dmat->parent;
 	} while (retval == 0 && dmat != NULL);
 	return (retval);
 }
 
 /*
  * Check to see if the specified page is in an allowed DMA range.
  */
 
 static __inline int
 _bus_dma_can_bounce(vm_offset_t lowaddr, vm_offset_t highaddr)
 {
 	int i;
 	for (i = 0; phys_avail[i] && phys_avail[i + 1]; i += 2) {
 		if ((lowaddr >= phys_avail[i] && lowaddr <= phys_avail[i + 1])
 		    || (lowaddr < phys_avail[i] &&
 		    highaddr > phys_avail[i]))
 			return (1);
 	}
 	return (0);
 }
 
 /*
  * Convenience function for manipulating driver locks from busdma (during
  * busdma_swi, for example).  Drivers that don't provide their own locks
  * should specify &Giant to dmat->lockfuncarg.  Drivers that use their own
  * non-mutex locking scheme don't have to use this at all.
  */
 void
 busdma_lock_mutex(void *arg, bus_dma_lock_op_t op)
 {
 	struct mtx *dmtx;
 
 	dmtx = (struct mtx *)arg;
 	switch (op) {
 	case BUS_DMA_LOCK:
 		mtx_lock(dmtx);
 		break;
 	case BUS_DMA_UNLOCK:
 		mtx_unlock(dmtx);
 		break;
 	default:
 		panic("Unknown operation 0x%x for busdma_lock_mutex!", op);
 	}
 }
 
 /*
  * dflt_lock should never get called.  It gets put into the dma tag when
  * lockfunc == NULL, which is only valid if the maps that are associated
  * with the tag are meant to never be defered.
  * XXX Should have a way to identify which driver is responsible here.
  */
 static void
 dflt_lock(void *arg, bus_dma_lock_op_t op)
 {
 #ifdef INVARIANTS
 	panic("driver error: busdma dflt_lock called");
 #else
 	printf("DRIVER_ERROR: busdma dflt_lock called\n");
 #endif
 }
 
 static __inline bus_dmamap_t
 _busdma_alloc_dmamap(bus_dma_tag_t dmat)
 {
 	struct sync_list *slist;
 	bus_dmamap_t map;
 
 	slist = malloc(sizeof(*slist) * dmat->nsegments, M_BUSDMA, M_NOWAIT);
 	if (slist == NULL)
 		return (NULL);
 	map = uma_zalloc_arg(dmamap_zone, dmat, M_NOWAIT);
 	if (map != NULL)
 		map->slist = slist;
 	else
 		free(slist, M_BUSDMA);
 	return (map);
 }
 
 static __inline void
 _busdma_free_dmamap(bus_dmamap_t map)
 {
 
 	free(map->slist, M_BUSDMA);
 	uma_zfree(dmamap_zone, map);
 }
 
 /*
  * Allocate a device specific dma_tag.
  */
 #define SEG_NB 1024
 
 int
 bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
     bus_addr_t boundary, bus_addr_t lowaddr,
     bus_addr_t highaddr, bus_dma_filter_t *filter,
     void *filterarg, bus_size_t maxsize, int nsegments,
     bus_size_t maxsegsz, int flags, bus_dma_lock_t *lockfunc,
     void *lockfuncarg, bus_dma_tag_t *dmat)
 {
 	bus_dma_tag_t newtag;
 	int error = 0;
 	/* Return a NULL tag on failure */
 	*dmat = NULL;
 	if (!parent)
 		parent = mips_root_dma_tag;
 
 	newtag = (bus_dma_tag_t)malloc(sizeof(*newtag), M_BUSDMA, M_NOWAIT);
 	if (newtag == NULL) {
 		CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 		    __func__, newtag, 0, error);
 		return (ENOMEM);
 	}
 
 	newtag->parent = parent;
 	newtag->alignment = alignment;
 	newtag->boundary = boundary;
 	newtag->lowaddr = trunc_page((vm_offset_t)lowaddr) + (PAGE_SIZE - 1);
 	newtag->highaddr = trunc_page((vm_offset_t)highaddr) + (PAGE_SIZE - 1);
 	newtag->filter = filter;
 	newtag->filterarg = filterarg;
 	newtag->maxsize = maxsize;
 	newtag->nsegments = nsegments;
 	newtag->maxsegsz = maxsegsz;
 	newtag->flags = flags;
 	if (cpuinfo.cache_coherent_dma)
 		newtag->flags |= BUS_DMA_COHERENT;
 	newtag->ref_count = 1; /* Count ourself */
 	newtag->map_count = 0;
 	if (lockfunc != NULL) {
 		newtag->lockfunc = lockfunc;
 		newtag->lockfuncarg = lockfuncarg;
 	} else {
 		newtag->lockfunc = dflt_lock;
 		newtag->lockfuncarg = NULL;
 	}
 	newtag->segments = NULL;
 
 	/*
 	 * Take into account any restrictions imposed by our parent tag
 	 */
 	if (parent != NULL) {
 		newtag->lowaddr = MIN(parent->lowaddr, newtag->lowaddr);
 		newtag->highaddr = MAX(parent->highaddr, newtag->highaddr);
 		if (newtag->boundary == 0)
 			newtag->boundary = parent->boundary;
 		else if (parent->boundary != 0)
 			newtag->boundary =
 			    MIN(parent->boundary, newtag->boundary);
 		if ((newtag->filter != NULL) ||
 		    ((parent->flags & BUS_DMA_COULD_BOUNCE) != 0))
 			newtag->flags |= BUS_DMA_COULD_BOUNCE;
 		if (newtag->filter == NULL) {
 			/*
 			* Short circuit looking at our parent directly
 			* since we have encapsulated all of its information
 			*/
 			newtag->filter = parent->filter;
 			newtag->filterarg = parent->filterarg;
 			newtag->parent = parent->parent;
 		}
 		if (newtag->parent != NULL)
 			atomic_add_int(&parent->ref_count, 1);
 	}
 	if (_bus_dma_can_bounce(newtag->lowaddr, newtag->highaddr)
 	 || newtag->alignment > 1)
 		newtag->flags |= BUS_DMA_COULD_BOUNCE;
 
 	if (((newtag->flags & BUS_DMA_COULD_BOUNCE) != 0) &&
 	    (flags & BUS_DMA_ALLOCNOW) != 0) {
 		struct bounce_zone *bz;
 
 		/* Must bounce */
 
 		if ((error = alloc_bounce_zone(newtag)) != 0) {
 			free(newtag, M_BUSDMA);
 			return (error);
 		}
 		bz = newtag->bounce_zone;
 
 		if (ptoa(bz->total_bpages) < maxsize) {
 			int pages;
 
 			pages = atop(maxsize) - bz->total_bpages;
 
 			/* Add pages to our bounce pool */
 			if (alloc_bounce_pages(newtag, pages) < pages)
 				error = ENOMEM;
 		}
 		/* Performed initial allocation */
 		newtag->flags |= BUS_DMA_MIN_ALLOC_COMP;
 	} else
 		newtag->bounce_zone = NULL;
 	if (error != 0)
 		free(newtag, M_BUSDMA);
 	else
 		*dmat = newtag;
 	CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 	    __func__, newtag, (newtag != NULL ? newtag->flags : 0), error);
 
 	return (error);
 }
 
 void
-bus_dma_template_init(bus_dma_tag_template_t *t, bus_dma_tag_t parent)
-{
-
-	if (t == NULL)
-		return;
-
-	t->parent = parent;
-	t->alignment = 1;
-	t->boundary = 0;
-	t->lowaddr = t->highaddr = BUS_SPACE_MAXADDR;
-	t->maxsize = t->maxsegsize = BUS_SPACE_MAXSIZE;
-	t->nsegments = BUS_SPACE_UNRESTRICTED;
-	t->lockfunc = NULL;
-	t->lockfuncarg = NULL;
-	t->flags = 0;
-}
-
-int
-bus_dma_template_tag(bus_dma_tag_template_t *t, bus_dma_tag_t *dmat)
-{
-
-	if (t == NULL || dmat == NULL)
-		return (EINVAL);
-
-	return (bus_dma_tag_create(t->parent, t->alignment, t->boundary,
-	    t->lowaddr, t->highaddr, NULL, NULL, t->maxsize,
-	    t->nsegments, t->maxsegsize, t->flags, t->lockfunc, t->lockfuncarg,
-	    dmat));
-}
-
-void
-bus_dma_template_clone(bus_dma_tag_template_t *t, bus_dma_tag_t dmat)
+bus_dma_template_clone(bus_dma_template_t *t, bus_dma_tag_t dmat)
 {
 
 	if (t == NULL || dmat == NULL)
 		return;
 
 	t->parent = dmat->parent;
 	t->alignment = dmat->alignment;
 	t->boundary = dmat->boundary;
 	t->lowaddr = dmat->lowaddr;
 	t->highaddr = dmat->highaddr;
 	t->maxsize = dmat->maxsize;
 	t->nsegments = dmat->nsegments;
 	t->maxsegsize = dmat->maxsegsz;
 	t->flags = dmat->flags;
 	t->lockfunc = dmat->lockfunc;
 	t->lockfuncarg = dmat->lockfuncarg;
 }
 
 int
 bus_dma_tag_set_domain(bus_dma_tag_t dmat, int domain)
 {
 
 	return (0);
 }
 
 int
 bus_dma_tag_destroy(bus_dma_tag_t dmat)
 {
 #ifdef KTR
 	bus_dma_tag_t dmat_copy = dmat;
 #endif
 
 	if (dmat != NULL) {
 		if (dmat->map_count != 0)
 			return (EBUSY);
 
 		while (dmat != NULL) {
 			bus_dma_tag_t parent;
 
 			parent = dmat->parent;
 			atomic_subtract_int(&dmat->ref_count, 1);
 			if (dmat->ref_count == 0) {
 				if (dmat->segments != NULL)
 					free(dmat->segments, M_BUSDMA);
 				free(dmat, M_BUSDMA);
 				/*
 				 * Last reference count, so
 				 * release our reference
 				 * count on our parent.
 				 */
 				dmat = parent;
 			} else
 				dmat = NULL;
 		}
 	}
 	CTR2(KTR_BUSDMA, "%s tag %p", __func__, dmat_copy);
 
 	return (0);
 }
 
 #include <sys/kdb.h>
 /*
  * Allocate a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 int
 bus_dmamap_create(bus_dma_tag_t dmat, int flags, bus_dmamap_t *mapp)
 {
 	bus_dmamap_t newmap;
 	int error = 0;
 
 	if (dmat->segments == NULL) {
 		dmat->segments = (bus_dma_segment_t *)malloc(
 		    sizeof(bus_dma_segment_t) * dmat->nsegments, M_BUSDMA,
 		    M_NOWAIT);
 		if (dmat->segments == NULL) {
 			CTR3(KTR_BUSDMA, "%s: tag %p error %d",
 			    __func__, dmat, ENOMEM);
 			return (ENOMEM);
 		}
 	}
 
 	newmap = _busdma_alloc_dmamap(dmat);
 	if (newmap == NULL) {
 		CTR3(KTR_BUSDMA, "%s: tag %p error %d", __func__, dmat, ENOMEM);
 		return (ENOMEM);
 	}
 	*mapp = newmap;
 
 	/*
 	 * Bouncing might be required if the driver asks for an active
 	 * exclusion region, a data alignment that is stricter than 1, and/or
 	 * an active address boundary.
 	 */
 	if (dmat->flags & BUS_DMA_COULD_BOUNCE) {
 		/* Must bounce */
 		struct bounce_zone *bz;
 		int maxpages;
 
 		if (dmat->bounce_zone == NULL) {
 			if ((error = alloc_bounce_zone(dmat)) != 0) {
 				_busdma_free_dmamap(newmap);
 				*mapp = NULL;
 				return (error);
 			}
 		}
 		bz = dmat->bounce_zone;
 
 		/* Initialize the new map */
 		STAILQ_INIT(&((*mapp)->bpages));
 
 		/*
 		 * Attempt to add pages to our pool on a per-instance
 		 * basis up to a sane limit.
 		 */
 		maxpages = MAX_BPAGES;
 		if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0
 		 || (bz->map_count > 0 && bz->total_bpages < maxpages)) {
 			int pages;
 
 			pages = MAX(atop(dmat->maxsize), 1);
 			pages = MIN(maxpages - bz->total_bpages, pages);
 			pages = MAX(pages, 1);
 			if (alloc_bounce_pages(dmat, pages) < pages)
 				error = ENOMEM;
 
 			if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0) {
 				if (error == 0)
 					dmat->flags |= BUS_DMA_MIN_ALLOC_COMP;
 			} else {
 				error = 0;
 			}
 		}
 		bz->map_count++;
 	}
 
 	CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 	    __func__, dmat, dmat->flags, error);
 
 	return (0);
 }
 
 /*
  * Destroy a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 int
 bus_dmamap_destroy(bus_dma_tag_t dmat, bus_dmamap_t map)
 {
 
 	if (STAILQ_FIRST(&map->bpages) != NULL || map->sync_count != 0) {
 		CTR3(KTR_BUSDMA, "%s: tag %p error %d",
 		    __func__, dmat, EBUSY);
 		return (EBUSY);
 	}
 	if (dmat->bounce_zone)
 		dmat->bounce_zone->map_count--;
 	_busdma_free_dmamap(map);
 	CTR2(KTR_BUSDMA, "%s: tag %p error 0", __func__, dmat);
         return (0);
 }
 
 /*
  * Allocate a piece of memory that can be efficiently mapped into
  * bus device space based on the constraints lited in the dma tag.
  * A dmamap to for use with dmamap_load is also allocated.
  */
 int
 bus_dmamem_alloc(bus_dma_tag_t dmat, void** vaddrp, int flags,
     bus_dmamap_t *mapp)
 {
 	bus_dmamap_t newmap = NULL;
 	busdma_bufalloc_t ba;
 	struct busdma_bufzone *bufzone;
 	vm_memattr_t memattr;
 	void *vaddr;
 
 	int mflags;
 
 	if (flags & BUS_DMA_NOWAIT)
 		mflags = M_NOWAIT;
 	else
 		mflags = M_WAITOK;
 	if (dmat->segments == NULL) {
 		dmat->segments = (bus_dma_segment_t *)malloc(
 		    sizeof(bus_dma_segment_t) * dmat->nsegments, M_BUSDMA,
 		    mflags);
 		if (dmat->segments == NULL) {
 			CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 			    __func__, dmat, dmat->flags, ENOMEM);
 			return (ENOMEM);
 		}
 	}
 
 	newmap = _busdma_alloc_dmamap(dmat);
 	if (newmap == NULL) {
 		CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 		    __func__, dmat, dmat->flags, ENOMEM);
 		return (ENOMEM);
 	}
 
 	/*
 	 * If all the memory is coherent with DMA then we don't need to
 	 * do anything special for a coherent mapping request.
 	 */
 	if (dmat->flags & BUS_DMA_COHERENT)
 	    flags &= ~BUS_DMA_COHERENT;
 
 	if (flags & BUS_DMA_COHERENT) {
 		memattr = VM_MEMATTR_UNCACHEABLE;
 		ba = coherent_allocator;
 		newmap->flags |= DMAMAP_UNCACHEABLE;
 	} else {
 		memattr = VM_MEMATTR_DEFAULT;
 		ba = standard_allocator;
 	}
 	/* All buffers we allocate are cache-aligned. */
 	newmap->flags |= DMAMAP_CACHE_ALIGNED;
 
 	if (flags & BUS_DMA_ZERO)
 		mflags |= M_ZERO;
 
 	/*
 	 * Try to find a bufzone in the allocator that holds a cache of buffers
 	 * of the right size for this request.  If the buffer is too big to be
 	 * held in the allocator cache, this returns NULL.
 	 */
 	bufzone = busdma_bufalloc_findzone(ba, dmat->maxsize);
 
 	/*
 	 * Allocate the buffer from the uma(9) allocator if...
 	 *  - It's small enough to be in the allocator (bufzone not NULL).
 	 *  - The alignment constraint isn't larger than the allocation size
 	 *    (the allocator aligns buffers to their size boundaries).
 	 *  - There's no need to handle lowaddr/highaddr exclusion zones.
 	 * else allocate non-contiguous pages if...
 	 *  - The page count that could get allocated doesn't exceed
 	 *    nsegments also when the maximum segment size is less
 	 *    than PAGE_SIZE.
 	 *  - The alignment constraint isn't larger than a page boundary.
 	 *  - There are no boundary-crossing constraints.
 	 * else allocate a block of contiguous pages because one or more of the
 	 * constraints is something that only the contig allocator can fulfill.
 	 */
 	if (bufzone != NULL && dmat->alignment <= bufzone->size &&
 	    !_bus_dma_can_bounce(dmat->lowaddr, dmat->highaddr)) {
 		vaddr = uma_zalloc(bufzone->umazone, mflags);
 	} else if (dmat->nsegments >=
 	    howmany(dmat->maxsize, MIN(dmat->maxsegsz, PAGE_SIZE)) &&
 	    dmat->alignment <= PAGE_SIZE &&
 	    (dmat->boundary % PAGE_SIZE) == 0) {
 		vaddr = (void *)kmem_alloc_attr(dmat->maxsize, mflags, 0,
 		    dmat->lowaddr, memattr);
 	} else {
 		vaddr = (void *)kmem_alloc_contig(dmat->maxsize, mflags, 0,
 		    dmat->lowaddr, dmat->alignment, dmat->boundary, memattr);
 	}
 	if (vaddr == NULL) {
 		_busdma_free_dmamap(newmap);
 		newmap = NULL;
 	} else {
 		newmap->sync_count = 0;
 	}
 	*vaddrp = vaddr;
 	*mapp = newmap;
 
 	return (vaddr == NULL ? ENOMEM : 0);
 }
 
 /*
  * Free a piece of memory and it's allocated dmamap, that was allocated
  * via bus_dmamem_alloc.  Make the same choice for free/contigfree.
  */
 void
 bus_dmamem_free(bus_dma_tag_t dmat, void *vaddr, bus_dmamap_t map)
 {
 	struct busdma_bufzone *bufzone;
 	busdma_bufalloc_t ba;
 
 	if (map->flags & DMAMAP_UNCACHEABLE)
 		ba = coherent_allocator;
 	else
 		ba = standard_allocator;
 
 	free(map->slist, M_BUSDMA);
 	uma_zfree(dmamap_zone, map);
 
 	bufzone = busdma_bufalloc_findzone(ba, dmat->maxsize);
 
 	if (bufzone != NULL && dmat->alignment <= bufzone->size &&
 	    !_bus_dma_can_bounce(dmat->lowaddr, dmat->highaddr))
 		uma_zfree(bufzone->umazone, vaddr);
 	else
 		kmem_free((vm_offset_t)vaddr, dmat->maxsize);
 	CTR3(KTR_BUSDMA, "%s: tag %p flags 0x%x", __func__, dmat, dmat->flags);
 }
 
 static void
 _bus_dmamap_count_phys(bus_dma_tag_t dmat, bus_dmamap_t map, vm_paddr_t buf,
     bus_size_t buflen, int flags)
 {
 	bus_addr_t curaddr;
 	bus_size_t sgsize;
 
 	if (map->pagesneeded == 0) {
 		CTR3(KTR_BUSDMA, "lowaddr= %d, boundary= %d, alignment= %d",
 		    dmat->lowaddr, dmat->boundary, dmat->alignment);
 		CTR2(KTR_BUSDMA, "map= %p, pagesneeded= %d",
 		    map, map->pagesneeded);
 		/*
 		 * Count the number of bounce pages
 		 * needed in order to complete this transfer
 		 */
 		curaddr = buf;
 		while (buflen != 0) {
 			sgsize = MIN(buflen, dmat->maxsegsz);
 			if (run_filter(dmat, curaddr) != 0) {
 				sgsize = MIN(sgsize, PAGE_SIZE);
 				map->pagesneeded++;
 			}
 			curaddr += sgsize;
 			buflen -= sgsize;
 		}
 		CTR1(KTR_BUSDMA, "pagesneeded= %d\n", map->pagesneeded);
 	}
 }
 
 static void
 _bus_dmamap_count_pages(bus_dma_tag_t dmat, bus_dmamap_t map, pmap_t pmap,
     void *buf, bus_size_t buflen, int flags)
 {
 	vm_offset_t vaddr;
 	vm_offset_t vendaddr;
 	bus_addr_t paddr;
 
 	if (map->pagesneeded == 0) {
 		CTR3(KTR_BUSDMA, "lowaddr= %d, boundary= %d, alignment= %d",
 		    dmat->lowaddr, dmat->boundary, dmat->alignment);
 		CTR2(KTR_BUSDMA, "map= %p, pagesneeded= %d",
 		    map, map->pagesneeded);
 		/*
 		 * Count the number of bounce pages
 		 * needed in order to complete this transfer
 		 */
 		vaddr = (vm_offset_t)buf;
 		vendaddr = (vm_offset_t)buf + buflen;
 
 		while (vaddr < vendaddr) {
 			bus_size_t sg_len;
 
 			KASSERT(kernel_pmap == pmap, ("pmap is not kernel pmap"));
 			sg_len = PAGE_SIZE - ((vm_offset_t)vaddr & PAGE_MASK);
 			paddr = pmap_kextract(vaddr);
 			if (((dmat->flags & BUS_DMA_COULD_BOUNCE) != 0) &&
 			    run_filter(dmat, paddr) != 0) {
 				sg_len = roundup2(sg_len, dmat->alignment);
 				map->pagesneeded++;
 			}
 			vaddr += sg_len;
 		}
 		CTR1(KTR_BUSDMA, "pagesneeded= %d\n", map->pagesneeded);
 	}
 }
 
 static int
 _bus_dmamap_reserve_pages(bus_dma_tag_t dmat, bus_dmamap_t map,int flags)
 {
 
 	/* Reserve Necessary Bounce Pages */
 	mtx_lock(&bounce_lock);
 	if (flags & BUS_DMA_NOWAIT) {
 		if (reserve_bounce_pages(dmat, map, 0) != 0) {
 			mtx_unlock(&bounce_lock);
 			return (ENOMEM);
 		}
 	} else {
 		if (reserve_bounce_pages(dmat, map, 1) != 0) {
 			/* Queue us for resources */
 			STAILQ_INSERT_TAIL(&bounce_map_waitinglist,
 			    map, links);
 			mtx_unlock(&bounce_lock);
 			return (EINPROGRESS);
 		}
 	}
 	mtx_unlock(&bounce_lock);
 
 	return (0);
 }
 
 /*
  * Add a single contiguous physical range to the segment list.
  */
 static int
 _bus_dmamap_addseg(bus_dma_tag_t dmat, bus_dmamap_t map, bus_addr_t curaddr,
     bus_size_t sgsize, bus_dma_segment_t *segs, int *segp)
 {
 	bus_addr_t baddr, bmask;
 	int seg;
 
 	/*
 	 * Make sure we don't cross any boundaries.
 	 */
 	bmask = ~(dmat->boundary - 1);
 	if (dmat->boundary > 0) {
 		baddr = (curaddr + dmat->boundary) & bmask;
 		if (sgsize > (baddr - curaddr))
 			sgsize = (baddr - curaddr);
 	}
 	/*
 	 * Insert chunk into a segment, coalescing with
 	 * the previous segment if possible.
 	 */
 	seg = *segp;
 	if (seg >= 0 &&
 	    curaddr == segs[seg].ds_addr + segs[seg].ds_len &&
 	    (segs[seg].ds_len + sgsize) <= dmat->maxsegsz &&
 	    (dmat->boundary == 0 ||
 	     (segs[seg].ds_addr & bmask) == (curaddr & bmask))) {
 		segs[seg].ds_len += sgsize;
 	} else {
 		if (++seg >= dmat->nsegments)
 			return (0);
 		segs[seg].ds_addr = curaddr;
 		segs[seg].ds_len = sgsize;
 	}
 	*segp = seg;
 	return (sgsize);
 }
 
 /*
  * Utility function to load a physical buffer.  segp contains
  * the starting segment on entrace, and the ending segment on exit.
  */
 int
 _bus_dmamap_load_phys(bus_dma_tag_t dmat, bus_dmamap_t map,
     vm_paddr_t buf, bus_size_t buflen, int flags, bus_dma_segment_t *segs,
     int *segp)
 {
 	bus_addr_t curaddr;
 	bus_size_t sgsize;
 	int error;
 
 	if (segs == NULL)
 		segs = dmat->segments;
 
 	if ((dmat->flags & BUS_DMA_COULD_BOUNCE) != 0) {
 		_bus_dmamap_count_phys(dmat, map, buf, buflen, flags);
 		if (map->pagesneeded != 0) {
 			error = _bus_dmamap_reserve_pages(dmat, map, flags);
 			if (error)
 				return (error);
 		}
 	}
 
 	while (buflen > 0) {
 		curaddr = buf;
 		sgsize = MIN(buflen, dmat->maxsegsz);
 		if (((dmat->flags & BUS_DMA_COULD_BOUNCE) != 0) &&
 		    map->pagesneeded != 0 && run_filter(dmat, curaddr)) {
 			sgsize = MIN(sgsize, PAGE_SIZE);
 			curaddr = add_bounce_page(dmat, map, 0, curaddr,
 			    sgsize);
 		}
 		sgsize = _bus_dmamap_addseg(dmat, map, curaddr, sgsize, segs,
 		    segp);
 		if (sgsize == 0)
 			break;
 		buf += sgsize;
 		buflen -= sgsize;
 	}
 
 	/*
 	 * Did we fit?
 	 */
 	if (buflen != 0) {
 		bus_dmamap_unload(dmat, map);
 		return (EFBIG); /* XXX better return value here? */
 	}
 	return (0);
 }
 
 int
 _bus_dmamap_load_ma(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct vm_page **ma, bus_size_t tlen, int ma_offs, int flags,
     bus_dma_segment_t *segs, int *segp)
 {
 
 	return (bus_dmamap_load_ma_triv(dmat, map, ma, tlen, ma_offs, flags,
 	    segs, segp));
 }
 
 /*
  * Utility function to load a linear buffer.  segp contains
  * the starting segment on entrance, and the ending segment on exit.
  * first indicates if this is the first invocation of this function.
  */
 int
 _bus_dmamap_load_buffer(bus_dma_tag_t dmat, bus_dmamap_t map, void *buf,
     bus_size_t buflen, struct pmap *pmap, int flags, bus_dma_segment_t *segs,
     int *segp)
 {
 	bus_size_t sgsize;
 	bus_addr_t curaddr;
 	struct sync_list *sl;
 	vm_offset_t vaddr = (vm_offset_t)buf;
 	int error = 0;
 
 	if (segs == NULL)
 		segs = dmat->segments;
 	if ((flags & BUS_DMA_LOAD_MBUF) != 0)
 		map->flags |= DMAMAP_CACHE_ALIGNED;
 
 	if ((dmat->flags & BUS_DMA_COULD_BOUNCE) != 0) {
 		_bus_dmamap_count_pages(dmat, map, pmap, buf, buflen, flags);
 		if (map->pagesneeded != 0) {
 			error = _bus_dmamap_reserve_pages(dmat, map, flags);
 			if (error)
 				return (error);
 		}
 	}
 	CTR3(KTR_BUSDMA, "lowaddr= %d boundary= %d, "
 	    "alignment= %d", dmat->lowaddr, dmat->boundary, dmat->alignment);
 
 	while (buflen > 0) {
 		/*
 		 * Get the physical address for this segment.
 		 *
 		 * XXX Don't support checking for coherent mappings
 		 * XXX in user address space.
 		 */
 		KASSERT(kernel_pmap == pmap, ("pmap is not kernel pmap"));
 		curaddr = pmap_kextract(vaddr);
 
 		/*
 		 * Compute the segment size, and adjust counts.
 		 */
 		sgsize = PAGE_SIZE - ((u_long)curaddr & PAGE_MASK);
 		if (sgsize > dmat->maxsegsz)
 			sgsize = dmat->maxsegsz;
 		if (buflen < sgsize)
 			sgsize = buflen;
 
 		if (((dmat->flags & BUS_DMA_COULD_BOUNCE) != 0) &&
 		    map->pagesneeded != 0 && run_filter(dmat, curaddr)) {
 			curaddr = add_bounce_page(dmat, map, vaddr, curaddr,
 			    sgsize);
 		} else {
 			sl = &map->slist[map->sync_count - 1];
 			if (map->sync_count == 0 ||
 			    vaddr != sl->vaddr + sl->datacount) {
 				if (++map->sync_count > dmat->nsegments)
 					goto cleanup;
 				sl++;
 				sl->vaddr = vaddr;
 				sl->datacount = sgsize;
 				sl->busaddr = curaddr;
 			} else
 				sl->datacount += sgsize;
 		}
 		sgsize = _bus_dmamap_addseg(dmat, map, curaddr, sgsize, segs,
 		    segp);
 		if (sgsize == 0)
 			break;
 		vaddr += sgsize;
 		buflen -= sgsize;
 	}
 
 cleanup:
 	/*
 	 * Did we fit?
 	 */
 	if (buflen != 0) {
 		bus_dmamap_unload(dmat, map);
 		error = EFBIG; /* XXX better return value here? */
 	}
 	return (error);
 }
 
 void
 _bus_dmamap_waitok(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct memdesc *mem, bus_dmamap_callback_t *callback, void *callback_arg)
 {
 
 	KASSERT(dmat != NULL, ("dmatag is NULL"));
 	KASSERT(map != NULL, ("dmamap is NULL"));
 	map->mem = *mem;
 	map->callback = callback;
 	map->callback_arg = callback_arg;
 }
 
 bus_dma_segment_t *
 _bus_dmamap_complete(bus_dma_tag_t dmat, bus_dmamap_t map,
     bus_dma_segment_t *segs, int nsegs, int error)
 {
 
 	if (segs == NULL)
 		segs = dmat->segments;
 	return (segs);
 }
 
 /*
  * Release the mapping held by map.
  */
 void
 bus_dmamap_unload(bus_dma_tag_t dmat, bus_dmamap_t map)
 {
 	struct bounce_page *bpage;
 
 	while ((bpage = STAILQ_FIRST(&map->bpages)) != NULL) {
 		STAILQ_REMOVE_HEAD(&map->bpages, links);
 		free_bounce_page(dmat, bpage);
 	}
 	map->sync_count = 0;
 	return;
 }
 
 static void
 bus_dmamap_sync_buf(vm_offset_t buf, int len, bus_dmasync_op_t op, int aligned)
 {
 	char tmp_cl[mips_dcache_max_linesize], tmp_clend[mips_dcache_max_linesize];
 	vm_offset_t buf_cl, buf_clend;
 	vm_size_t size_cl, size_clend;
 	int cache_linesize_mask = mips_dcache_max_linesize - 1;
 
 	/*
 	 * dcache invalidation operates on cache line aligned addresses
 	 * and could modify areas of memory that share the same cache line
 	 * at the beginning and the ending of the buffer. In order to
 	 * prevent a data loss we save these chunks in temporary buffer
 	 * before invalidation and restore them afer it.
 	 *
 	 * If the aligned flag is set the buffer is either an mbuf or came from
 	 * our allocator caches.  In both cases they are always sized and
 	 * aligned to cacheline boundaries, so we can skip preserving nearby
 	 * data if a transfer appears to overlap cachelines.  An mbuf in
 	 * particular will usually appear to be overlapped because of offsetting
 	 * within the buffer to align the L3 headers, but we know that the bytes
 	 * preceeding that offset are part of the same mbuf memory and are not
 	 * unrelated adjacent data (and a rule of mbuf handling is that the cpu
 	 * is not allowed to touch the mbuf while dma is in progress, including
 	 * header fields).
 	 */
 	if (aligned) {
 		size_cl = 0;
 		size_clend = 0;
 	} else {
 		buf_cl = buf & ~cache_linesize_mask;
 		size_cl = buf & cache_linesize_mask;
 		buf_clend = buf + len;
 		size_clend = (mips_dcache_max_linesize -
 		    (buf_clend & cache_linesize_mask)) & cache_linesize_mask;
 	}
 
 	switch (op) {
 	case BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE:
 	case BUS_DMASYNC_POSTREAD:
 
 		/*
 		 * Save buffers that might be modified by invalidation
 		 */
 		if (size_cl)
 			memcpy (tmp_cl, (void*)buf_cl, size_cl);
 		if (size_clend)
 			memcpy (tmp_clend, (void*)buf_clend, size_clend);
 		mips_dcache_inv_range(buf, len);
 		/*
 		 * Restore them
 		 */
 		if (size_cl)
 			memcpy ((void*)buf_cl, tmp_cl, size_cl);
 		if (size_clend)
 			memcpy ((void*)buf_clend, tmp_clend, size_clend);
 		/*
 		 * Copies above have brought corresponding memory
 		 * cache lines back into dirty state. Write them back
 		 * out and invalidate affected cache lines again if
 		 * necessary.
 		 */
 		if (size_cl)
 			mips_dcache_wbinv_range(buf_cl, size_cl);
 		if (size_clend && (size_cl == 0 ||
                     buf_clend - buf_cl > mips_dcache_max_linesize))
 			mips_dcache_wbinv_range(buf_clend, size_clend);
 		break;
 
 	case BUS_DMASYNC_PREREAD|BUS_DMASYNC_PREWRITE:
 		mips_dcache_wbinv_range(buf, len);
 		break;
 
 	case BUS_DMASYNC_PREREAD:
 		/*
 		 * Save buffers that might be modified by invalidation
 		 */
 		if (size_cl)
 			memcpy (tmp_cl, (void *)buf_cl, size_cl);
 		if (size_clend)
 			memcpy (tmp_clend, (void *)buf_clend, size_clend);
 		mips_dcache_inv_range(buf, len);
 		/*
 		 * Restore them
 		 */
 		if (size_cl)
 			memcpy ((void *)buf_cl, tmp_cl, size_cl);
 		if (size_clend)
 			memcpy ((void *)buf_clend, tmp_clend, size_clend);
 		/*
 		 * Copies above have brought corresponding memory
 		 * cache lines back into dirty state. Write them back
 		 * out and invalidate affected cache lines again if
 		 * necessary.
 		 */
 		if (size_cl)
 			mips_dcache_wbinv_range(buf_cl, size_cl);
 		if (size_clend && (size_cl == 0 ||
                     buf_clend - buf_cl > mips_dcache_max_linesize))
 			mips_dcache_wbinv_range(buf_clend, size_clend);
 		break;
 
 	case BUS_DMASYNC_PREWRITE:
 #ifdef BUS_DMA_FORCE_WBINV
 		mips_dcache_wbinv_range(buf, len);
 #else
 		mips_dcache_wb_range(buf, len);
 #endif
 		break;
 	}
 }
 
 static void
 _bus_dmamap_sync_bp(bus_dma_tag_t dmat, bus_dmamap_t map, bus_dmasync_op_t op)
 {
 	struct bounce_page *bpage;
 
 	STAILQ_FOREACH(bpage, &map->bpages, links) {
 		if (op & BUS_DMASYNC_PREWRITE) {
 			if (bpage->datavaddr != 0)
 				bcopy((void *)bpage->datavaddr,
 				    (void *)(bpage->vaddr_nocache != 0 ?
 					     bpage->vaddr_nocache :
 					     bpage->vaddr),
 				    bpage->datacount);
 			else
 				physcopyout(bpage->dataaddr,
 				    (void *)(bpage->vaddr_nocache != 0 ?
 					     bpage->vaddr_nocache :
 					     bpage->vaddr),
 				    bpage->datacount);
 			if (bpage->vaddr_nocache == 0) {
 #ifdef BUS_DMA_FORCE_WBINV
 				mips_dcache_wbinv_range(bpage->vaddr,
 				    bpage->datacount);
 #else
 				mips_dcache_wb_range(bpage->vaddr,
 				    bpage->datacount);
 #endif
 			}
 			dmat->bounce_zone->total_bounced++;
 		}
 		if (op & BUS_DMASYNC_POSTREAD) {
 			if (bpage->vaddr_nocache == 0) {
 				mips_dcache_inv_range(bpage->vaddr,
 				    bpage->datacount);
 			}
 			if (bpage->datavaddr != 0)
 				bcopy((void *)(bpage->vaddr_nocache != 0 ?
 				    bpage->vaddr_nocache : bpage->vaddr),
 				    (void *)bpage->datavaddr, bpage->datacount);
 			else
 				physcopyin((void *)(bpage->vaddr_nocache != 0 ?
 				    bpage->vaddr_nocache : bpage->vaddr),
 				    bpage->dataaddr, bpage->datacount);
 			dmat->bounce_zone->total_bounced++;
 		}
 	}
 }
 
 void
 bus_dmamap_sync(bus_dma_tag_t dmat, bus_dmamap_t map, bus_dmasync_op_t op)
 {
 	struct sync_list *sl, *end;
 	int aligned;
 
 	if (op == BUS_DMASYNC_POSTWRITE)
 		return;
 	if (STAILQ_FIRST(&map->bpages))
 		_bus_dmamap_sync_bp(dmat, map, op);
 
 	if ((dmat->flags & BUS_DMA_COHERENT) ||
 	    (map->flags & DMAMAP_UNCACHEABLE)) {
 		if (op & BUS_DMASYNC_PREWRITE)
 			mips_sync();
 		return;
 	}
 
 	aligned = (map->flags & DMAMAP_CACHE_ALIGNED) ? 1 : 0;
 
 	CTR3(KTR_BUSDMA, "%s: op %x flags %x", __func__, op, map->flags);
 	if (map->sync_count) {
 		end = &map->slist[map->sync_count];
 		for (sl = &map->slist[0]; sl != end; sl++)
 			bus_dmamap_sync_buf(sl->vaddr, sl->datacount, op,
 			    aligned);
 	}
 }
 
 static void
 init_bounce_pages(void *dummy __unused)
 {
 
 	total_bpages = 0;
 	STAILQ_INIT(&bounce_zone_list);
 	STAILQ_INIT(&bounce_map_waitinglist);
 	STAILQ_INIT(&bounce_map_callbacklist);
 	mtx_init(&bounce_lock, "bounce pages lock", NULL, MTX_DEF);
 }
 SYSINIT(bpages, SI_SUB_LOCK, SI_ORDER_ANY, init_bounce_pages, NULL);
 
 static struct sysctl_ctx_list *
 busdma_sysctl_tree(struct bounce_zone *bz)
 {
 	return (&bz->sysctl_tree);
 }
 
 static struct sysctl_oid *
 busdma_sysctl_tree_top(struct bounce_zone *bz)
 {
 	return (bz->sysctl_tree_top);
 }
 
 static int
 alloc_bounce_zone(bus_dma_tag_t dmat)
 {
 	struct bounce_zone *bz;
 
 	/* Check to see if we already have a suitable zone */
 	STAILQ_FOREACH(bz, &bounce_zone_list, links) {
 		if ((dmat->alignment <= bz->alignment)
 		 && (dmat->lowaddr >= bz->lowaddr)) {
 			dmat->bounce_zone = bz;
 			return (0);
 		}
 	}
 
 	if ((bz = (struct bounce_zone *)malloc(sizeof(*bz), M_BUSDMA,
 	    M_NOWAIT | M_ZERO)) == NULL)
 		return (ENOMEM);
 
 	STAILQ_INIT(&bz->bounce_page_list);
 	bz->free_bpages = 0;
 	bz->reserved_bpages = 0;
 	bz->active_bpages = 0;
 	bz->lowaddr = dmat->lowaddr;
 	bz->alignment = MAX(dmat->alignment, PAGE_SIZE);
 	bz->map_count = 0;
 	snprintf(bz->zoneid, 8, "zone%d", busdma_zonecount);
 	busdma_zonecount++;
 	snprintf(bz->lowaddrid, 18, "%#jx", (uintmax_t)bz->lowaddr);
 	STAILQ_INSERT_TAIL(&bounce_zone_list, bz, links);
 	dmat->bounce_zone = bz;
 
 	sysctl_ctx_init(&bz->sysctl_tree);
 	bz->sysctl_tree_top = SYSCTL_ADD_NODE(&bz->sysctl_tree,
 	    SYSCTL_STATIC_CHILDREN(_hw_busdma), OID_AUTO, bz->zoneid,
 	    CTLFLAG_RD | CTLFLAG_MPSAFE, 0, "");
 	if (bz->sysctl_tree_top == NULL) {
 		sysctl_ctx_free(&bz->sysctl_tree);
 		return (0);	/* XXX error code? */
 	}
 
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_bpages", CTLFLAG_RD, &bz->total_bpages, 0,
 	    "Total bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "free_bpages", CTLFLAG_RD, &bz->free_bpages, 0,
 	    "Free bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "reserved_bpages", CTLFLAG_RD, &bz->reserved_bpages, 0,
 	    "Reserved bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "active_bpages", CTLFLAG_RD, &bz->active_bpages, 0,
 	    "Active bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_bounced", CTLFLAG_RD, &bz->total_bounced, 0,
 	    "Total bounce requests");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_deferred", CTLFLAG_RD, &bz->total_deferred, 0,
 	    "Total bounce requests that were deferred");
 	SYSCTL_ADD_STRING(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "lowaddr", CTLFLAG_RD, bz->lowaddrid, 0, "");
 	SYSCTL_ADD_UAUTO(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "alignment", CTLFLAG_RD, &bz->alignment, "");
 
 	return (0);
 }
 
 static int
 alloc_bounce_pages(bus_dma_tag_t dmat, u_int numpages)
 {
 	struct bounce_zone *bz;
 	int count;
 
 	bz = dmat->bounce_zone;
 	count = 0;
 	while (numpages > 0) {
 		struct bounce_page *bpage;
 
 		bpage = (struct bounce_page *)malloc(sizeof(*bpage), M_BUSDMA,
 						     M_NOWAIT | M_ZERO);
 
 		if (bpage == NULL)
 			break;
 		bpage->vaddr = (vm_offset_t)contigmalloc(PAGE_SIZE, M_BOUNCE,
 							 M_NOWAIT, 0ul,
 							 bz->lowaddr,
 							 PAGE_SIZE,
 							 0);
 		if (bpage->vaddr == 0) {
 			free(bpage, M_BUSDMA);
 			break;
 		}
 		bpage->busaddr = pmap_kextract(bpage->vaddr);
 		bpage->vaddr_nocache =
 		    (vm_offset_t)pmap_mapdev(bpage->busaddr, PAGE_SIZE);
 		mtx_lock(&bounce_lock);
 		STAILQ_INSERT_TAIL(&bz->bounce_page_list, bpage, links);
 		total_bpages++;
 		bz->total_bpages++;
 		bz->free_bpages++;
 		mtx_unlock(&bounce_lock);
 		count++;
 		numpages--;
 	}
 	return (count);
 }
 
 static int
 reserve_bounce_pages(bus_dma_tag_t dmat, bus_dmamap_t map, int commit)
 {
 	struct bounce_zone *bz;
 	int pages;
 
 	mtx_assert(&bounce_lock, MA_OWNED);
 	bz = dmat->bounce_zone;
 	pages = MIN(bz->free_bpages, map->pagesneeded - map->pagesreserved);
 	if (commit == 0 && map->pagesneeded > (map->pagesreserved + pages))
 		return (map->pagesneeded - (map->pagesreserved + pages));
 	bz->free_bpages -= pages;
 	bz->reserved_bpages += pages;
 	map->pagesreserved += pages;
 	pages = map->pagesneeded - map->pagesreserved;
 
 	return (pages);
 }
 
 static bus_addr_t
 add_bounce_page(bus_dma_tag_t dmat, bus_dmamap_t map, vm_offset_t vaddr,
 		bus_addr_t addr, bus_size_t size)
 {
 	struct bounce_zone *bz;
 	struct bounce_page *bpage;
 
 	KASSERT(dmat->bounce_zone != NULL, ("no bounce zone in dma tag"));
 	KASSERT(map != NULL, ("add_bounce_page: bad map %p", map));
 
 	bz = dmat->bounce_zone;
 	if (map->pagesneeded == 0)
 		panic("add_bounce_page: map doesn't need any pages");
 	map->pagesneeded--;
 
 	if (map->pagesreserved == 0)
 		panic("add_bounce_page: map doesn't need any pages");
 	map->pagesreserved--;
 
 	mtx_lock(&bounce_lock);
 	bpage = STAILQ_FIRST(&bz->bounce_page_list);
 	if (bpage == NULL)
 		panic("add_bounce_page: free page list is empty");
 
 	STAILQ_REMOVE_HEAD(&bz->bounce_page_list, links);
 	bz->reserved_bpages--;
 	bz->active_bpages++;
 	mtx_unlock(&bounce_lock);
 
 	if (dmat->flags & BUS_DMA_KEEP_PG_OFFSET) {
 		/* Page offset needs to be preserved. */
 		bpage->vaddr |= addr & PAGE_MASK;
 		bpage->busaddr |= addr & PAGE_MASK;
 	}
 	bpage->datavaddr = vaddr;
 	bpage->dataaddr = addr;
 	bpage->datacount = size;
 	STAILQ_INSERT_TAIL(&(map->bpages), bpage, links);
 	return (bpage->busaddr);
 }
 
 static void
 free_bounce_page(bus_dma_tag_t dmat, struct bounce_page *bpage)
 {
 	struct bus_dmamap *map;
 	struct bounce_zone *bz;
 
 	bz = dmat->bounce_zone;
 	bpage->datavaddr = 0;
 	bpage->datacount = 0;
 	if (dmat->flags & BUS_DMA_KEEP_PG_OFFSET) {
 		/*
 		 * Reset the bounce page to start at offset 0.  Other uses
 		 * of this bounce page may need to store a full page of
 		 * data and/or assume it starts on a page boundary.
 		 */
 		bpage->vaddr &= ~PAGE_MASK;
 		bpage->busaddr &= ~PAGE_MASK;
 	}
 
 	mtx_lock(&bounce_lock);
 	STAILQ_INSERT_HEAD(&bz->bounce_page_list, bpage, links);
 	bz->free_bpages++;
 	bz->active_bpages--;
 	if ((map = STAILQ_FIRST(&bounce_map_waitinglist)) != NULL) {
 		if (reserve_bounce_pages(map->dmat, map, 1) == 0) {
 			STAILQ_REMOVE_HEAD(&bounce_map_waitinglist, links);
 			STAILQ_INSERT_TAIL(&bounce_map_callbacklist,
 					   map, links);
 			busdma_swi_pending = 1;
 			bz->total_deferred++;
 			swi_sched(vm_ih, 0);
 		}
 	}
 	mtx_unlock(&bounce_lock);
 }
 
 void
 busdma_swi(void)
 {
 	bus_dma_tag_t dmat;
 	struct bus_dmamap *map;
 
 	mtx_lock(&bounce_lock);
 	while ((map = STAILQ_FIRST(&bounce_map_callbacklist)) != NULL) {
 		STAILQ_REMOVE_HEAD(&bounce_map_callbacklist, links);
 		mtx_unlock(&bounce_lock);
 		dmat = map->dmat;
 		(dmat->lockfunc)(dmat->lockfuncarg, BUS_DMA_LOCK);
 		bus_dmamap_load_mem(map->dmat, map, &map->mem, map->callback,
 		    map->callback_arg, BUS_DMA_WAITOK);
 		(dmat->lockfunc)(dmat->lockfuncarg, BUS_DMA_UNLOCK);
 		mtx_lock(&bounce_lock);
 	}
 	mtx_unlock(&bounce_lock);
 }
Index: head/sys/powerpc/powerpc/busdma_machdep.c
===================================================================
--- head/sys/powerpc/powerpc/busdma_machdep.c	(revision 365705)
+++ head/sys/powerpc/powerpc/busdma_machdep.c	(revision 365706)
@@ -1,1273 +1,1242 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 1997, 1998 Justin T. Gibbs.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions, and the following disclaimer,
  *    without modification, immediately at the beginning of the file.
  * 2. The name of the author may not be used to endorse or promote products
  *    derived from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 /*
  * From amd64/busdma_machdep.c, r204214
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/malloc.h>
 #include <sys/bus.h>
 #include <sys/interrupt.h>
 #include <sys/kernel.h>
 #include <sys/ktr.h>
 #include <sys/lock.h>
 #include <sys/proc.h>
 #include <sys/memdesc.h>
 #include <sys/mutex.h>
 #include <sys/sysctl.h>
 #include <sys/uio.h>
 
 #include <vm/vm.h>
 #include <vm/vm_extern.h>
 #include <vm/vm_kern.h>
 #include <vm/vm_page.h>
 #include <vm/vm_map.h>
 
 #include <machine/atomic.h>
 #include <machine/bus.h>
 #include <machine/cpufunc.h>
 #include <machine/md_var.h>
 
 #include "iommu_if.h"
 
 #define MAX_BPAGES MIN(8192, physmem/40)
 
 struct bounce_zone;
 
 struct bus_dma_tag {
 	bus_dma_tag_t	  parent;
 	bus_size_t	  alignment;
 	bus_addr_t	  boundary;
 	bus_addr_t	  lowaddr;
 	bus_addr_t	  highaddr;
 	bus_dma_filter_t *filter;
 	void		 *filterarg;
 	bus_size_t	  maxsize;
 	bus_size_t	  maxsegsz;
 	u_int		  nsegments;
 	int		  flags;
 	int		  ref_count;
 	int		  map_count;
 	bus_dma_lock_t	 *lockfunc;
 	void		 *lockfuncarg;
 	struct bounce_zone *bounce_zone;
 	device_t	  iommu;
 	void		 *iommu_cookie;
 };
 
 struct bounce_page {
 	vm_offset_t	vaddr;		/* kva of bounce buffer */
 	bus_addr_t	busaddr;	/* Physical address */
 	vm_offset_t	datavaddr;	/* kva of client data */
 	vm_page_t	datapage;	/* physical page of client data */
 	vm_offset_t	dataoffs;	/* page offset of client data */
 	bus_size_t	datacount;	/* client data count */
 	STAILQ_ENTRY(bounce_page) links;
 };
 
 int busdma_swi_pending;
 
 struct bounce_zone {
 	STAILQ_ENTRY(bounce_zone) links;
 	STAILQ_HEAD(bp_list, bounce_page) bounce_page_list;
 	int		total_bpages;
 	int		free_bpages;
 	int		reserved_bpages;
 	int		active_bpages;
 	int		total_bounced;
 	int		total_deferred;
 	int		map_count;
 	bus_size_t	alignment;
 	bus_addr_t	lowaddr;
 	char		zoneid[8];
 	char		lowaddrid[20];
 	struct sysctl_ctx_list sysctl_tree;
 	struct sysctl_oid *sysctl_tree_top;
 };
 
 static struct mtx bounce_lock;
 static int total_bpages;
 static int busdma_zonecount;
 static STAILQ_HEAD(, bounce_zone) bounce_zone_list;
 
 static SYSCTL_NODE(_hw, OID_AUTO, busdma, CTLFLAG_RD | CTLFLAG_MPSAFE, 0,
     "Busdma parameters");
 SYSCTL_INT(_hw_busdma, OID_AUTO, total_bpages, CTLFLAG_RD, &total_bpages, 0,
 	   "Total bounce pages");
 
 struct bus_dmamap {
 	struct bp_list	       bpages;
 	int		       pagesneeded;
 	int		       pagesreserved;
 	bus_dma_tag_t	       dmat;
 	struct memdesc	       mem;
 	bus_dma_segment_t     *segments;
 	int		       nsegs;
 	bus_dmamap_callback_t *callback;
 	void		      *callback_arg;
 	STAILQ_ENTRY(bus_dmamap) links;
 	int		       contigalloc;
 };
 
 static STAILQ_HEAD(, bus_dmamap) bounce_map_waitinglist;
 static STAILQ_HEAD(, bus_dmamap) bounce_map_callbacklist;
 
 static void init_bounce_pages(void *dummy);
 static int alloc_bounce_zone(bus_dma_tag_t dmat);
 static int alloc_bounce_pages(bus_dma_tag_t dmat, u_int numpages);
 static int reserve_bounce_pages(bus_dma_tag_t dmat, bus_dmamap_t map,
 				int commit);
 static bus_addr_t add_bounce_page(bus_dma_tag_t dmat, bus_dmamap_t map,
 				  vm_offset_t vaddr, bus_addr_t addr,
 				  bus_size_t size);
 static void free_bounce_page(bus_dma_tag_t dmat, struct bounce_page *bpage);
 static __inline int run_filter(bus_dma_tag_t dmat, bus_addr_t paddr);
 
 /*
  * Return true if a match is made.
  *
  * To find a match walk the chain of bus_dma_tag_t's looking for 'paddr'.
  *
  * If paddr is within the bounds of the dma tag then call the filter callback
  * to check for a match, if there is no filter callback then assume a match.
  */
 static __inline int
 run_filter(bus_dma_tag_t dmat, bus_addr_t paddr)
 {
 	int retval;
 
 	retval = 0;
 
 	do {
 		if (dmat->filter == NULL && dmat->iommu == NULL &&
 		    paddr > dmat->lowaddr && paddr <= dmat->highaddr)
 			retval = 1;
 		if (dmat->filter == NULL &&
 		    (paddr & (dmat->alignment - 1)) != 0)
 			retval = 1;
 		if (dmat->filter != NULL &&
 		    (*dmat->filter)(dmat->filterarg, paddr) != 0)
 			retval = 1;
 
 		dmat = dmat->parent;		
 	} while (retval == 0 && dmat != NULL);
 	return (retval);
 }
 
 /*
  * Convenience function for manipulating driver locks from busdma (during
  * busdma_swi, for example).  Drivers that don't provide their own locks
  * should specify &Giant to dmat->lockfuncarg.  Drivers that use their own
  * non-mutex locking scheme don't have to use this at all.
  */
 void
 busdma_lock_mutex(void *arg, bus_dma_lock_op_t op)
 {
 	struct mtx *dmtx;
 
 	dmtx = (struct mtx *)arg;
 	switch (op) {
 	case BUS_DMA_LOCK:
 		mtx_lock(dmtx);
 		break;
 	case BUS_DMA_UNLOCK:
 		mtx_unlock(dmtx);
 		break;
 	default:
 		panic("Unknown operation 0x%x for busdma_lock_mutex!", op);
 	}
 }
 
 /*
  * dflt_lock should never get called.  It gets put into the dma tag when
  * lockfunc == NULL, which is only valid if the maps that are associated
  * with the tag are meant to never be defered.
  * XXX Should have a way to identify which driver is responsible here.
  */
 static void
 dflt_lock(void *arg, bus_dma_lock_op_t op)
 {
 	panic("driver error: busdma dflt_lock called");
 }
 
 #define BUS_DMA_COULD_BOUNCE	BUS_DMA_BUS3
 #define BUS_DMA_MIN_ALLOC_COMP	BUS_DMA_BUS4
 /*
  * Allocate a device specific dma_tag.
  */
 int
 bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
 		   bus_addr_t boundary, bus_addr_t lowaddr,
 		   bus_addr_t highaddr, bus_dma_filter_t *filter,
 		   void *filterarg, bus_size_t maxsize, int nsegments,
 		   bus_size_t maxsegsz, int flags, bus_dma_lock_t *lockfunc,
 		   void *lockfuncarg, bus_dma_tag_t *dmat)
 {
 	bus_dma_tag_t newtag;
 	int error = 0;
 
 	/* Basic sanity checking */
 	if (boundary != 0 && boundary < maxsegsz)
 		maxsegsz = boundary;
 
 	if (maxsegsz == 0) {
 		return (EINVAL);
 	}
 
 	/* Return a NULL tag on failure */
 	*dmat = NULL;
 
 	newtag = (bus_dma_tag_t)malloc(sizeof(*newtag), M_DEVBUF,
 	    M_ZERO | M_NOWAIT);
 	if (newtag == NULL) {
 		CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 		    __func__, newtag, 0, error);
 		return (ENOMEM);
 	}
 
 	newtag->parent = parent;
 	newtag->alignment = alignment;
 	newtag->boundary = boundary;
 	newtag->lowaddr = trunc_page((vm_paddr_t)lowaddr) + (PAGE_SIZE - 1);
 	newtag->highaddr = trunc_page((vm_paddr_t)highaddr) + (PAGE_SIZE - 1);
 	newtag->filter = filter;
 	newtag->filterarg = filterarg;
 	newtag->maxsize = maxsize;
 	newtag->nsegments = nsegments;
 	newtag->maxsegsz = maxsegsz;
 	newtag->flags = flags;
 	newtag->ref_count = 1; /* Count ourself */
 	newtag->map_count = 0;
 	if (lockfunc != NULL) {
 		newtag->lockfunc = lockfunc;
 		newtag->lockfuncarg = lockfuncarg;
 	} else {
 		newtag->lockfunc = dflt_lock;
 		newtag->lockfuncarg = NULL;
 	}
 
 	/* Take into account any restrictions imposed by our parent tag */
 	if (parent != NULL) {
 		newtag->lowaddr = MIN(parent->lowaddr, newtag->lowaddr);
 		newtag->highaddr = MAX(parent->highaddr, newtag->highaddr);
 		if (newtag->boundary == 0)
 			newtag->boundary = parent->boundary;
 		else if (parent->boundary != 0)
 			newtag->boundary = MIN(parent->boundary,
 					       newtag->boundary);
 		if (newtag->filter == NULL) {
 			/*
 			 * Short circuit looking at our parent directly
 			 * since we have encapsulated all of its information
 			 */
 			newtag->filter = parent->filter;
 			newtag->filterarg = parent->filterarg;
 			newtag->parent = parent->parent;
 		}
 		if (newtag->parent != NULL)
 			atomic_add_int(&parent->ref_count, 1);
 		newtag->iommu = parent->iommu;
 		newtag->iommu_cookie = parent->iommu_cookie;
 	}
 
 	if (newtag->lowaddr < ptoa((vm_paddr_t)Maxmem) && newtag->iommu == NULL)
 		newtag->flags |= BUS_DMA_COULD_BOUNCE;
 
 	if (newtag->alignment > 1)
 		newtag->flags |= BUS_DMA_COULD_BOUNCE;
 
 	if (((newtag->flags & BUS_DMA_COULD_BOUNCE) != 0) &&
 	    (flags & BUS_DMA_ALLOCNOW) != 0) {
 		struct bounce_zone *bz;
 
 		/* Must bounce */
 
 		if ((error = alloc_bounce_zone(newtag)) != 0) {
 			free(newtag, M_DEVBUF);
 			return (error);
 		}
 		bz = newtag->bounce_zone;
 
 		if (ptoa(bz->total_bpages) < maxsize) {
 			int pages;
 
 			pages = atop(maxsize) - bz->total_bpages;
 
 			/* Add pages to our bounce pool */
 			if (alloc_bounce_pages(newtag, pages) < pages)
 				error = ENOMEM;
 		}
 		/* Performed initial allocation */
 		newtag->flags |= BUS_DMA_MIN_ALLOC_COMP;
 	}
 
 	if (error != 0) {
 		free(newtag, M_DEVBUF);
 	} else {
 		*dmat = newtag;
 	}
 	CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 	    __func__, newtag, (newtag != NULL ? newtag->flags : 0), error);
 	return (error);
 }
 
 void
-bus_dma_template_init(bus_dma_tag_template_t *t, bus_dma_tag_t parent)
-{
-
-	if (t == NULL)
-		return;
-
-	t->parent = parent;
-	t->alignment = 1;
-	t->boundary = 0;
-	t->lowaddr = t->highaddr = BUS_SPACE_MAXADDR;
-	t->maxsize = t->maxsegsize = BUS_SPACE_MAXSIZE;
-	t->nsegments = BUS_SPACE_UNRESTRICTED;
-	t->lockfunc = NULL;
-	t->lockfuncarg = NULL;
-	t->flags = 0;
-}
-
-int
-bus_dma_template_tag(bus_dma_tag_template_t *t, bus_dma_tag_t *dmat)
-{
-
-	if (t == NULL || dmat == NULL)
-		return (EINVAL);
-
-	return (bus_dma_tag_create(t->parent, t->alignment, t->boundary,
-	    t->lowaddr, t->highaddr, NULL, NULL, t->maxsize,
-	    t->nsegments, t->maxsegsize, t->flags, t->lockfunc, t->lockfuncarg,
-	    dmat));
-}
-
-void
-bus_dma_template_clone(bus_dma_tag_template_t *t, bus_dma_tag_t dmat)
+bus_dma_template_clone(bus_dma_template_t *t, bus_dma_tag_t dmat)
 {
 
 	if (t == NULL || dmat == NULL)
 		return;
 
 	t->parent = dmat->parent;
 	t->alignment = dmat->alignment;
 	t->boundary = dmat->boundary;
 	t->lowaddr = dmat->lowaddr;
 	t->highaddr = dmat->highaddr;
 	t->maxsize = dmat->maxsize;
 	t->nsegments = dmat->nsegments;
 	t->maxsegsize = dmat->maxsegsz;
 	t->flags = dmat->flags;
 	t->lockfunc = dmat->lockfunc;
 	t->lockfuncarg = dmat->lockfuncarg;
 }
 
 int
 bus_dma_tag_set_domain(bus_dma_tag_t dmat, int domain)
 {
 
 	return (0);
 }
 
 int
 bus_dma_tag_destroy(bus_dma_tag_t dmat)
 {
 	bus_dma_tag_t dmat_copy __unused;
 	int error;
 
 	error = 0;
 	dmat_copy = dmat;
 
 	if (dmat != NULL) {
 		if (dmat->map_count != 0) {
 			error = EBUSY;
 			goto out;
 		}
 
 		while (dmat != NULL) {
 			bus_dma_tag_t parent;
 
 			parent = dmat->parent;
 			atomic_subtract_int(&dmat->ref_count, 1);
 			if (dmat->ref_count == 0) {
 				free(dmat, M_DEVBUF);
 				/*
 				 * Last reference count, so
 				 * release our reference
 				 * count on our parent.
 				 */
 				dmat = parent;
 			} else
 				dmat = NULL;
 		}
 	}
 out:
 	CTR3(KTR_BUSDMA, "%s tag %p error %d", __func__, dmat_copy, error);
 	return (error);
 }
 
 /*
  * Allocate a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 int
 bus_dmamap_create(bus_dma_tag_t dmat, int flags, bus_dmamap_t *mapp)
 {
 	int error;
 
 	error = 0;
 
 	*mapp = (bus_dmamap_t)malloc(sizeof(**mapp), M_DEVBUF,
 				     M_NOWAIT | M_ZERO);
 	if (*mapp == NULL) {
 		CTR3(KTR_BUSDMA, "%s: tag %p error %d",
 		    __func__, dmat, ENOMEM);
 		return (ENOMEM);
 	}
 
 	/*
 	 * Bouncing might be required if the driver asks for an active
 	 * exclusion region, a data alignment that is stricter than 1, and/or
 	 * an active address boundary.
 	 */
 	if (dmat->flags & BUS_DMA_COULD_BOUNCE) {
 		/* Must bounce */
 		struct bounce_zone *bz;
 		int maxpages;
 
 		if (dmat->bounce_zone == NULL) {
 			if ((error = alloc_bounce_zone(dmat)) != 0)
 				return (error);
 		}
 		bz = dmat->bounce_zone;
 
 		/* Initialize the new map */
 		STAILQ_INIT(&((*mapp)->bpages));
 
 		/*
 		 * Attempt to add pages to our pool on a per-instance
 		 * basis up to a sane limit.
 		 */
 		if (dmat->alignment > 1)
 			maxpages = MAX_BPAGES;
 		else
 			maxpages = MIN(MAX_BPAGES, Maxmem -atop(dmat->lowaddr));
 		if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0
 		 || (bz->map_count > 0 && bz->total_bpages < maxpages)) {
 			int pages;
 
 			pages = MAX(atop(dmat->maxsize), 1);
 			pages = MIN(maxpages - bz->total_bpages, pages);
 			pages = MAX(pages, 1);
 			if (alloc_bounce_pages(dmat, pages) < pages)
 				error = ENOMEM;
 
 			if ((dmat->flags & BUS_DMA_MIN_ALLOC_COMP) == 0) {
 				if (error == 0)
 					dmat->flags |= BUS_DMA_MIN_ALLOC_COMP;
 			} else {
 				error = 0;
 			}
 		}
 		bz->map_count++;
 	}
 
 	(*mapp)->nsegs = 0;
 	(*mapp)->segments = (bus_dma_segment_t *)malloc(
 	    sizeof(bus_dma_segment_t) * dmat->nsegments, M_DEVBUF,
 	    M_NOWAIT);
 	if ((*mapp)->segments == NULL) {
 		CTR3(KTR_BUSDMA, "%s: tag %p error %d",
 		    __func__, dmat, ENOMEM);
 		return (ENOMEM);
 	}
 
 	if (error == 0)
 		dmat->map_count++;
 	CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 	    __func__, dmat, dmat->flags, error);
 	return (error);
 }
 
 /*
  * Destroy a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 int
 bus_dmamap_destroy(bus_dma_tag_t dmat, bus_dmamap_t map)
 {
 	if (dmat->flags & BUS_DMA_COULD_BOUNCE) {
 		if (STAILQ_FIRST(&map->bpages) != NULL) {
 			CTR3(KTR_BUSDMA, "%s: tag %p error %d",
 			    __func__, dmat, EBUSY);
 			return (EBUSY);
 		}
 		if (dmat->bounce_zone)
 			dmat->bounce_zone->map_count--;
 	}
 	free(map->segments, M_DEVBUF);
 	free(map, M_DEVBUF);
 	dmat->map_count--;
 	CTR2(KTR_BUSDMA, "%s: tag %p error 0", __func__, dmat);
 	return (0);
 }
 
 /*
  * Allocate a piece of memory that can be efficiently mapped into
  * bus device space based on the constraints lited in the dma tag.
  * A dmamap to for use with dmamap_load is also allocated.
  */
 int
 bus_dmamem_alloc(bus_dma_tag_t dmat, void** vaddr, int flags,
 		 bus_dmamap_t *mapp)
 {
 	vm_memattr_t attr;
 	int mflags;
 
 	if (flags & BUS_DMA_NOWAIT)
 		mflags = M_NOWAIT;
 	else
 		mflags = M_WAITOK;
 
 	bus_dmamap_create(dmat, flags, mapp);
 
 	if (flags & BUS_DMA_ZERO)
 		mflags |= M_ZERO;
 	if (flags & BUS_DMA_NOCACHE)
 		attr = VM_MEMATTR_UNCACHEABLE;
 	else
 		attr = VM_MEMATTR_DEFAULT;
 
 	/* 
 	 * XXX:
 	 * (dmat->alignment <= dmat->maxsize) is just a quick hack; the exact
 	 * alignment guarantees of malloc need to be nailed down, and the
 	 * code below should be rewritten to take that into account.
 	 *
 	 * In the meantime, we'll warn the user if malloc gets it wrong.
 	 */
 	if ((dmat->maxsize <= PAGE_SIZE) &&
 	   (dmat->alignment <= dmat->maxsize) &&
 	    dmat->lowaddr >= ptoa((vm_paddr_t)Maxmem) &&
 	    attr == VM_MEMATTR_DEFAULT) {
 		*vaddr = malloc(dmat->maxsize, M_DEVBUF, mflags);
 	} else {
 		/*
 		 * XXX Use Contigmalloc until it is merged into this facility
 		 *     and handles multi-seg allocations.  Nobody is doing
 		 *     multi-seg allocations yet though.
 		 * XXX Certain AGP hardware does.
 		 */
 		*vaddr = (void *)kmem_alloc_contig(dmat->maxsize, mflags, 0ul,
 		    dmat->lowaddr, dmat->alignment ? dmat->alignment : 1ul,
 		    dmat->boundary, attr);
 		(*mapp)->contigalloc = 1;
 	}
 	if (*vaddr == NULL) {
 		CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 		    __func__, dmat, dmat->flags, ENOMEM);
 		return (ENOMEM);
 	} else if (vtophys(*vaddr) & (dmat->alignment - 1)) {
 		printf("bus_dmamem_alloc failed to align memory properly.\n");
 	}
 	CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x error %d",
 	    __func__, dmat, dmat->flags, 0);
 	return (0);
 }
 
 /*
  * Free a piece of memory and it's allociated dmamap, that was allocated
  * via bus_dmamem_alloc.  Make the same choice for free/contigfree.
  */
 void
 bus_dmamem_free(bus_dma_tag_t dmat, void *vaddr, bus_dmamap_t map)
 {
 
 	if (!map->contigalloc)
 		free(vaddr, M_DEVBUF);
 	else
 		kmem_free((vm_offset_t)vaddr, dmat->maxsize);
 	bus_dmamap_destroy(dmat, map);
 	CTR3(KTR_BUSDMA, "%s: tag %p flags 0x%x", __func__, dmat, dmat->flags);
 }
 
 static void
 _bus_dmamap_count_phys(bus_dma_tag_t dmat, bus_dmamap_t map, vm_paddr_t buf,
     bus_size_t buflen, int flags)
 {
 	bus_addr_t curaddr;
 	bus_size_t sgsize;
 
 	if (map->pagesneeded == 0) {
 		CTR4(KTR_BUSDMA, "lowaddr= %d Maxmem= %d, boundary= %d, "
 		    "alignment= %d", dmat->lowaddr, ptoa((vm_paddr_t)Maxmem),
 		    dmat->boundary, dmat->alignment);
 		CTR2(KTR_BUSDMA, "map= %p, pagesneeded= %d", map, map->pagesneeded);
 		/*
 		 * Count the number of bounce pages
 		 * needed in order to complete this transfer
 		 */
 		curaddr = buf;
 		while (buflen != 0) {
 			sgsize = MIN(buflen, dmat->maxsegsz);
 			if (run_filter(dmat, curaddr) != 0) {
 				sgsize = MIN(sgsize,
 				    PAGE_SIZE - (curaddr & PAGE_MASK));
 				map->pagesneeded++;
 			}
 			curaddr += sgsize;
 			buflen -= sgsize;
 		}
 		CTR1(KTR_BUSDMA, "pagesneeded= %d\n", map->pagesneeded);
 	}
 }
 
 static void
 _bus_dmamap_count_pages(bus_dma_tag_t dmat, bus_dmamap_t map, pmap_t pmap,
     void *buf, bus_size_t buflen, int flags)
 {
         vm_offset_t vaddr;
         vm_offset_t vendaddr;
         bus_addr_t paddr;
 
 	if (map->pagesneeded == 0) {
 		CTR4(KTR_BUSDMA, "lowaddr= %d Maxmem= %d, boundary= %d, "
 		    "alignment= %d", dmat->lowaddr, ptoa((vm_paddr_t)Maxmem),
 		    dmat->boundary, dmat->alignment);
 		CTR2(KTR_BUSDMA, "map= %p, pagesneeded= %d", map, map->pagesneeded);
 		/*
 		 * Count the number of bounce pages
 		 * needed in order to complete this transfer
 		 */
 		vaddr = (vm_offset_t)buf;
 		vendaddr = (vm_offset_t)buf + buflen;
 
 		while (vaddr < vendaddr) {
 			bus_size_t sg_len;
 
 			sg_len = PAGE_SIZE - ((vm_offset_t)vaddr & PAGE_MASK);
 			if (pmap == kernel_pmap)
 				paddr = pmap_kextract(vaddr);
 			else
 				paddr = pmap_extract(pmap, vaddr);
 			if (run_filter(dmat, paddr) != 0) {
 				sg_len = roundup2(sg_len, dmat->alignment);
 				map->pagesneeded++;
 			}
 			vaddr += sg_len;
 		}
 		CTR1(KTR_BUSDMA, "pagesneeded= %d\n", map->pagesneeded);
 	}
 }
 
 static int
 _bus_dmamap_reserve_pages(bus_dma_tag_t dmat, bus_dmamap_t map, int flags)
 {
 
 	/* Reserve Necessary Bounce Pages */
 	mtx_lock(&bounce_lock);
 	if (flags & BUS_DMA_NOWAIT) {
 		if (reserve_bounce_pages(dmat, map, 0) != 0) {
 			mtx_unlock(&bounce_lock);
 			return (ENOMEM);
 		}
 	} else {
 		if (reserve_bounce_pages(dmat, map, 1) != 0) {
 			/* Queue us for resources */
 			STAILQ_INSERT_TAIL(&bounce_map_waitinglist,
 			    map, links);
 			mtx_unlock(&bounce_lock);
 			return (EINPROGRESS);
 		}
 	}
 	mtx_unlock(&bounce_lock);
 
 	return (0);
 }
 
 /*
  * Add a single contiguous physical range to the segment list.
  */
 static int
 _bus_dmamap_addseg(bus_dma_tag_t dmat, bus_dmamap_t map, bus_addr_t curaddr,
 		   bus_size_t sgsize, bus_dma_segment_t *segs, int *segp)
 {
 	bus_addr_t baddr, bmask;
 	int seg;
 
 	/*
 	 * Make sure we don't cross any boundaries.
 	 */
 	bmask = ~(dmat->boundary - 1);
 	if (dmat->boundary > 0) {
 		baddr = (curaddr + dmat->boundary) & bmask;
 		if (sgsize > (baddr - curaddr))
 			sgsize = (baddr - curaddr);
 	}
 
 	/*
 	 * Insert chunk into a segment, coalescing with
 	 * previous segment if possible.
 	 */
 	seg = *segp;
 	if (seg == -1) {
 		seg = 0;
 		segs[seg].ds_addr = curaddr;
 		segs[seg].ds_len = sgsize;
 	} else {
 		if (curaddr == segs[seg].ds_addr + segs[seg].ds_len &&
 		    (segs[seg].ds_len + sgsize) <= dmat->maxsegsz &&
 		    (dmat->boundary == 0 ||
 		     (segs[seg].ds_addr & bmask) == (curaddr & bmask)))
 			segs[seg].ds_len += sgsize;
 		else {
 			if (++seg >= dmat->nsegments)
 				return (0);
 			segs[seg].ds_addr = curaddr;
 			segs[seg].ds_len = sgsize;
 		}
 	}
 	*segp = seg;
 	return (sgsize);
 }
 
 /*
  * Utility function to load a physical buffer.  segp contains
  * the starting segment on entrace, and the ending segment on exit.
  */
 int
 _bus_dmamap_load_phys(bus_dma_tag_t dmat,
 		      bus_dmamap_t map,
 		      vm_paddr_t buf, bus_size_t buflen,
 		      int flags,
 		      bus_dma_segment_t *segs,
 		      int *segp)
 {
 	bus_addr_t curaddr;
 	bus_size_t sgsize;
 	int error;
 
 	if (segs == NULL)
 		segs = map->segments;
 
 	if ((dmat->flags & BUS_DMA_COULD_BOUNCE) != 0) {
 		_bus_dmamap_count_phys(dmat, map, buf, buflen, flags);
 		if (map->pagesneeded != 0) {
 			error = _bus_dmamap_reserve_pages(dmat, map, flags);
 			if (error)
 				return (error);
 		}
 	}
 
 	while (buflen > 0) {
 		curaddr = buf;
 		sgsize = MIN(buflen, dmat->maxsegsz);
 		if (map->pagesneeded != 0 && run_filter(dmat, curaddr)) {
 			sgsize = MIN(sgsize, PAGE_SIZE - (curaddr & PAGE_MASK));
 			curaddr = add_bounce_page(dmat, map, 0, curaddr,
 			    sgsize);
 		}
 		sgsize = _bus_dmamap_addseg(dmat, map, curaddr, sgsize, segs,
 		    segp);
 		if (sgsize == 0)
 			break;
 		buf += sgsize;
 		buflen -= sgsize;
 	}
 
 	/*
 	 * Did we fit?
 	 */
 	return (buflen != 0 ? EFBIG : 0); /* XXX better return value here? */
 }
 
 int
 _bus_dmamap_load_ma(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct vm_page **ma, bus_size_t tlen, int ma_offs, int flags,
     bus_dma_segment_t *segs, int *segp)
 {
 
 	return (bus_dmamap_load_ma_triv(dmat, map, ma, tlen, ma_offs, flags,
 	    segs, segp));
 }
 
 /*
  * Utility function to load a linear buffer.  segp contains
  * the starting segment on entrance, and the ending segment on exit.
  */
 int
 _bus_dmamap_load_buffer(bus_dma_tag_t dmat,
     			bus_dmamap_t map,
 			void *buf, bus_size_t buflen,
 			pmap_t pmap,
 			int flags,
 			bus_dma_segment_t *segs,
 			int *segp)
 {
 	bus_size_t sgsize;
 	bus_addr_t curaddr;
 	vm_offset_t kvaddr, vaddr;
 	int error;
 
 	if (segs == NULL)
 		segs = map->segments;
 
 	if ((dmat->flags & BUS_DMA_COULD_BOUNCE) != 0) {
 		_bus_dmamap_count_pages(dmat, map, pmap, buf, buflen, flags);
 		if (map->pagesneeded != 0) {
 			error = _bus_dmamap_reserve_pages(dmat, map, flags);
 			if (error)
 				return (error);
 		}
 	}
 
 	vaddr = (vm_offset_t)buf;
 
 	while (buflen > 0) {
 		bus_size_t max_sgsize;
 
 		/*
 		 * Get the physical address for this segment.
 		 */
 		if (pmap == kernel_pmap) {
 			curaddr = pmap_kextract(vaddr);
 			kvaddr = vaddr;
 		} else {
 			curaddr = pmap_extract(pmap, vaddr);
 			kvaddr = 0;
 		}
 
 		/*
 		 * Compute the segment size, and adjust counts.
 		 */
 		max_sgsize = MIN(buflen, dmat->maxsegsz);
 		sgsize = PAGE_SIZE - (curaddr & PAGE_MASK);
 		if (map->pagesneeded != 0 && run_filter(dmat, curaddr)) {
 			sgsize = roundup2(sgsize, dmat->alignment);
 			sgsize = MIN(sgsize, max_sgsize);
 			curaddr = add_bounce_page(dmat, map, kvaddr, curaddr,
 			    sgsize);
 		} else {
 			sgsize = MIN(sgsize, max_sgsize);
 		}
 
 		sgsize = _bus_dmamap_addseg(dmat, map, curaddr, sgsize, segs,
 		    segp);
 		if (sgsize == 0)
 			break;
 		vaddr += sgsize;
 		buflen -= sgsize;
 	}
 
 	/*
 	 * Did we fit?
 	 */
 	return (buflen != 0 ? EFBIG : 0); /* XXX better return value here? */
 }
 
 void
 _bus_dmamap_waitok(bus_dma_tag_t dmat, bus_dmamap_t map,
 		    struct memdesc *mem, bus_dmamap_callback_t *callback,
 		    void *callback_arg)
 {
 
 	if (dmat->flags & BUS_DMA_COULD_BOUNCE) {
 		map->dmat = dmat;
 		map->mem = *mem;
 		map->callback = callback;
 		map->callback_arg = callback_arg;
 	}
 }
 
 bus_dma_segment_t *
 _bus_dmamap_complete(bus_dma_tag_t dmat, bus_dmamap_t map,
 		     bus_dma_segment_t *segs, int nsegs, int error)
 {
 
 	map->nsegs = nsegs;
 	if (segs != NULL)
 		memcpy(map->segments, segs, map->nsegs*sizeof(segs[0]));
 	if (dmat->iommu != NULL)
 		IOMMU_MAP(dmat->iommu, map->segments, &map->nsegs,
 		    dmat->lowaddr, dmat->highaddr, dmat->alignment,
 		    dmat->boundary, dmat->iommu_cookie);
 
 	if (segs != NULL)
 		memcpy(segs, map->segments, map->nsegs*sizeof(segs[0]));
 	else
 		segs = map->segments;
 
 	return (segs);
 }
 
 /*
  * Release the mapping held by map.
  */
 void
 bus_dmamap_unload(bus_dma_tag_t dmat, bus_dmamap_t map)
 {
 	struct bounce_page *bpage;
 
 	if (dmat->iommu) {
 		IOMMU_UNMAP(dmat->iommu, map->segments, map->nsegs, dmat->iommu_cookie);
 		map->nsegs = 0;
 	}
 
 	while ((bpage = STAILQ_FIRST(&map->bpages)) != NULL) {
 		STAILQ_REMOVE_HEAD(&map->bpages, links);
 		free_bounce_page(dmat, bpage);
 	}
 }
 
 void
 bus_dmamap_sync(bus_dma_tag_t dmat, bus_dmamap_t map, bus_dmasync_op_t op)
 {
 	struct bounce_page *bpage;
 	vm_offset_t datavaddr, tempvaddr;
 
 	if ((bpage = STAILQ_FIRST(&map->bpages)) != NULL) {
 		/*
 		 * Handle data bouncing.  We might also
 		 * want to add support for invalidating
 		 * the caches on broken hardware
 		 */
 		CTR4(KTR_BUSDMA, "%s: tag %p tag flags 0x%x op 0x%x "
 		    "performing bounce", __func__, dmat, dmat->flags, op);
 
 		if (op & BUS_DMASYNC_PREWRITE) {
 			while (bpage != NULL) {
 				tempvaddr = 0;
 				datavaddr = bpage->datavaddr;
 				if (datavaddr == 0) {
 					tempvaddr = pmap_quick_enter_page(
 					    bpage->datapage);
 					datavaddr = tempvaddr |
 					    bpage->dataoffs;
 				}
 
 				bcopy((void *)datavaddr,
 				    (void *)bpage->vaddr, bpage->datacount);
 
 				if (tempvaddr != 0)
 					pmap_quick_remove_page(tempvaddr);
 				bpage = STAILQ_NEXT(bpage, links);
 			}
 			dmat->bounce_zone->total_bounced++;
 		}
 
 		if (op & BUS_DMASYNC_POSTREAD) {
 			while (bpage != NULL) {
 				tempvaddr = 0;
 				datavaddr = bpage->datavaddr;
 				if (datavaddr == 0) {
 					tempvaddr = pmap_quick_enter_page(
 					    bpage->datapage);
 					datavaddr = tempvaddr |
 					    bpage->dataoffs;
 				}
 
 				bcopy((void *)bpage->vaddr,
 				    (void *)datavaddr, bpage->datacount);
 
 				if (tempvaddr != 0)
 					pmap_quick_remove_page(tempvaddr);
 				bpage = STAILQ_NEXT(bpage, links);
 			}
 			dmat->bounce_zone->total_bounced++;
 		}
 	}
 
 	powerpc_sync();
 }
 
 static void
 init_bounce_pages(void *dummy __unused)
 {
 
 	total_bpages = 0;
 	STAILQ_INIT(&bounce_zone_list);
 	STAILQ_INIT(&bounce_map_waitinglist);
 	STAILQ_INIT(&bounce_map_callbacklist);
 	mtx_init(&bounce_lock, "bounce pages lock", NULL, MTX_DEF);
 }
 SYSINIT(bpages, SI_SUB_LOCK, SI_ORDER_ANY, init_bounce_pages, NULL);
 
 static struct sysctl_ctx_list *
 busdma_sysctl_tree(struct bounce_zone *bz)
 {
 	return (&bz->sysctl_tree);
 }
 
 static struct sysctl_oid *
 busdma_sysctl_tree_top(struct bounce_zone *bz)
 {
 	return (bz->sysctl_tree_top);
 }
 
 static int
 alloc_bounce_zone(bus_dma_tag_t dmat)
 {
 	struct bounce_zone *bz;
 
 	/* Check to see if we already have a suitable zone */
 	STAILQ_FOREACH(bz, &bounce_zone_list, links) {
 		if ((dmat->alignment <= bz->alignment)
 		 && (dmat->lowaddr >= bz->lowaddr)) {
 			dmat->bounce_zone = bz;
 			return (0);
 		}
 	}
 
 	if ((bz = (struct bounce_zone *)malloc(sizeof(*bz), M_DEVBUF,
 	    M_NOWAIT | M_ZERO)) == NULL)
 		return (ENOMEM);
 
 	STAILQ_INIT(&bz->bounce_page_list);
 	bz->free_bpages = 0;
 	bz->reserved_bpages = 0;
 	bz->active_bpages = 0;
 	bz->lowaddr = dmat->lowaddr;
 	bz->alignment = MAX(dmat->alignment, PAGE_SIZE);
 	bz->map_count = 0;
 	snprintf(bz->zoneid, 8, "zone%d", busdma_zonecount);
 	busdma_zonecount++;
 	snprintf(bz->lowaddrid, 18, "%#jx", (uintmax_t)bz->lowaddr);
 	STAILQ_INSERT_TAIL(&bounce_zone_list, bz, links);
 	dmat->bounce_zone = bz;
 
 	sysctl_ctx_init(&bz->sysctl_tree);
 	bz->sysctl_tree_top = SYSCTL_ADD_NODE(&bz->sysctl_tree,
 	    SYSCTL_STATIC_CHILDREN(_hw_busdma), OID_AUTO, bz->zoneid,
 	    CTLFLAG_RD | CTLFLAG_MPSAFE, 0, "");
 	if (bz->sysctl_tree_top == NULL) {
 		sysctl_ctx_free(&bz->sysctl_tree);
 		return (0);	/* XXX error code? */
 	}
 
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_bpages", CTLFLAG_RD, &bz->total_bpages, 0,
 	    "Total bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "free_bpages", CTLFLAG_RD, &bz->free_bpages, 0,
 	    "Free bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "reserved_bpages", CTLFLAG_RD, &bz->reserved_bpages, 0,
 	    "Reserved bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "active_bpages", CTLFLAG_RD, &bz->active_bpages, 0,
 	    "Active bounce pages");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_bounced", CTLFLAG_RD, &bz->total_bounced, 0,
 	    "Total bounce requests");
 	SYSCTL_ADD_INT(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "total_deferred", CTLFLAG_RD, &bz->total_deferred, 0,
 	    "Total bounce requests that were deferred");
 	SYSCTL_ADD_STRING(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "lowaddr", CTLFLAG_RD, bz->lowaddrid, 0, "");
 	SYSCTL_ADD_UAUTO(busdma_sysctl_tree(bz),
 	    SYSCTL_CHILDREN(busdma_sysctl_tree_top(bz)), OID_AUTO,
 	    "alignment", CTLFLAG_RD, &bz->alignment, "");
 
 	return (0);
 }
 
 static int
 alloc_bounce_pages(bus_dma_tag_t dmat, u_int numpages)
 {
 	struct bounce_zone *bz;
 	int count;
 
 	bz = dmat->bounce_zone;
 	count = 0;
 	while (numpages > 0) {
 		struct bounce_page *bpage;
 
 		bpage = (struct bounce_page *)malloc(sizeof(*bpage), M_DEVBUF,
 						     M_NOWAIT | M_ZERO);
 
 		if (bpage == NULL)
 			break;
 		bpage->vaddr = (vm_offset_t)contigmalloc(PAGE_SIZE, M_DEVBUF,
 							 M_NOWAIT, 0ul,
 							 bz->lowaddr,
 							 PAGE_SIZE,
 							 0);
 		if (bpage->vaddr == 0) {
 			free(bpage, M_DEVBUF);
 			break;
 		}
 		bpage->busaddr = pmap_kextract(bpage->vaddr);
 		mtx_lock(&bounce_lock);
 		STAILQ_INSERT_TAIL(&bz->bounce_page_list, bpage, links);
 		total_bpages++;
 		bz->total_bpages++;
 		bz->free_bpages++;
 		mtx_unlock(&bounce_lock);
 		count++;
 		numpages--;
 	}
 	return (count);
 }
 
 static int
 reserve_bounce_pages(bus_dma_tag_t dmat, bus_dmamap_t map, int commit)
 {
 	struct bounce_zone *bz;
 	int pages;
 
 	mtx_assert(&bounce_lock, MA_OWNED);
 	bz = dmat->bounce_zone;
 	pages = MIN(bz->free_bpages, map->pagesneeded - map->pagesreserved);
 	if (commit == 0 && map->pagesneeded > (map->pagesreserved + pages))
 		return (map->pagesneeded - (map->pagesreserved + pages));
 	bz->free_bpages -= pages;
 	bz->reserved_bpages += pages;
 	map->pagesreserved += pages;
 	pages = map->pagesneeded - map->pagesreserved;
 
 	return (pages);
 }
 
 static bus_addr_t
 add_bounce_page(bus_dma_tag_t dmat, bus_dmamap_t map, vm_offset_t vaddr,
 		bus_addr_t addr, bus_size_t size)
 {
 	struct bounce_zone *bz;
 	struct bounce_page *bpage;
 
 	KASSERT(dmat->bounce_zone != NULL, ("no bounce zone in dma tag"));
 
 	bz = dmat->bounce_zone;
 	if (map->pagesneeded == 0)
 		panic("add_bounce_page: map doesn't need any pages");
 	map->pagesneeded--;
 
 	if (map->pagesreserved == 0)
 		panic("add_bounce_page: map doesn't need any pages");
 	map->pagesreserved--;
 
 	mtx_lock(&bounce_lock);
 	bpage = STAILQ_FIRST(&bz->bounce_page_list);
 	if (bpage == NULL)
 		panic("add_bounce_page: free page list is empty");
 
 	STAILQ_REMOVE_HEAD(&bz->bounce_page_list, links);
 	bz->reserved_bpages--;
 	bz->active_bpages++;
 	mtx_unlock(&bounce_lock);
 
 	if (dmat->flags & BUS_DMA_KEEP_PG_OFFSET) {
 		/* Page offset needs to be preserved. */
 		bpage->vaddr |= addr & PAGE_MASK;
 		bpage->busaddr |= addr & PAGE_MASK;
 	}
 	bpage->datavaddr = vaddr;
 	bpage->datapage = PHYS_TO_VM_PAGE(addr);
 	bpage->dataoffs = addr & PAGE_MASK;
 	bpage->datacount = size;
 	STAILQ_INSERT_TAIL(&(map->bpages), bpage, links);
 	return (bpage->busaddr);
 }
 
 static void
 free_bounce_page(bus_dma_tag_t dmat, struct bounce_page *bpage)
 {
 	struct bus_dmamap *map;
 	struct bounce_zone *bz;
 
 	bz = dmat->bounce_zone;
 	bpage->datavaddr = 0;
 	bpage->datacount = 0;
 	if (dmat->flags & BUS_DMA_KEEP_PG_OFFSET) {
 		/*
 		 * Reset the bounce page to start at offset 0.  Other uses
 		 * of this bounce page may need to store a full page of
 		 * data and/or assume it starts on a page boundary.
 		 */
 		bpage->vaddr &= ~PAGE_MASK;
 		bpage->busaddr &= ~PAGE_MASK;
 	}
 
 	mtx_lock(&bounce_lock);
 	STAILQ_INSERT_HEAD(&bz->bounce_page_list, bpage, links);
 	bz->free_bpages++;
 	bz->active_bpages--;
 	if ((map = STAILQ_FIRST(&bounce_map_waitinglist)) != NULL) {
 		if (reserve_bounce_pages(map->dmat, map, 1) == 0) {
 			STAILQ_REMOVE_HEAD(&bounce_map_waitinglist, links);
 			STAILQ_INSERT_TAIL(&bounce_map_callbacklist,
 					   map, links);
 			busdma_swi_pending = 1;
 			bz->total_deferred++;
 			swi_sched(vm_ih, 0);
 		}
 	}
 	mtx_unlock(&bounce_lock);
 }
 
 void
 busdma_swi(void)
 {
 	bus_dma_tag_t dmat;
 	struct bus_dmamap *map;
 
 	mtx_lock(&bounce_lock);
 	while ((map = STAILQ_FIRST(&bounce_map_callbacklist)) != NULL) {
 		STAILQ_REMOVE_HEAD(&bounce_map_callbacklist, links);
 		mtx_unlock(&bounce_lock);
 		dmat = map->dmat;
 		(dmat->lockfunc)(dmat->lockfuncarg, BUS_DMA_LOCK);
 		bus_dmamap_load_mem(map->dmat, map, &map->mem,
 				    map->callback, map->callback_arg,
 				    BUS_DMA_WAITOK);
 		(dmat->lockfunc)(dmat->lockfuncarg, BUS_DMA_UNLOCK);
 		mtx_lock(&bounce_lock);
 	}
 	mtx_unlock(&bounce_lock);
 }
 
 int
 bus_dma_tag_set_iommu(bus_dma_tag_t tag, device_t iommu, void *cookie)
 {
 	tag->iommu = iommu;
 	tag->iommu_cookie = cookie;
 
 	return (0);
 }
Index: head/sys/riscv/riscv/busdma_machdep.c
===================================================================
--- head/sys/riscv/riscv/busdma_machdep.c	(revision 365705)
+++ head/sys/riscv/riscv/busdma_machdep.c	(revision 365706)
@@ -1,285 +1,254 @@
 /*-
  * Copyright (c) 1997, 1998 Justin T. Gibbs.
  * Copyright (c) 2013, 2015 The FreeBSD Foundation
  * All rights reserved.
  *
  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
  * under sponsorship from the FreeBSD Foundation.
  *
  * Portions of this software were developed by Semihalf
  * under sponsorship of the FreeBSD Foundation.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions, and the following disclaimer,
  *    without modification, immediately at the beginning of the file.
  * 2. The name of the author may not be used to endorse or promote products
  *    derived from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/malloc.h>
 #include <sys/bus.h>
 #include <sys/kernel.h>
 #include <sys/ktr.h>
 #include <sys/lock.h>
 #include <sys/memdesc.h>
 #include <sys/mutex.h>
 #include <sys/uio.h>
 #include <vm/vm.h>
 #include <vm/vm_extern.h>
 #include <vm/pmap.h>
 
 #include <machine/bus.h>
 #include <machine/bus_dma_impl.h>
 
 /*
  * Convenience function for manipulating driver locks from busdma (during
  * busdma_swi, for example).  Drivers that don't provide their own locks
  * should specify &Giant to dmat->lockfuncarg.  Drivers that use their own
  * non-mutex locking scheme don't have to use this at all.
  */
 void
 busdma_lock_mutex(void *arg, bus_dma_lock_op_t op)
 {
 	struct mtx *dmtx;
 
 	dmtx = (struct mtx *)arg;
 	switch (op) {
 	case BUS_DMA_LOCK:
 		mtx_lock(dmtx);
 		break;
 	case BUS_DMA_UNLOCK:
 		mtx_unlock(dmtx);
 		break;
 	default:
 		panic("Unknown operation 0x%x for busdma_lock_mutex!", op);
 	}
 }
 
 /*
  * dflt_lock should never get called.  It gets put into the dma tag when
  * lockfunc == NULL, which is only valid if the maps that are associated
  * with the tag are meant to never be defered.
  * XXX Should have a way to identify which driver is responsible here.
  */
 void
 bus_dma_dflt_lock(void *arg, bus_dma_lock_op_t op)
 {
 
 	panic("driver error: busdma dflt_lock called");
 }
 
 /*
  * Return true if a match is made.
  *
  * To find a match walk the chain of bus_dma_tag_t's looking for 'paddr'.
  *
  * If paddr is within the bounds of the dma tag then call the filter callback
  * to check for a match, if there is no filter callback then assume a match.
  */
 int
 bus_dma_run_filter(struct bus_dma_tag_common *tc, bus_addr_t paddr)
 {
 	int retval;
 
 	retval = 0;
 	do {
 		if (((paddr > tc->lowaddr && paddr <= tc->highaddr) ||
 		    ((paddr & (tc->alignment - 1)) != 0)) &&
 		    (tc->filter == NULL ||
 		    (*tc->filter)(tc->filterarg, paddr) != 0))
 			retval = 1;
 
 		tc = tc->parent;		
 	} while (retval == 0 && tc != NULL);
 	return (retval);
 }
 
 int
 common_bus_dma_tag_create(struct bus_dma_tag_common *parent,
     bus_size_t alignment, bus_addr_t boundary, bus_addr_t lowaddr,
     bus_addr_t highaddr, bus_dma_filter_t *filter, void *filterarg,
     bus_size_t maxsize, int nsegments, bus_size_t maxsegsz, int flags,
     bus_dma_lock_t *lockfunc, void *lockfuncarg, size_t sz, void **dmat)
 {
 	void *newtag;
 	struct bus_dma_tag_common *common;
 
 	KASSERT(sz >= sizeof(struct bus_dma_tag_common), ("sz"));
 	/* Return a NULL tag on failure */
 	*dmat = NULL;
 	/* Basic sanity checking */
 	if (boundary != 0 && boundary < maxsegsz)
 		maxsegsz = boundary;
 	if (maxsegsz == 0)
 		return (EINVAL);
 
 	newtag = malloc(sz, M_DEVBUF, M_ZERO | M_NOWAIT);
 	if (newtag == NULL) {
 		CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 		    __func__, newtag, 0, ENOMEM);
 		return (ENOMEM);
 	}
 
 	common = newtag;
 	common->impl = &bus_dma_bounce_impl;
 	common->parent = parent;
 	common->alignment = alignment;
 	common->boundary = boundary;
 	common->lowaddr = trunc_page((vm_paddr_t)lowaddr) + (PAGE_SIZE - 1);
 	common->highaddr = trunc_page((vm_paddr_t)highaddr) + (PAGE_SIZE - 1);
 	common->filter = filter;
 	common->filterarg = filterarg;
 	common->maxsize = maxsize;
 	common->nsegments = nsegments;
 	common->maxsegsz = maxsegsz;
 	common->flags = flags;
 	common->ref_count = 1; /* Count ourself */
 	if (lockfunc != NULL) {
 		common->lockfunc = lockfunc;
 		common->lockfuncarg = lockfuncarg;
 	} else {
 		common->lockfunc = bus_dma_dflt_lock;
 		common->lockfuncarg = NULL;
 	}
 
 	/* Take into account any restrictions imposed by our parent tag */
 	if (parent != NULL) {
 		common->impl = parent->impl;
 		common->lowaddr = MIN(parent->lowaddr, common->lowaddr);
 		common->highaddr = MAX(parent->highaddr, common->highaddr);
 		if (common->boundary == 0)
 			common->boundary = parent->boundary;
 		else if (parent->boundary != 0) {
 			common->boundary = MIN(parent->boundary,
 			    common->boundary);
 		}
 		if (common->filter == NULL) {
 			/*
 			 * Short circuit looking at our parent directly
 			 * since we have encapsulated all of its information
 			 */
 			common->filter = parent->filter;
 			common->filterarg = parent->filterarg;
 			common->parent = parent->parent;
 		}
 		atomic_add_int(&parent->ref_count, 1);
 	}
 	*dmat = common;
 	return (0);
 }
 
 /*
  * Allocate a device specific dma_tag.
  */
 int
 bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
     bus_addr_t boundary, bus_addr_t lowaddr, bus_addr_t highaddr,
     bus_dma_filter_t *filter, void *filterarg, bus_size_t maxsize,
     int nsegments, bus_size_t maxsegsz, int flags, bus_dma_lock_t *lockfunc,
     void *lockfuncarg, bus_dma_tag_t *dmat)
 {
 	struct bus_dma_tag_common *tc;
 	int error;
 
 	if (parent == NULL) {
 		error = bus_dma_bounce_impl.tag_create(parent, alignment,
 		    boundary, lowaddr, highaddr, filter, filterarg, maxsize,
 		    nsegments, maxsegsz, flags, lockfunc, lockfuncarg, dmat);
 	} else {
 		tc = (struct bus_dma_tag_common *)parent;
 		error = tc->impl->tag_create(parent, alignment,
 		    boundary, lowaddr, highaddr, filter, filterarg, maxsize,
 		    nsegments, maxsegsz, flags, lockfunc, lockfuncarg, dmat);
 	}
 	return (error);
 }
 
 void
-bus_dma_template_init(bus_dma_tag_template_t *t, bus_dma_tag_t parent)
-{
-
-	if (t == NULL)
-		return;
-
-	t->parent = parent;
-	t->alignment = 1;
-	t->boundary = 0;
-	t->lowaddr = t->highaddr = BUS_SPACE_MAXADDR;
-	t->maxsize = t->maxsegsize = BUS_SPACE_MAXSIZE;
-	t->nsegments = BUS_SPACE_UNRESTRICTED;
-	t->lockfunc = NULL;
-	t->lockfuncarg = NULL;
-	t->flags = 0;
-}
-
-int
-bus_dma_template_tag(bus_dma_tag_template_t *t, bus_dma_tag_t *dmat)
-{
-
-	if (t == NULL || dmat == NULL)
-		return (EINVAL);
-
-	return (bus_dma_tag_create(t->parent, t->alignment, t->boundary,
-	    t->lowaddr, t->highaddr, NULL, NULL, t->maxsize,
-	    t->nsegments, t->maxsegsize, t->flags, t->lockfunc, t->lockfuncarg,
-	    dmat));
-}
-
-void
-bus_dma_template_clone(bus_dma_tag_template_t *t, bus_dma_tag_t dmat)
+bus_dma_template_clone(bus_dma_template_t *t, bus_dma_tag_t dmat)
 {
 	struct bus_dma_tag_common *common;
 
 	if (t == NULL || dmat == NULL)
 		return;
 
 	common = (struct bus_dma_tag_common *)dmat;
 
 	t->parent = (bus_dma_tag_t)common->parent;
 	t->alignment = common->alignment;
 	t->boundary = common->boundary;
 	t->lowaddr = common->lowaddr;
 	t->highaddr = common->highaddr;
 	t->maxsize = common->maxsize;
 	t->nsegments = common->nsegments;
 	t->maxsegsize = common->maxsegsz;
 	t->flags = common->flags;
 	t->lockfunc = common->lockfunc;
 	t->lockfuncarg = common->lockfuncarg;
 }
 
 int
 bus_dma_tag_destroy(bus_dma_tag_t dmat)
 {
 	struct bus_dma_tag_common *tc;
 
 	tc = (struct bus_dma_tag_common *)dmat;
 	return (tc->impl->tag_destroy(dmat));
 }
 
 int
 bus_dma_tag_set_domain(bus_dma_tag_t dmat, int domain)
 {
 
 	return (0);
 }
Index: head/sys/sys/bus_dma.h
===================================================================
--- head/sys/sys/bus_dma.h	(revision 365705)
+++ head/sys/sys/bus_dma.h	(revision 365706)
@@ -1,341 +1,400 @@
 /*	$NetBSD: bus.h,v 1.12 1997/10/01 08:25:15 fvdl Exp $	*/
 
 /*-
  * SPDX-License-Identifier: (BSD-2-Clause-NetBSD AND BSD-4-Clause)
  *
  * Copyright (c) 1996, 1997 The NetBSD Foundation, Inc.
  * All rights reserved.
  *
  * This code is derived from software contributed to The NetBSD Foundation
  * by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
  * NASA Ames Research Center.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  * POSSIBILITY OF SUCH DAMAGE.
  */
 
 /*-
  * Copyright (c) 1996 Charles M. Hannum.  All rights reserved.
  * Copyright (c) 1996 Christopher G. Demetriou.  All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. All advertising materials mentioning features or use of this software
  *    must display the following acknowledgement:
  *      This product includes software developed by Christopher G. Demetriou
  *	for the NetBSD Project.
  * 4. The name of the author may not be used to endorse or promote products
  *    derived from this software without specific prior written permission
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */
 /* $FreeBSD$ */
 
 #ifndef _BUS_DMA_H_
 #define _BUS_DMA_H_
 
 #ifdef _KERNEL
 #include <sys/_bus_dma.h>
 #endif
 
 /*
  * Machine independent interface for mapping physical addresses to peripheral
  * bus 'physical' addresses, and assisting with DMA operations.
  *
  * XXX This file is always included from <machine/bus_dma.h> and should not
  *     (yet) be included directly.
  */
 
 /*
  * Flags used in various bus DMA methods.
  */
 #define	BUS_DMA_WAITOK		0x00	/* safe to sleep (pseudo-flag) */
 #define	BUS_DMA_NOWAIT		0x01	/* not safe to sleep */
 #define	BUS_DMA_ALLOCNOW	0x02	/* perform resource allocation now */
 #define	BUS_DMA_COHERENT	0x04	/* hint: map memory in a coherent way */
 #define	BUS_DMA_ZERO		0x08	/* allocate zero'ed memory */
 #define	BUS_DMA_BUS1		0x10	/* placeholders for bus functions... */
 #define	BUS_DMA_BUS2		0x20
 #define	BUS_DMA_BUS3		0x40
 #define	BUS_DMA_BUS4		0x80
 
 /*
  * The following two flags are non-standard or specific to only certain
  * architectures
  */
 #define	BUS_DMA_NOWRITE		0x100
 #define	BUS_DMA_NOCACHE		0x200
 
 /*
  * The following flag is a DMA tag hint that the page offset of the
  * loaded kernel virtual address must be preserved in the first
  * physical segment address, when the KVA is loaded into DMA.
  */
 #define	BUS_DMA_KEEP_PG_OFFSET	0x400
 
 #define	BUS_DMA_LOAD_MBUF	0x800
 
 /* Forwards needed by prototypes below. */
 union ccb;
 struct bio;
 struct crypto_buffer;
 struct cryptop;
 struct mbuf;
 struct memdesc;
 struct pmap;
 struct uio;
 
 /*
  * Operations performed by bus_dmamap_sync().
  */
 #define	BUS_DMASYNC_PREREAD	1
 #define	BUS_DMASYNC_POSTREAD	2
 #define	BUS_DMASYNC_PREWRITE	4
 #define	BUS_DMASYNC_POSTWRITE	8
 
 /*
  *	bus_dma_segment_t
  *
  *	Describes a single contiguous DMA transaction.  Values
  *	are suitable for programming into DMA registers.
  */
 typedef struct bus_dma_segment {
 	bus_addr_t	ds_addr;	/* DMA address */
 	bus_size_t	ds_len;		/* length of transfer */
 } bus_dma_segment_t;
 
 #ifdef _KERNEL
 /*
  * A function that returns 1 if the address cannot be accessed by
  * a device and 0 if it can be.
  */
 typedef int bus_dma_filter_t(void *, bus_addr_t);
 
 /*
  * Generic helper function for manipulating mutexes.
  */
 void busdma_lock_mutex(void *arg, bus_dma_lock_op_t op);
 
 /*
  * Allocate a device specific dma_tag encapsulating the constraints of
  * the parent tag in addition to other restrictions specified:
  *
  *	alignment:	Alignment for segments.
  *	boundary:	Boundary that segments cannot cross.
  *	lowaddr:	Low restricted address that cannot appear in a mapping.
  *	highaddr:	High restricted address that cannot appear in a mapping.
  *	filtfunc:	An optional function to further test if an address
  *			within the range of lowaddr and highaddr cannot appear
  *			in a mapping.
  *	filtfuncarg:	An argument that will be passed to filtfunc in addition
  *			to the address to test.
  *	maxsize:	Maximum mapping size supported by this tag.
  *	nsegments:	Number of discontinuities allowed in maps.
  *	maxsegsz:	Maximum size of a segment in the map.
  *	flags:		Bus DMA flags.
  *	lockfunc:	An optional function to handle driver-defined lock
  *			operations.
  *	lockfuncarg:	An argument that will be passed to lockfunc in addition
  *			to the lock operation.
  *	dmat:		A pointer to set to a valid dma tag should the return
  *			value of this function indicate success.
  */
 /* XXX Should probably allow specification of alignment */
 int bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
 		       bus_addr_t boundary, bus_addr_t lowaddr,
 		       bus_addr_t highaddr, bus_dma_filter_t *filtfunc,
 		       void *filtfuncarg, bus_size_t maxsize, int nsegments,
 		       bus_size_t maxsegsz, int flags, bus_dma_lock_t *lockfunc,
 		       void *lockfuncarg, bus_dma_tag_t *dmat);
 
-/* Functions for creating and cloning tags via a template */
+/*
+ * Functions for creating and cloning tags via a template,
+ *
+ * bus_dma_template_t is made avaialble publicly so it can be allocated
+ * from the caller stack.  Its contents should be considered private, and
+ * should only be accessed via the documented APIs and macros
+ */
 typedef struct {
 	bus_dma_tag_t		parent;
 	bus_size_t		alignment;
 	bus_addr_t		boundary;
 	bus_addr_t		lowaddr;
 	bus_addr_t		highaddr;
 	bus_size_t		maxsize;
 	int			nsegments;
 	bus_size_t		maxsegsize;
 	int			flags;
 	bus_dma_lock_t		*lockfunc;
 	void			*lockfuncarg;
-} bus_dma_tag_template_t;
-void bus_dma_template_init(bus_dma_tag_template_t *t, bus_dma_tag_t parent);
-int bus_dma_template_tag(bus_dma_tag_template_t *t, bus_dma_tag_t *dmat);
-void bus_dma_template_clone(bus_dma_tag_template_t *t, bus_dma_tag_t dmat);
+	const char		*name;
+} bus_dma_template_t;
+
+/*
+ * These enum values should not be re-ordered.  BD_PARAM_INVALID is an
+ * invalid key and will trigger a panic.
+ */
+typedef enum {
+	BD_PARAM_INVALID	= 0,
+	BD_PARAM_PARENT		= 1,
+	BD_PARAM_ALIGNMENT	= 2,
+	BD_PARAM_BOUNDARY	= 3,
+	BD_PARAM_LOWADDR	= 4,
+	BD_PARAM_HIGHADDR	= 5,
+	BD_PARAM_MAXSIZE	= 6,
+	BD_PARAM_NSEGMENTS	= 7,
+	BD_PARAM_MAXSEGSIZE	= 8,
+	BD_PARAM_FLAGS		= 9,
+	BD_PARAM_LOCKFUNC	= 10,
+	BD_PARAM_LOCKFUNCARG	= 11,
+	BD_PARAM_NAME		= 12
+} bus_dma_param_key_t;
+
+/* These contents should also be considered private */
+typedef struct {
+	bus_dma_param_key_t	key;
+	union {
+		void *ptr;
+		vm_paddr_t pa;
+		uintmax_t num;
+	};
+} bus_dma_param_t;
+
+#define BD_PARENT(val)		{ BD_PARAM_PARENT, .ptr = val }
+#define BD_ALIGNMENT(val)	{ BD_PARAM_ALIGNMENT, .num = val }
+#define BD_BOUNDARY(val)	{ BD_PARAM_BOUNDARY, .num = val }
+#define BD_LOWADDR(val)		{ BD_PARAM_LOWADDR, .pa = val }
+#define BD_HIGHADDR(val)	{ BD_PARAM_HIGHADDR, .pa = val }
+#define BD_MAXSIZE(val)		{ BD_PARAM_MAXSIZE, .num = val }
+#define BD_NSEGMENTS(val)	{ BD_PARAM_NSEGMENTS, .num = val }
+#define BD_MAXSEGSIZE(val)	{ BD_PARAM_MAXSEGSIZE, .num = val }
+#define BD_FLAGS(val)		{ BD_PARAM_FLAGS, .num = val }
+#define BD_LOCKFUNC(val)	{ BD_PARAM_LOCKFUNC, .ptr = val }
+#define BD_LOCKFUNCARG(val)	{ BD_PARAM_LOCKFUNCARG, .ptr = val }
+#define BD_NAME(val)		{ BD_PARAM_NAME, .ptr = val }
+
+#define BUS_DMA_TEMPLATE_FILL(t, kv...) \
+do {					\
+	bus_dma_param_t pm[] = { kv };	\
+	bus_dma_template_fill(t, pm, howmany(sizeof(pm), sizeof(pm[0]))); \
+} while (0)
+
+void bus_dma_template_init(bus_dma_template_t *t, bus_dma_tag_t parent);
+int bus_dma_template_tag(bus_dma_template_t *t, bus_dma_tag_t *dmat);
+void bus_dma_template_clone(bus_dma_template_t *t, bus_dma_tag_t dmat);
+void bus_dma_template_fill(bus_dma_template_t *t, bus_dma_param_t *kv,
+    u_int count);
 
 /*
  * Set the memory domain to be used for allocations.
  *
  * Automatic for PCI devices.  Must be set prior to creating maps or
  * allocating memory.
  */
 int bus_dma_tag_set_domain(bus_dma_tag_t dmat, int domain);
 
 int bus_dma_tag_destroy(bus_dma_tag_t dmat);
 
 /*
  * A function that processes a successfully loaded dma map or an error
  * from a delayed load map.
  */
 typedef void bus_dmamap_callback_t(void *, bus_dma_segment_t *, int, int);
 
 /*
  * Like bus_dmamap_callback but includes map size in bytes.  This is
  * defined as a separate interface to maintain compatibility for users
  * of bus_dmamap_callback_t--at some point these interfaces should be merged.
  */
 typedef void bus_dmamap_callback2_t(void *, bus_dma_segment_t *, int, bus_size_t, int);
 
 /*
  * Map the buffer buf into bus space using the dmamap map.
  */
 int bus_dmamap_load(bus_dma_tag_t dmat, bus_dmamap_t map, void *buf,
 		    bus_size_t buflen, bus_dmamap_callback_t *callback,
 		    void *callback_arg, int flags);
 
 /*
  * Like bus_dmamap_load but for mbufs.  Note the use of the
  * bus_dmamap_callback2_t interface.
  */
 int bus_dmamap_load_mbuf(bus_dma_tag_t dmat, bus_dmamap_t map,
 			 struct mbuf *mbuf,
 			 bus_dmamap_callback2_t *callback, void *callback_arg,
 			 int flags);
 
 int bus_dmamap_load_mbuf_sg(bus_dma_tag_t dmat, bus_dmamap_t map,
 			    struct mbuf *mbuf, bus_dma_segment_t *segs,
 			    int *nsegs, int flags);
 
 /*
  * Like bus_dmamap_load but for uios.  Note the use of the
  * bus_dmamap_callback2_t interface.
  */
 int bus_dmamap_load_uio(bus_dma_tag_t dmat, bus_dmamap_t map,
 			struct uio *ui,
 			bus_dmamap_callback2_t *callback, void *callback_arg,
 			int flags);
 
 /*
  * Like bus_dmamap_load but for cam control blocks.
  */
 int bus_dmamap_load_ccb(bus_dma_tag_t dmat, bus_dmamap_t map, union ccb *ccb,
 			bus_dmamap_callback_t *callback, void *callback_arg,
 			int flags);
 
 /*
  * Like bus_dmamap_load but for bios.
  */
 int bus_dmamap_load_bio(bus_dma_tag_t dmat, bus_dmamap_t map, struct bio *bio,
 			bus_dmamap_callback_t *callback, void *callback_arg,
 			int flags);
 
 /*
  * Like bus_dmamap_load but for crypto ops.
  */
 int bus_dmamap_load_crp(bus_dma_tag_t dmat, bus_dmamap_t map,
 			struct cryptop *crp, bus_dmamap_callback_t *callback,
 			void *callback_arg, int flags);
 int bus_dmamap_load_crp_buffer(bus_dma_tag_t dmat, bus_dmamap_t map,
 			       struct crypto_buffer *cb,
 			       bus_dmamap_callback_t *callback,
 			       void *callback_arg, int flags);
 
 /*
  * Loads any memory descriptor.
  */
 int bus_dmamap_load_mem(bus_dma_tag_t dmat, bus_dmamap_t map,
 			struct memdesc *mem, bus_dmamap_callback_t *callback,
 			void *callback_arg, int flags);
 
 /*
  * Placeholder for use by busdma implementations which do not benefit
  * from optimized procedure to load an array of vm_page_t.  Falls back
  * to do _bus_dmamap_load_phys() in loop.
  */
 int bus_dmamap_load_ma_triv(bus_dma_tag_t dmat, bus_dmamap_t map,
     struct vm_page **ma, bus_size_t tlen, int ma_offs, int flags,
     bus_dma_segment_t *segs, int *segp);
 
 #ifdef WANT_INLINE_DMAMAP
 #define BUS_DMAMAP_OP static inline
 #else
 #define BUS_DMAMAP_OP
 #endif
 
 /*
  * Allocate a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 BUS_DMAMAP_OP int bus_dmamap_create(bus_dma_tag_t dmat, int flags, bus_dmamap_t *mapp);
 
 /*
  * Destroy a handle for mapping from kva/uva/physical
  * address space into bus device space.
  */
 BUS_DMAMAP_OP int bus_dmamap_destroy(bus_dma_tag_t dmat, bus_dmamap_t map);
 
 /*
  * Allocate a piece of memory that can be efficiently mapped into
  * bus device space based on the constraints listed in the dma tag.
  * A dmamap to for use with dmamap_load is also allocated.
  */
 BUS_DMAMAP_OP int bus_dmamem_alloc(bus_dma_tag_t dmat, void** vaddr, int flags,
 		     bus_dmamap_t *mapp);
 
 /*
  * Free a piece of memory and its allocated dmamap, that was allocated
  * via bus_dmamem_alloc.
  */
 BUS_DMAMAP_OP void bus_dmamem_free(bus_dma_tag_t dmat, void *vaddr, bus_dmamap_t map);
 
 /*
  * Perform a synchronization operation on the given map. If the map
  * is NULL we have a fully IO-coherent system.
  */
 BUS_DMAMAP_OP void bus_dmamap_sync(bus_dma_tag_t dmat, bus_dmamap_t dmamap, bus_dmasync_op_t op);
 
 /*
  * Release the mapping held by map.
  */
 BUS_DMAMAP_OP void bus_dmamap_unload(bus_dma_tag_t dmat, bus_dmamap_t dmamap);
 
 #undef BUS_DMAMAP_OP
 #endif /* _KERNEL */
 
 #endif /* _BUS_DMA_H_ */
Index: head/sys/x86/x86/busdma_machdep.c
===================================================================
--- head/sys/x86/x86/busdma_machdep.c	(revision 365705)
+++ head/sys/x86/x86/busdma_machdep.c	(revision 365706)
@@ -1,319 +1,288 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 1997, 1998 Justin T. Gibbs.
  * Copyright (c) 2013 The FreeBSD Foundation
  * All rights reserved.
  *
  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
  * under sponsorship from the FreeBSD Foundation.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions, and the following disclaimer,
  *    without modification, immediately at the beginning of the file.
  * 2. The name of the author may not be used to endorse or promote products
  *    derived from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE FOR
  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include "opt_acpi.h"
 
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/malloc.h>
 #include <sys/bus.h>
 #include <sys/kernel.h>
 #include <sys/ktr.h>
 #include <sys/lock.h>
 #include <sys/memdesc.h>
 #include <sys/mutex.h>
 #include <sys/uio.h>
 #include <sys/vmmeter.h>
 #include <vm/vm.h>
 #include <vm/vm_extern.h>
 #include <vm/vm_param.h>
 #include <vm/vm_page.h>
 #include <vm/vm_phys.h>
 #include <vm/pmap.h>
 #include <machine/bus.h>
 #include <x86/include/busdma_impl.h>
 
 /*
  * Convenience function for manipulating driver locks from busdma (during
  * busdma_swi, for example).  Drivers that don't provide their own locks
  * should specify &Giant to dmat->lockfuncarg.  Drivers that use their own
  * non-mutex locking scheme don't have to use this at all.
  */
 void
 busdma_lock_mutex(void *arg, bus_dma_lock_op_t op)
 {
 	struct mtx *dmtx;
 
 	dmtx = (struct mtx *)arg;
 	switch (op) {
 	case BUS_DMA_LOCK:
 		mtx_lock(dmtx);
 		break;
 	case BUS_DMA_UNLOCK:
 		mtx_unlock(dmtx);
 		break;
 	default:
 		panic("Unknown operation 0x%x for busdma_lock_mutex!", op);
 	}
 }
 
 /*
  * dflt_lock should never get called.  It gets put into the dma tag when
  * lockfunc == NULL, which is only valid if the maps that are associated
  * with the tag are meant to never be defered.
  * XXX Should have a way to identify which driver is responsible here.
  */
 void
 bus_dma_dflt_lock(void *arg, bus_dma_lock_op_t op)
 {
 
 	panic("driver error: busdma dflt_lock called");
 }
 
 /*
  * Return true if a match is made.
  *
  * To find a match walk the chain of bus_dma_tag_t's looking for 'paddr'.
  *
  * If paddr is within the bounds of the dma tag then call the filter callback
  * to check for a match, if there is no filter callback then assume a match.
  */
 int
 bus_dma_run_filter(struct bus_dma_tag_common *tc, vm_paddr_t paddr)
 {
 	int retval;
 
 	retval = 0;
 	do {
 		if ((paddr >= BUS_SPACE_MAXADDR ||
 		    (paddr > tc->lowaddr && paddr <= tc->highaddr) ||
 		    (paddr & (tc->alignment - 1)) != 0) &&
 		    (tc->filter == NULL ||
 		    (*tc->filter)(tc->filterarg, paddr) != 0))
 			retval = 1;
 
 		tc = tc->parent;		
 	} while (retval == 0 && tc != NULL);
 	return (retval);
 }
 
 int
 common_bus_dma_tag_create(struct bus_dma_tag_common *parent,
     bus_size_t alignment, bus_addr_t boundary, bus_addr_t lowaddr,
     bus_addr_t highaddr, bus_dma_filter_t *filter, void *filterarg,
     bus_size_t maxsize, int nsegments, bus_size_t maxsegsz, int flags,
     bus_dma_lock_t *lockfunc, void *lockfuncarg, size_t sz, void **dmat)
 {
 	void *newtag;
 	struct bus_dma_tag_common *common;
 
 	KASSERT(sz >= sizeof(struct bus_dma_tag_common), ("sz"));
 	/* Basic sanity checking */
 	if (boundary != 0 && boundary < maxsegsz)
 		maxsegsz = boundary;
 	if (maxsegsz == 0)
 		return (EINVAL);
 	/* Return a NULL tag on failure */
 	*dmat = NULL;
 
 	newtag = malloc(sz, M_DEVBUF, M_ZERO | M_NOWAIT);
 	if (newtag == NULL) {
 		CTR4(KTR_BUSDMA, "%s returned tag %p tag flags 0x%x error %d",
 		    __func__, newtag, 0, ENOMEM);
 		return (ENOMEM);
 	}
 
 	common = newtag;
 	common->impl = &bus_dma_bounce_impl;
 	common->parent = parent;
 	common->alignment = alignment;
 	common->boundary = boundary;
 	common->lowaddr = trunc_page((vm_paddr_t)lowaddr) + (PAGE_SIZE - 1);
 	common->highaddr = trunc_page((vm_paddr_t)highaddr) + (PAGE_SIZE - 1);
 	common->filter = filter;
 	common->filterarg = filterarg;
 	common->maxsize = maxsize;
 	common->nsegments = nsegments;
 	common->maxsegsz = maxsegsz;
 	common->flags = flags;
 	common->ref_count = 1; /* Count ourself */
 	if (lockfunc != NULL) {
 		common->lockfunc = lockfunc;
 		common->lockfuncarg = lockfuncarg;
 	} else {
 		common->lockfunc = bus_dma_dflt_lock;
 		common->lockfuncarg = NULL;
 	}
 
 	/* Take into account any restrictions imposed by our parent tag */
 	if (parent != NULL) {
 		common->impl = parent->impl;
 		common->lowaddr = MIN(parent->lowaddr, common->lowaddr);
 		common->highaddr = MAX(parent->highaddr, common->highaddr);
 		if (common->boundary == 0)
 			common->boundary = parent->boundary;
 		else if (parent->boundary != 0) {
 			common->boundary = MIN(parent->boundary,
 			    common->boundary);
 		}
 		if (common->filter == NULL) {
 			/*
 			 * Short circuit looking at our parent directly
 			 * since we have encapsulated all of its information
 			 */
 			common->filter = parent->filter;
 			common->filterarg = parent->filterarg;
 			common->parent = parent->parent;
 		}
 		common->domain = parent->domain;
 		atomic_add_int(&parent->ref_count, 1);
 	}
 	common->domain = vm_phys_domain_match(common->domain, 0ul,
 	    common->lowaddr);
 	*dmat = common;
 	return (0);
 }
 
 int
 bus_dma_tag_set_domain(bus_dma_tag_t dmat, int domain)
 {
 	struct bus_dma_tag_common *tc;
 
 	tc = (struct bus_dma_tag_common *)dmat;
 	domain = vm_phys_domain_match(domain, 0ul, tc->lowaddr);
 	/* Only call the callback if it changes. */
 	if (domain == tc->domain)
 		return (0);
 	tc->domain = domain;
 	return (tc->impl->tag_set_domain(dmat));
 }
 
 /*
  * Allocate a device specific dma_tag.
  */
 int
 bus_dma_tag_create(bus_dma_tag_t parent, bus_size_t alignment,
     bus_addr_t boundary, bus_addr_t lowaddr, bus_addr_t highaddr,
     bus_dma_filter_t *filter, void *filterarg, bus_size_t maxsize,
     int nsegments, bus_size_t maxsegsz, int flags, bus_dma_lock_t *lockfunc,
     void *lockfuncarg, bus_dma_tag_t *dmat)
 {
 	struct bus_dma_tag_common *tc;
 	int error;
 
 	if (parent == NULL) {
 		error = bus_dma_bounce_impl.tag_create(parent, alignment,
 		    boundary, lowaddr, highaddr, filter, filterarg, maxsize,
 		    nsegments, maxsegsz, flags, lockfunc, lockfuncarg, dmat);
 	} else {
 		tc = (struct bus_dma_tag_common *)parent;
 		error = tc->impl->tag_create(parent, alignment,
 		    boundary, lowaddr, highaddr, filter, filterarg, maxsize,
 		    nsegments, maxsegsz, flags, lockfunc, lockfuncarg, dmat);
 	}
 	return (error);
 }
 
 void
-bus_dma_template_init(bus_dma_tag_template_t *t, bus_dma_tag_t parent)
-{
-
-	if (t == NULL)
-		return;
-
-	t->parent = parent;
-	t->alignment = 1;
-	t->boundary = 0;
-	t->lowaddr = t->highaddr = BUS_SPACE_MAXADDR;
-	t->maxsize = t->maxsegsize = BUS_SPACE_MAXSIZE;
-	t->nsegments = BUS_SPACE_UNRESTRICTED;
-	t->lockfunc = NULL;
-	t->lockfuncarg = NULL;
-	t->flags = 0;
-}
-
-int
-bus_dma_template_tag(bus_dma_tag_template_t *t, bus_dma_tag_t *dmat)
-{
-
-	if (t == NULL || dmat == NULL)
-		return (EINVAL);
-
-	return (bus_dma_tag_create(t->parent, t->alignment, t->boundary,
-	    t->lowaddr, t->highaddr, NULL, NULL, t->maxsize,
-	    t->nsegments, t->maxsegsize, t->flags, t->lockfunc, t->lockfuncarg,
-	    dmat));
-}
-
-void
-bus_dma_template_clone(bus_dma_tag_template_t *t, bus_dma_tag_t dmat)
+bus_dma_template_clone(bus_dma_template_t *t, bus_dma_tag_t dmat)
 {
 	struct bus_dma_tag_common *common;
 
 	if (t == NULL || dmat == NULL)
 		return;
 
 	common = (struct bus_dma_tag_common *)dmat;
 
 	t->parent = (bus_dma_tag_t)common->parent;
 	t->alignment = common->alignment;
 	t->boundary = common->boundary;
 	t->lowaddr = common->lowaddr;
 	t->highaddr = common->highaddr;
 	t->maxsize = common->maxsize;
 	t->nsegments = common->nsegments;
 	t->maxsegsize = common->maxsegsz;
 	t->flags = common->flags;
 	t->lockfunc = common->lockfunc;
 	t->lockfuncarg = common->lockfuncarg;
 }
 
 int
 bus_dma_tag_destroy(bus_dma_tag_t dmat)
 {
 	struct bus_dma_tag_common *tc;
 
 	tc = (struct bus_dma_tag_common *)dmat;
 	return (tc->impl->tag_destroy(dmat));
 }
 
 #ifndef ACPI_DMAR
 bool bus_dma_iommu_set_buswide(device_t dev);
 int bus_dma_iommu_load_ident(bus_dma_tag_t dmat, bus_dmamap_t map,   
     vm_paddr_t start, vm_size_t length, int flags);
 
 bool
 bus_dma_iommu_set_buswide(device_t dev)
 {
 	return (false);
 }
 
 int
 bus_dma_iommu_load_ident(bus_dma_tag_t dmat, bus_dmamap_t map,
     vm_paddr_t start, vm_size_t length, int flags)
 {
 	return (0);
 }
 #endif