diff --git a/sys/netinet/libalias/alias_sctp.c b/sys/netinet/libalias/alias_sctp.c
index da59694a4e16..4a9fb0214e2a 100644
--- a/sys/netinet/libalias/alias_sctp.c
+++ b/sys/netinet/libalias/alias_sctp.c
@@ -1,2737 +1,2737 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause
  *
  * Copyright (c) 2008
  *	Swinburne University of Technology, Melbourne, Australia.
  *
  *  Redistribution and use in source and binary forms, with or without
  *  modification, are permitted provided that the following conditions
  *  are met:
  *  1. Redistributions of source code must retain the above copyright
  *     notice, this list of conditions and the following disclaimer.
  *  2. Redistributions in binary form must reproduce the above copyright
  *     notice, this list of conditions and the following disclaimer in the
  *     documentation and/or other materials provided with the distribution.
  *
  *  THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS "AS IS" AND
  *  ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  *  IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  *  ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
  *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  *  DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  *  OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  *  HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  *  LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  *  OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  *  SUCH DAMAGE.
  */
 
 /*
  * Alias_sctp forms part of the libalias kernel module to handle
  * Network Address Translation (NAT) for the SCTP protocol.
  *
  *  This software was developed by David A. Hayes and Jason But
  *
  * The design is outlined in CAIA technical report number  080618A
  * (D. Hayes and J. But, "Alias_sctp Version 0.1: SCTP NAT implementation in IPFW")
  *
  * Development is part of the CAIA SONATA project,
  * proposed by Jason But and Grenville Armitage:
  * http://caia.swin.edu.au/urp/sonata/
  *
  *
  * This project has been made possible in part by a grant from
  * the Cisco University Research Program Fund at Community
  * Foundation Silicon Valley.
  *
  */
 /** @mainpage
  * Alias_sctp is part of the SONATA (http://caia.swin.edu.au/urp/sonata) project
  * to develop and release a BSD licensed implementation of a Network Address
  * Translation (NAT) module that supports the Stream Control Transmission
  * Protocol (SCTP).
  *
  * Traditional address and port number look ups are inadequate for SCTP's
  * operation due to both processing requirements and issues with multi-homing.
  * Alias_sctp integrates with FreeBSD's ipfw/libalias NAT system.
  *
  * Version 0.2 features include:
  * - Support for global multi-homing
  * - Support for ASCONF modification from Internet Draft
  *   (draft-stewart-behave-sctpnat-04, R. Stewart and M. Tuexen, "Stream control
  *   transmission protocol (SCTP) network address translation," Jul. 2008) to
  *   provide support for multi-homed privately addressed hosts
  * - Support for forwarding of T-flagged packets
  * - Generation and delivery of AbortM/ErrorM packets upon detection of NAT
  *   collisions
  * - Per-port forwarding rules
  * - Dynamically controllable logging and statistics
  * - Dynamic management of timers
  * - Dynamic control of hash-table size
  */
 
 /* $FreeBSD$ */
 
 #ifdef _KERNEL
 #include <machine/stdarg.h>
 #include <sys/param.h>
 #include <sys/gsb_crc32.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/module.h>
 #include <sys/syslog.h>
 #include <netinet/libalias/alias_sctp.h>
 #include <netinet/libalias/alias.h>
 #include <netinet/libalias/alias_local.h>
 #include <netinet/sctp_crc32.h>
 #include <machine/in_cksum.h>
 #else
 #include "alias_sctp.h"
 #include <arpa/inet.h>
 #include "alias.h"
 #include "alias_local.h"
 #include <machine/in_cksum.h>
 #include <sys/libkern.h>
 #endif //#ifdef _KERNEL
 
 /* ----------------------------------------------------------------------
  *                          FUNCTION PROTOTYPES
  * ----------------------------------------------------------------------
  */
 /* Packet Parsing Functions */
 static int sctp_PktParser(struct libalias *la, int direction, struct ip *pip,
     struct sctp_nat_msg *sm, struct sctp_nat_assoc **passoc);
 static int GetAsconfVtags(struct libalias *la, struct sctp_nat_msg *sm,
     uint32_t *l_vtag, uint32_t *g_vtag, int direction);
 static int IsASCONFack(struct libalias *la, struct sctp_nat_msg *sm, int direction);
 
 static void AddGlobalIPAddresses(struct sctp_nat_msg *sm, struct sctp_nat_assoc *assoc, int direction);
 static int  Add_Global_Address_to_List(struct sctp_nat_assoc *assoc,  struct sctp_GlobalAddress *G_addr);
 static void RmGlobalIPAddresses(struct sctp_nat_msg *sm, struct sctp_nat_assoc *assoc, int direction);
 static int IsADDorDEL(struct libalias *la, struct sctp_nat_msg *sm, int direction);
 
 /* State Machine Functions */
 static int ProcessSctpMsg(struct libalias *la, int direction, \
     struct sctp_nat_msg *sm, struct sctp_nat_assoc *assoc);
 
 static int ID_process(struct libalias *la, int direction,\
     struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm);
 static int INi_process(struct libalias *la, int direction,\
     struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm);
 static int INa_process(struct libalias *la, int direction,\
     struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm);
 static int UP_process(struct libalias *la, int direction,\
     struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm);
 static int CL_process(struct libalias *la, int direction,\
     struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm);
 static void TxAbortErrorM(struct libalias *la,  struct sctp_nat_msg *sm,\
     struct sctp_nat_assoc *assoc, int sndrply, int direction);
 
 /* Hash Table Functions */
 static struct sctp_nat_assoc *
 FindSctpLocal(struct libalias *la, struct in_addr l_addr, struct in_addr g_addr, uint32_t l_vtag, uint16_t l_port, uint16_t g_port);
 static struct sctp_nat_assoc *
 FindSctpGlobal(struct libalias *la, struct in_addr g_addr, uint32_t g_vtag, uint16_t g_port, uint16_t l_port, int *partial_match);
 static struct sctp_nat_assoc *
 FindSctpGlobalClash(struct libalias *la,  struct sctp_nat_assoc *Cassoc);
 static struct sctp_nat_assoc *
 FindSctpLocalT(struct libalias *la,  struct in_addr g_addr, uint32_t l_vtag, uint16_t g_port, uint16_t l_port);
 static struct sctp_nat_assoc *
 FindSctpGlobalT(struct libalias *la, struct in_addr g_addr, uint32_t g_vtag, uint16_t l_port, uint16_t g_port);
 
 static int AddSctpAssocLocal(struct libalias *la, struct sctp_nat_assoc *assoc, struct in_addr g_addr);
 static int AddSctpAssocGlobal(struct libalias *la, struct sctp_nat_assoc *assoc);
 static void RmSctpAssoc(struct libalias *la, struct sctp_nat_assoc *assoc);
 static void freeGlobalAddressList(struct sctp_nat_assoc *assoc);
 
 /* Timer Queue Functions */
 static void sctp_AddTimeOut(struct libalias *la, struct sctp_nat_assoc *assoc);
 static void sctp_RmTimeOut(struct libalias *la, struct sctp_nat_assoc *assoc);
 static void sctp_ResetTimeOut(struct libalias *la, struct sctp_nat_assoc *assoc, int newexp);
 void sctp_CheckTimers(struct libalias *la);
 
 /* Logging Functions */
 static void logsctperror(char *errormsg, uint32_t vtag, int error, int direction);
 static void logsctpparse(int direction, struct sctp_nat_msg *sm);
 static void logsctpassoc(struct sctp_nat_assoc *assoc, char *s);
 static void logTimerQ(struct libalias *la);
 static void logSctpGlobal(struct libalias *la);
 static void logSctpLocal(struct libalias *la);
 #ifdef _KERNEL
 static void SctpAliasLog(const char *format, ...);
 #endif
 
 /** @defgroup external External code changes and modifications
  *
  * Some changes have been made to files external to alias_sctp.(c|h). These
  * changes are primarily due to code needing to call static functions within
  * those files or to perform extra functionality that can only be performed
  * within these files.
  */
 /** @ingroup external
  * @brief Log current statistics for the libalias instance
  *
  * This function is defined in alias_db.c, since it calls static functions in
  * this file
  *
  * Calls the higher level ShowAliasStats() in alias_db.c which logs all current
  * statistics about the libalias instance - including SCTP statistics
  *
  * @param la Pointer to the libalias instance
  */
 void SctpShowAliasStats(struct libalias *la);
 
 #ifdef _KERNEL
 
 static MALLOC_DEFINE(M_SCTPNAT, "sctpnat", "sctp nat dbs");
 /* Use kernel allocator. */
 #ifdef _SYS_MALLOC_H_
 #define	sn_malloc(x)	malloc(x, M_SCTPNAT, M_NOWAIT|M_ZERO)
 #define	sn_calloc(n,x)	mallocarray((n), (x), M_SCTPNAT, M_NOWAIT|M_ZERO)
 #define	sn_free(x)	free(x, M_SCTPNAT)
 #endif// #ifdef _SYS_MALLOC_H_
 
 #else //#ifdef	_KERNEL
 #define	sn_malloc(x)	malloc(x)
 #define	sn_calloc(n, x)	calloc(n, x)
 #define	sn_free(x)	free(x)
 
 #endif //#ifdef	_KERNEL
 
 /** @defgroup packet_parser SCTP Packet Parsing
  *
  * Macros to:
  * - Return pointers to the first and next SCTP chunks within an SCTP Packet
  * - Define possible return values of the packet parsing process
  * - SCTP message types for storing in the sctp_nat_msg structure @{
  */
 
 /*
  * The three pointer-walking macros below are fully parenthesised (both the
  * arguments and the whole expansion) so that they can be used safely inside
  * larger expressions, e.g. SN_SCTP_NEXTCHUNK(c)->chunk_type.
  */
 #define SN_SCTP_FIRSTCHUNK(sctphead)	((struct sctp_chunkhdr *)(((char *)(sctphead)) + sizeof(struct sctphdr)))
 /**< Returns a pointer to the first chunk in an SCTP packet given a pointer to the SCTP header */
 
 #define SN_SCTP_NEXTCHUNK(chunkhead)	((struct sctp_chunkhdr *)(((char *)(chunkhead)) + SCTP_SIZE32(ntohs((chunkhead)->chunk_length))))
 /**< Returns a pointer to the next chunk in an SCTP packet given a pointer to the current chunk */
 
 #define SN_SCTP_NEXTPARAM(param)	((struct sctp_paramhdr *)(((char *)(param)) + SCTP_SIZE32(ntohs((param)->param_length))))
 /**< Returns a pointer to the next parameter in an SCTP packet given a pointer to the current parameter */
 
 #define SN_MIN_CHUNK_SIZE        4    /**< Smallest possible SCTP chunk size in bytes */
 #define SN_MIN_PARAM_SIZE        4    /**< Smallest possible SCTP param size in bytes */
 #define SN_VTAG_PARAM_SIZE      12    /**< Size of  SCTP ASCONF vtag param in bytes */
 #define SN_ASCONFACK_PARAM_SIZE  8    /**< Size of  SCTP ASCONF ACK param in bytes */
 
 /* Packet parsing return codes */
 #define SN_PARSE_OK                  0    /**< Packet parsed for SCTP messages */
 #define SN_PARSE_ERROR_IPSHL         1    /**< Packet parsing error - IP and SCTP common header len */
 #define SN_PARSE_ERROR_AS_MALLOC     2    /**< Packet parsing error - assoc malloc */
 #define SN_PARSE_ERROR_CHHL          3    /**< Packet parsing error - Chunk header len */
 #define SN_PARSE_ERROR_DIR           4    /**< Packet parsing error - Direction */
 #define SN_PARSE_ERROR_VTAG          5    /**< Packet parsing error - Vtag */
 #define SN_PARSE_ERROR_CHUNK         6    /**< Packet parsing error - Chunk */
 #define SN_PARSE_ERROR_PORT          7    /**< Packet parsing error - Port=0 */
 #define SN_PARSE_ERROR_LOOKUP        8    /**< Packet parsing error - Lookup */
 #define SN_PARSE_ERROR_PARTIALLOOKUP 9    /**< Packet parsing error - partial lookup only found */
 #define SN_PARSE_ERROR_LOOKUP_ABORT  10   /**< Packet parsing error - Lookup - but abort packet */
 
 /* Alias_sctp performs its processing based on a number of key messages */
 #define SN_SCTP_ABORT       0x0000    /**< a packet containing an ABORT chunk */
 #define SN_SCTP_INIT        0x0001    /**< a packet containing an INIT chunk */
 #define SN_SCTP_INITACK     0x0002    /**< a packet containing an INIT-ACK chunk */
 #define SN_SCTP_SHUTCOMP    0x0010    /**< a packet containing a SHUTDOWN-COMPLETE chunk */
 #define SN_SCTP_SHUTACK     0x0020    /**< a packet containing a SHUTDOWN-ACK chunk */
 #define SN_SCTP_ASCONF      0x0100    /**< a packet containing an ASCONF chunk */
 #define SN_SCTP_ASCONFACK   0x0200    /**< a packet containing an ASCONF-ACK chunk */
 #define SN_SCTP_OTHER       0xFFFF    /**< a packet containing a chunk that is not of interest */
 /** @}
  * @defgroup state_machine SCTP NAT State Machine
  *
  * Defines the various states an association can be within the NAT @{
  */
 #define SN_ID  0x0000		/**< Idle state */
 #define SN_INi 0x0010		/**< Initialising, waiting for InitAck state */
 #define SN_INa 0x0020		/**< Initialising, waiting for AddIpAck state */
 #define SN_UP  0x0100		/**< Association in UP state */
 #define SN_CL  0x1000		/**< Closing state */
 #define SN_RM  0x2000		/**< Removing state */
 /** @}
  * @defgroup Logging Logging Functionality
  *
  * Define various log levels and a macro to call specified log functions only if
  * the current log level (sysctl_log_level) matches the specified level @{
  */
 #define	SN_LOG_LOW	  0
 #define SN_LOG_EVENT      1
 #define	SN_LOG_INFO	  2
 #define	SN_LOG_DETAIL	  3
 #define	SN_LOG_DEBUG	  4
 #define	SN_LOG_DEBUG_MAX  5
 
 /*
  * NOTE(review): SN_LOG expands to a bare `if (...) { ... }` statement, not a
  * `do { } while (0)` block.  Do not use it as the unbraced body of an
  * if/else: the `;` written after the macro call terminates the outer `if`,
  * and any following `else` will not parse as intended.
  */
 #define	SN_LOG(level, action)	if (sysctl_log_level >= level) { action; } /**< Perform log action ONLY if the current log level meets the specified log level */
 /** @}
  * @defgroup Hash Hash Table Macros and Functions
  *
  * Defines minimum/maximum/default values for the hash table size @{
  */
 #define SN_MIN_HASH_SIZE        101   /**< Minimum hash table size (set to stop users choosing stupid values) */
 #define SN_MAX_HASH_SIZE    1000001   /**< Maximum hash table size (NB must be less than max int) */
 #define SN_DEFAULT_HASH_SIZE   2003   /**< A reasonable default size for the hash tables */
 
 #define SN_LOCAL_TBL           0x01   /**< assoc in local table */
 #define SN_GLOBAL_TBL          0x02   /**< assoc in global table */
 #define SN_BOTH_TBL            0x03   /**< assoc in both tables */
 #define SN_WAIT_TOLOCAL        0x10   /**< assoc waiting for TOLOCAL asconf ACK*/
 #define SN_WAIT_TOGLOBAL       0x20   /**< assoc waiting for TOGLOBAL asconf ACK*/
 #define SN_NULL_TBL            0x00   /**< assoc in No table */
 #define SN_MAX_GLOBAL_ADDRESSES 100   /**< absolute maximum global address count*/
 
 #define SN_ADD_OK                 0   /**< Association added to the table */
 #define SN_ADD_CLASH              1   /**< Clash when trying to add the assoc. info to the table */
 
 #define SN_TABLE_HASH(vtag, port, size) (((u_int) vtag + (u_int) port) % (u_int) size) /**< Calculate the hash table lookup position */
 /** @}
  * @defgroup Timer Timer Queue Macros and Functions
  *
  * Timer macros set minimum/maximum timeout values and calculate timer expiry
  * times for the provided libalias instance @{
  */
 #define SN_MIN_TIMER 1      /**< Smallest timer value (s) accepted by sysctl_chg_timer (holddown timer excepted) */
 #define SN_MAX_TIMER 600    /**< Largest timer value (s) accepted by sysctl_chg_timer */
 /* Parenthesised so the macro is safe inside larger expressions (e.g. `x % SN_TIMER_QUEUE_SIZE`) */
 #define SN_TIMER_QUEUE_SIZE (SN_MAX_TIMER + 2) /**< Number of slots in the circular timer queue */
 
 #define SN_I_T(la) (LibAliasTime + sysctl_init_timer)       /**< INIT State expiration time in seconds */
 #define SN_U_T(la) (LibAliasTime + sysctl_up_timer)         /**< UP State expiration time in seconds */
 #define SN_C_T(la) (LibAliasTime + sysctl_shutdown_timer)   /**< CL State expiration time in seconds */
 #define SN_X_T(la) (LibAliasTime + sysctl_holddown_timer)   /**< Wait after a shutdown complete in seconds */
 /** @}
  * @defgroup sysctl SysCtl Variable and callback function declarations
  *
  * Sysctl variables to modify NAT functionality in real-time along with associated functions
  * to manage modifications to the sysctl variables @{
  */
 
 /* Callbacks */
 int sysctl_chg_loglevel(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_timer(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_hashtable_size(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_error_on_ootb(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_accept_global_ootb_addip(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_initialising_chunk_proc_limit(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_chunk_proc_limit(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_param_proc_limit(SYSCTL_HANDLER_ARGS);
 int sysctl_chg_track_global_addresses(SYSCTL_HANDLER_ARGS);
 
 /* Sysctl variables */
 /** @brief net.inet.ip.alias.sctp.log_level */
 static u_int sysctl_log_level = 0; /**< Stores the current level of logging */
 /** @brief net.inet.ip.alias.sctp.init_timer */
 static u_int sysctl_init_timer = 15; /**< Seconds to hold an association in the table waiting for an INIT-ACK or AddIP-ACK */
 /** @brief net.inet.ip.alias.sctp.up_timer */
 static u_int sysctl_up_timer = 300; /**< Seconds to hold an association in the table while no packets are transmitted */
 /** @brief net.inet.ip.alias.sctp.shutdown_timer */
 static u_int sysctl_shutdown_timer = 15; /**< Seconds to hold an association in the table waiting for a SHUTDOWN-COMPLETE */
 /** @brief net.inet.ip.alias.sctp.holddown_timer */
 static u_int sysctl_holddown_timer = 0; /**< Seconds to hold an association in the table after it has been shutdown (to allow for lost SHUTDOWN-COMPLETEs) */
 /** @brief net.inet.ip.alias.sctp.hashtable_size */
 static u_int sysctl_hashtable_size = SN_DEFAULT_HASH_SIZE; /**< Sets the hash table size for any NEW NAT instances (existing instances retain their existing Hash Table) */
 /** @brief net.inet.ip.alias.sctp.error_on_ootb */
 static u_int sysctl_error_on_ootb = 1; /**< NAT response  to receipt of OOTB packet
 					  (0 - No response, 1 - NAT will send ErrorM only to local side,
 					  2 -  NAT will send local ErrorM and global ErrorM if there was a partial association match
 					  3 - NAT will send ErrorM to both local and global) */
 /** @brief net.inet.ip.alias.sctp.accept_global_ootb_addip */
 static u_int sysctl_accept_global_ootb_addip = 0; /**< NAT response to receipt of global OOTB AddIP (0 - No response, 1 - NAT will accept OOTB global AddIP messages for processing (Security risk)) */
 /** @brief net.inet.ip.alias.sctp.initialising_chunk_proc_limit */
 static u_int sysctl_initialising_chunk_proc_limit = 2; /**< A limit on the number of chunks that should be searched if there is no matching association (DoS prevention) */
 /** @brief net.inet.ip.alias.sctp.chunk_proc_limit */
 static u_int sysctl_chunk_proc_limit = 5; /**< A limit on the number of chunks that should be searched (DoS prevention) */
 /** @brief net.inet.ip.alias.sctp.param_proc_limit */
 static u_int sysctl_param_proc_limit = 25; /**< A limit on the number of parameters (in chunks) that should be searched (DoS prevention) */
 /** @brief net.inet.ip.alias.sctp.track_global_addresses */
 static u_int sysctl_track_global_addresses = 0; /**< Configures the global address tracking option within the NAT (0 - Global tracking is disabled, > 0 - enables tracking but limits the number of global IP addresses to this value)
 						   If set to >=1 the NAT will track that many global IP addresses. This may reduce look up table conflicts, but increases processing */
 
 #define SN_NO_ERROR_ON_OOTB              0 /**< Send no errorM on out of the blue packets */
 #define SN_LOCAL_ERROR_ON_OOTB           1 /**< Send only local errorM on out of the blue packets */
 #define SN_LOCALandPARTIAL_ERROR_ON_OOTB 2 /**< Send local errorM and global errorM for out of the blue packets only if partial match found */
 #define SN_ERROR_ON_OOTB                 3 /**< Send errorM on out of the blue packets */
 
 #ifdef SYSCTL_NODE
 
 SYSCTL_DECL(_net_inet);
 SYSCTL_DECL(_net_inet_ip);
 SYSCTL_DECL(_net_inet_ip_alias);
 
 static SYSCTL_NODE(_net_inet_ip_alias, OID_AUTO, sctp,
     CTLFLAG_RW | CTLFLAG_MPSAFE, NULL,
     "SCTP NAT");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, log_level,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_log_level, 0, sysctl_chg_loglevel, "IU",
     "Level of detail (0 - default, 1 - event, 2 - info, 3 - detail, 4 - debug, 5 - max debug)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, init_timer,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_init_timer, 0, sysctl_chg_timer, "IU",
     "Timeout value (s) while waiting for (INIT-ACK|AddIP-ACK)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, up_timer,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_up_timer, 0, sysctl_chg_timer, "IU",
     "Timeout value (s) to keep an association up with no traffic");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, shutdown_timer,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_shutdown_timer, 0, sysctl_chg_timer, "IU",
     "Timeout value (s) while waiting for SHUTDOWN-COMPLETE");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, holddown_timer,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_holddown_timer, 0, sysctl_chg_timer, "IU",
     "Hold association in table for this many seconds after receiving a SHUTDOWN-COMPLETE");
 /*
  * The accepted range quoted in the description matches the clamping done by
  * sysctl_chg_hashtable_size(): SN_MIN_HASH_SIZE (101) .. SN_MAX_HASH_SIZE
  * (1000001), both inclusive.
  */
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, hashtable_size,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_hashtable_size, 0, sysctl_chg_hashtable_size, "IU",
     "Size of hash tables used for NAT lookups (101 <= prime_number <= 1000001)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, error_on_ootb,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_error_on_ootb, 0, sysctl_chg_error_on_ootb, "IU",
     "ErrorM sent on receipt of ootb packet:\n\t0 - none,\n"
     "\t1 - to local only,\n"
     "\t2 - to local and global if a partial association match,\n"
     "\t3 - to local and global (DoS risk)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, accept_global_ootb_addip,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_accept_global_ootb_addip, 0, sysctl_chg_accept_global_ootb_addip, "IU",
     "NAT response to receipt of global OOTB AddIP:\n"
     "\t0 - No response,\n"
     "\t1 - NAT will accept OOTB global AddIP messages for processing (Security risk)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, initialising_chunk_proc_limit,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_initialising_chunk_proc_limit, 0,
     sysctl_chg_initialising_chunk_proc_limit, "IU",
     "Number of chunks that should be processed if there is no current "
     "association found:\n\t > 0 (A high value is a DoS risk)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, chunk_proc_limit,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_chunk_proc_limit, 0, sysctl_chg_chunk_proc_limit, "IU",
     "Number of chunks that should be processed to find key chunk:\n"
     "\t>= initialising_chunk_proc_limit (A high value is a DoS risk)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, param_proc_limit,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_param_proc_limit, 0, sysctl_chg_param_proc_limit, "IU",
     "Number of parameters (in a chunk) that should be processed to find key "
     "parameters:\n\t> 1 (A high value is a DoS risk)");
 SYSCTL_PROC(_net_inet_ip_alias_sctp, OID_AUTO, track_global_addresses,
     CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_NEEDGIANT,
     &sysctl_track_global_addresses, 0, sysctl_chg_track_global_addresses, "IU",
     "Configures the global address tracking option within the NAT:\n"
     "\t0 - Global tracking is disabled,\n"
     "\t> 0 - enables tracking but limits the number of global IP addresses to this value");
 
 #endif /* SYSCTL_NODE */
 /** @}
  * @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.log_level
  *
  * Updates the variable sysctl_log_level to the provided value and ensures
  * it is in the valid range (SN_LOG_LOW -> SN_LOG_DEBUG_MAX)
  */
 int sysctl_chg_loglevel(SYSCTL_HANDLER_ARGS)
 {
 	/* Work on a copy seeded with the value currently behind arg1. */
 	u_int new_level = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &new_level, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* Clamp into [SN_LOG_LOW, SN_LOG_DEBUG_MAX] before publishing. */
 	if (new_level > SN_LOG_DEBUG_MAX)
 		new_level = SN_LOG_DEBUG_MAX;
 	if (new_level < SN_LOG_LOW)
 		new_level = SN_LOG_LOW;
 
 	sysctl_log_level = new_level;
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.(init_timer|up_timer|shutdown_timer|holddown_timer)
  *
  * Updates the timer-based sysctl variables. The new values are sanity-checked
  * to make sure that they are within the range SN_MIN_TIMER-SN_MAX_TIMER. The
  * holddown timer is allowed to be 0
  */
 int sysctl_chg_timer(SYSCTL_HANDLER_ARGS)
 {
 	u_int timer = *(u_int *)arg1;
 	int error;
 
 	error = sysctl_handle_int(oidp, &timer, 0, req);
 	if (error)
 		return (error);
 
 	timer = (timer > SN_MAX_TIMER) ? (SN_MAX_TIMER) : (timer);
 
 	if (((u_int *)arg1) != &sysctl_holddown_timer) {
 		timer = (timer < SN_MIN_TIMER) ? (SN_MIN_TIMER) : (timer);
 	}
 
 	*(u_int *)arg1 = timer;
 
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.hashtable_size
  *
  * Updates the hashtable_size sysctl variable. The new value should be a prime
  * number.  We sanity check to ensure that the size is within the range
  * SN_MIN_HASH_SIZE-SN_MAX_HASH_SIZE. We then check the provided number to see
  * if it is prime. We approximate by checking that (2,3,5,7,11) are not factors,
  * incrementing the user provided value until we find a suitable number.
  */
 int sysctl_chg_hashtable_size(SYSCTL_HANDLER_ARGS)
 {
 	u_int candidate = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &candidate, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* Clamp into [SN_MIN_HASH_SIZE, SN_MAX_HASH_SIZE]. */
 	if (candidate < SN_MIN_HASH_SIZE)
 		candidate = SN_MIN_HASH_SIZE;
 	else if (candidate > SN_MAX_HASH_SIZE)
 		candidate = SN_MAX_HASH_SIZE;
 
 	/* Force the value odd, which rules out 2 as a factor. */
 	candidate |= 0x00000001;
 
 	/*
 	 * Cheap primality approximation: step through odd numbers until none
 	 * of 3, 5, 7 or 11 divides the candidate.
 	 */
 	while ((candidate % 3) == 0 || (candidate % 5) == 0 ||
 	    (candidate % 7) == 0 || (candidate % 11) == 0)
 		candidate += 2;
 
 	sysctl_hashtable_size = candidate;
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.error_on_ootb
  *
  * Updates the error_on_ootb sysctl variable.
  * If set to 0, no ErrorM will be sent on receipt of an out of the blue packet
  * If set to 1, an ErrorM is sent only to the local side
  * If set to 2, an ErrorM is sent to the local side and global side if there is
  *                                                  a partial association match
  * If set to 3, an ErrorM is sent to both local and global sides (DoS) risk.
  */
 int sysctl_chg_error_on_ootb(SYSCTL_HANDLER_ARGS)
 {
 	u_int mode = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &mode, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* Anything above the highest defined mode is treated as that mode. */
 	if (mode > SN_ERROR_ON_OOTB)
 		mode = SN_ERROR_ON_OOTB;
 	sysctl_error_on_ootb = mode;
 
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.accept_global_ootb_addip
  *
  * If set to 1 the NAT will accept ootb global addip messages for processing (Security risk)
  * Default is 0, only responding to local ootb AddIP messages
  */
 int sysctl_chg_accept_global_ootb_addip(SYSCTL_HANDLER_ARGS)
 {
 	u_int requested = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &requested, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* Only the exact value 1 enables the option; everything else disables it. */
 	if (requested == 1)
 		sysctl_accept_global_ootb_addip = 1;
 	else
 		sysctl_accept_global_ootb_addip = 0;
 
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.initialising_chunk_proc_limit
  *
  * Updates the initialising_chunk_proc_limit sysctl variable.  Number of chunks
  * that should be processed if there is no current association found: > 0 (A
  * high value is a DoS risk)
  */
 int sysctl_chg_initialising_chunk_proc_limit(SYSCTL_HANDLER_ARGS)
 {
 	u_int limit = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &limit, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* At least one chunk must always be examined. */
 	if (limit < 1)
 		limit = 1;
 	sysctl_initialising_chunk_proc_limit = limit;
 
 	/* Keep chunk_proc_limit >= initialising_chunk_proc_limit. */
 	if (sysctl_chunk_proc_limit < sysctl_initialising_chunk_proc_limit)
 		sysctl_chunk_proc_limit = sysctl_initialising_chunk_proc_limit;
 
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.chunk_proc_limit
  *
  * Updates the chunk_proc_limit sysctl variable.
  * Number of chunks that should be processed to find key chunk:
  *  >= initialising_chunk_proc_limit (A high value is a DoS risk)
  */
 int sysctl_chg_chunk_proc_limit(SYSCTL_HANDLER_ARGS)
 {
 	u_int limit = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &limit, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* Never allow the limit to drop below initialising_chunk_proc_limit. */
 	if (limit < sysctl_initialising_chunk_proc_limit)
 		limit = sysctl_initialising_chunk_proc_limit;
 	sysctl_chunk_proc_limit = limit;
 
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.param_proc_limit
  *
  * Updates the param_proc_limit sysctl variable.
  * Number of parameters that should be processed to find key parameters:
  *  > 1 (A high value is a DoS risk)
  */
 int sysctl_chg_param_proc_limit(SYSCTL_HANDLER_ARGS)
 {
 	u_int limit = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &limit, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* Values below 2 are raised to 2. */
 	if (limit < 2)
 		limit = 2;
 	sysctl_param_proc_limit = limit;
 
 	return (0);
 }
 
 /** @ingroup sysctl
  * @brief sysctl callback for changing net.inet.ip.alias.sctp.track_global_addresses
  *
  *Configures the global address tracking option within the NAT (0 - Global
  *tracking is disabled, > 0 - enables tracking but limits the number of global
  *IP addresses to this value)
  */
 int sysctl_chg_track_global_addresses(SYSCTL_HANDLER_ARGS)
 {
 	u_int count = *(u_int *)arg1;
 	int rc = sysctl_handle_int(oidp, &count, 0, req);
 
 	if (rc != 0)
 		return (rc);
 
 	/* Cap the tracked-address count at SN_MAX_GLOBAL_ADDRESSES. */
 	if (count > SN_MAX_GLOBAL_ADDRESSES)
 		count = SN_MAX_GLOBAL_ADDRESSES;
 	sysctl_track_global_addresses = count;
 
 	return (0);
 }
 
 /* ----------------------------------------------------------------------
  *                            CODE BEGINS HERE
  * ----------------------------------------------------------------------
  */
 /**
  * @brief Initialises the SCTP NAT Implementation
  *
  * Creates the look-up tables and the timer queue and initialises all state
  * variables
  *
  * @param la Pointer to the relevant libalias instance
  */
 void
 AliasSctpInit(struct libalias *la)
 {
 	int slot;
 
 	/* The table size is taken from the sysctl value current at init time. */
 	la->sctpNatTableSize = sysctl_hashtable_size;
 	SN_LOG(SN_LOG_EVENT,
 	    SctpAliasLog("Initialising SCTP NAT Instance (hash_table_size:%d)\n", la->sctpNatTableSize));
 
 	/*
 	 * Allocate both look-up tables and the timer queue.
 	 * NOTE(review): none of the three allocation results is checked before
 	 * the LIST_INIT loops below dereference them.
 	 */
 	la->sctpTableLocal = sn_calloc(la->sctpNatTableSize, sizeof(struct sctpNatTableL));
 	la->sctpTableGlobal = sn_calloc(la->sctpNatTableSize, sizeof(struct sctpNatTableG));
 	la->sctpNatTimer.TimerQ = sn_calloc(SN_TIMER_QUEUE_SIZE, sizeof(struct sctpTimerQ));
 
 	/* Every bucket of both hash tables starts out as an empty list. */
 	slot = 0;
 	while (slot < la->sctpNatTableSize) {
 		LIST_INIT(&la->sctpTableLocal[slot]);
 		LIST_INIT(&la->sctpTableGlobal[slot]);
 		slot++;
 	}
 
 	/* Likewise for every slot of the circular timer queue. */
 	slot = 0;
 	while (slot < SN_TIMER_QUEUE_SIZE) {
 		LIST_INIT(&la->sctpNatTimer.TimerQ[slot]);
 		slot++;
 	}
 
 	/* Timer bookkeeping and link counter start from a clean state. */
 #ifdef _KERNEL
 	la->sctpNatTimer.loc_time=time_uptime; /* LibAliasTime is not set yet */
 #else
 	la->sctpNatTimer.loc_time=LibAliasTime;
 #endif
 	la->sctpNatTimer.cur_loc = 0;
 	la->sctpLinkCount = 0;
 }
 
 /**
  * @brief Cleans-up the SCTP NAT Implementation prior to unloading
  *
  * Removes all entries from the timer queue, freeing associations as it goes.
  * We then free memory allocated to the look-up tables and the time queue
  *
  * NOTE: We do not need to traverse the look-up tables as each association
  *       will always have an entry in the timer queue, freeing this memory
  *       once will free all memory allocated to entries in the look-up tables
  *
  * @param la Pointer to the relevant libalias instance
  */
 void
 AliasSctpTerm(struct libalias *la)
 {
 	struct sctp_nat_assoc *cur, *following;
 	int slot;
 
 	LIBALIAS_LOCK_ASSERT(la);
 	SN_LOG(SN_LOG_EVENT,
 	    SctpAliasLog("Removing SCTP NAT Instance\n"));
 
 	/* Walk every timer-queue slot and release each association found. */
 	for (slot = 0; slot < SN_TIMER_QUEUE_SIZE; slot++) {
 		for (cur = LIST_FIRST(&la->sctpNatTimer.TimerQ[slot]);
 		    cur != NULL; cur = following) {
 			freeGlobalAddressList(cur);
 			/* Fetch the successor before the node itself is freed. */
 			following = LIST_NEXT(cur, timer_Q);
 			sn_free(cur);
 		}
 	}
 
 	/* Finally release the containers themselves. */
 	sn_free(la->sctpTableLocal);
 	sn_free(la->sctpTableGlobal);
 	sn_free(la->sctpNatTimer.TimerQ);
 }
 
 /**
  * @brief Handles SCTP packets passed from libalias
  *
  * This function needs to actually NAT/drop packets and possibly create and
  * send AbortM or ErrorM packets in response. The process involves:
  * - Validating the direction parameter passed by the caller
  * - Checking and handling any expired timers for the NAT
  * - Calling sctp_PktParser() to parse the packet
  * - Call ProcessSctpMsg() to decide the appropriate outcome and to update
  *   the NAT tables
  * - Based on the return code either:
  *   - NAT the packet
  *   - Construct and send an ErrorM|AbortM packet
  *   - Mark the association for removal from the tables
  * - Potentially remove the association from all lookup tables
  * - Return the appropriate result to libalias
  *
  * @param la Pointer to the relevant libalias instance
  * @param pip Pointer to IP packet to process
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  *
  * @return  PKT_ALIAS_OK | PKT_ALIAS_RESPOND | PKT_ALIAS_ERROR
  */
 int
 SctpAlias(struct libalias *la, struct ip *pip, int direction)
 {
 	int rtnval;
 	struct sctp_nat_msg msg;
 	struct sctp_nat_assoc *assoc = NULL;
 
 	if ((direction != SN_TO_LOCAL) && (direction != SN_TO_GLOBAL)) {
 		SctpAliasLog("ERROR: Invalid direction\n");
 		return (PKT_ALIAS_ERROR);
 	}
 
 	sctp_CheckTimers(la); /* Check timers */
 
 	/* Parse the packet (operates directly on the packet buffer) */
 	rtnval = sctp_PktParser(la, direction, pip, &msg, &assoc);
 	switch (rtnval) {
 	case SN_PARSE_OK:
 		break;
 	case SN_PARSE_ERROR_CHHL:
 		/*
 		 * Not an error, if there is a chunk length parsing error,
 		 * this is a fragmented packet, and we have a valid assoc.
 		 */
 		if ((assoc != NULL) && (ntohs(pip->ip_off) & IP_MF)) {
 			rtnval = SN_PARSE_OK;
 			break;
 		}
 		SN_LOG(SN_LOG_EVENT,
 		    logsctperror("SN_PARSE_ERROR", msg.sctp_hdr->v_tag, rtnval, direction));
 		return (PKT_ALIAS_ERROR);
 	case SN_PARSE_ERROR_PARTIALLOOKUP:
 		if (sysctl_error_on_ootb > SN_LOCALandPARTIAL_ERROR_ON_OOTB) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("SN_PARSE_ERROR", msg.sctp_hdr->v_tag, rtnval, direction));
 			return (PKT_ALIAS_ERROR);
 		}
 		/* FALLTHROUGH - treat like a plain lookup failure */
 	case SN_PARSE_ERROR_LOOKUP:
 		if (sysctl_error_on_ootb == SN_ERROR_ON_OOTB ||
 		    (sysctl_error_on_ootb == SN_LOCALandPARTIAL_ERROR_ON_OOTB && direction == SN_TO_LOCAL) ||
 		    (sysctl_error_on_ootb == SN_LOCAL_ERROR_ON_OOTB && direction == SN_TO_GLOBAL)) {
 			/* SN_REFLECT_ERROR does not read assoc, which is usually NULL here */
 			TxAbortErrorM(la, &msg, assoc, SN_REFLECT_ERROR, direction);
 			return (PKT_ALIAS_RESPOND);
 		}
 		/* FALLTHROUGH - not configured to respond, just report the error */
 	default:
 		/*
 		 * The parser leaves msg.sctp_hdr NULL when the packet is too
 		 * short to hold an SCTP header (SN_PARSE_ERROR_IPSHL), so the
 		 * vtag must not be read unconditionally when logging.
 		 */
 		SN_LOG(SN_LOG_EVENT,
 		    logsctperror("SN_PARSE_ERROR",
 			(msg.sctp_hdr != NULL) ? msg.sctp_hdr->v_tag : 0,
 			rtnval, direction));
 		return (PKT_ALIAS_ERROR);
 	}
 
 	SN_LOG(SN_LOG_DETAIL,
 	    logsctpassoc(assoc, "*");
 	    logsctpparse(direction, &msg);
 	);
 
 	/* Process the SCTP message */
 	rtnval = ProcessSctpMsg(la, direction, &msg, assoc);
 
 	SN_LOG(SN_LOG_DEBUG_MAX,
 	    logsctpassoc(assoc, "-");
 	    logSctpLocal(la);
 	    logSctpGlobal(la);
 	);
 	SN_LOG(SN_LOG_DEBUG, logTimerQ(la));
 
 	switch (rtnval) {
 	case SN_NAT_PKT:
 		/* Rewrite the address and patch the IP checksum incrementally */
 		switch (direction) {
 		case SN_TO_LOCAL:
 			DifferentialChecksum(&(msg.ip_hdr->ip_sum),
 			    &(assoc->l_addr), &(msg.ip_hdr->ip_dst), 2);
 			msg.ip_hdr->ip_dst = assoc->l_addr; /* change dst address to local address*/
 			break;
 		case SN_TO_GLOBAL:
 			DifferentialChecksum(&(msg.ip_hdr->ip_sum),
 			    &(assoc->a_addr),  &(msg.ip_hdr->ip_src), 2);
 			msg.ip_hdr->ip_src = assoc->a_addr; /* change src to alias addr*/
 			break;
 		default:
 			rtnval = SN_DROP_PKT; /* shouldn't get here, but if it does drop packet */
 			SN_LOG(SN_LOG_LOW, logsctperror("ERROR: Invalid direction", msg.sctp_hdr->v_tag, rtnval, direction));
 			break;
 		}
 		break;
 	case SN_DROP_PKT:
 		SN_LOG(SN_LOG_DETAIL, logsctperror("SN_DROP_PKT", msg.sctp_hdr->v_tag, rtnval, direction));
 		break;
 	case SN_REPLY_ABORT:
 	case SN_REPLY_ERROR:
 	case SN_SEND_ABORT:
 		/* Overwrite the packet in place with the AbortM/ErrorM */
 		TxAbortErrorM(la, &msg, assoc, rtnval, direction);
 		break;
 	default:
 		/* big error, remove association and go to idle and write log messages */
 		SN_LOG(SN_LOG_LOW, logsctperror("SN_PROCESSING_ERROR", msg.sctp_hdr->v_tag, rtnval, direction));
 		assoc->state = SN_RM;/* Mark for removal*/
 		break;
 	}
 
 	/* Remove association if tagged for removal */
 	if (assoc->state == SN_RM) {
 		if (assoc->TableRegister) {
 			sctp_RmTimeOut(la, assoc);
 			RmSctpAssoc(la, assoc);
 		}
 		LIBALIAS_LOCK_ASSERT(la);
 		freeGlobalAddressList(assoc);
 		sn_free(assoc);
 	}
 
 	/* assoc may have been freed above; only rtnval is used from here on */
 	switch (rtnval) {
 	case SN_NAT_PKT:
 		return (PKT_ALIAS_OK);
 	case SN_SEND_ABORT:
 		return (PKT_ALIAS_OK);
 	case SN_REPLY_ABORT:
 	case SN_REPLY_ERROR:
 	case SN_REFLECT_ERROR:
 		return (PKT_ALIAS_RESPOND);
 	case SN_DROP_PKT:
 	default:
 		return (PKT_ALIAS_ERROR);
 	}
 }
 
 /**
  * @brief Send an AbortM or ErrorM
  *
  * We construct the new SCTP packet to send in place of the existing packet we
  * have been asked to NAT. This function can only be called if the original
  * packet was successfully parsed as a valid SCTP packet.
  *
  * An AbortM (without cause) packet is the smallest SCTP packet available and as
  * such there is always space in the existing packet buffer to fit the AbortM
  * packet. An ErrorM packet is 4 bytes longer than an AbortM (the error cause is
  * not optional). An ErrorM is sent in response to an AddIP when the Vtag/address
  * combination, if added, will produce a conflict in the association look up
  * tables. It may also be used for an unexpected packet - a packet with no
  * matching association in the NAT table and we are requesting an AddIP so we
  * can add it.  The smallest valid SCTP packet while the association is in an
  * up-state is a Heartbeat packet, which is big enough to be transformed to an
  * ErrorM.
  *
  * We create a temporary character array to store the packet as we are constructing
  * it. We then populate the array with appropriate values based on:
  * - Packet type (AbortM | ErrorM)
  * - Initial packet direction (SN_TO_LOCAL | SN_TO_GLOBAL)
  * - NAT response (Send packet | Reply packet)
  *
  * Once complete, we copy the contents of the temporary packet over the original
  * SCTP packet we were asked to NAT
  *
  * @param la Pointer to the relevant libalias instance
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to current association details
  * @param sndrply SN_SEND_ABORT | SN_REPLY_ABORT | SN_REPLY_ERROR
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  */
 static uint32_t
 local_sctp_finalize_crc32(uint32_t crc32c)
 {
 	/*
 	 * Finalise a running CRC32c value for placement in the SCTP header:
 	 * the value is complemented and, on big-endian hosts, byte-swapped.
 	 *
 	 * This routine is duplicated from SCTP
 	 * we need to do that since it MAY be that SCTP
 	 * is NOT compiled into the kernel. The CRC32C routines
 	 * however are always available in libkern.
 	 */
 	uint32_t result;
 
 	/* Complement the result */
 	result = ~crc32c;
 #if BYTE_ORDER == BIG_ENDIAN
 	/*
 	 * For BIG-ENDIAN.. aka Motorola byte order the result is in
 	 * little-endian form. So we must manually swap the bytes. Then we
 	 * can call htonl() which does nothing...
 	 *
 	 * The swap is done entirely in uint32_t: shifting a uint8_t (which
 	 * promotes to signed int) left by 24 is undefined when its top bit
 	 * is set.
 	 */
 	result = ((result & 0x000000ffU) << 24) |
 	    ((result & 0x0000ff00U) << 8) |
 	    ((result & 0x00ff0000U) >> 8) |
 	    ((result & 0xff000000U) >> 24);
 #endif
 	/*
 	 * For INTEL platforms the result comes out in network order. No
 	 * htonl is required or the swap above.
 	 */
 	return (result);
 }
 
 /*
  * Build an AbortM or ErrorM in a temporary buffer and copy it over the
  * packet referenced by sm->ip_hdr.
  *
  * la        libalias instance (not read by this function)
  * sm        parsed message; sm->ip_hdr and sm->sctp_hdr must be valid, and
  *           sm->sctpchnk.Init must be valid for SN_REPLY_ABORT
  * assoc     association; read for SN_REPLY_ERROR and SN_SEND_ABORT only
  * sndrply   SN_SEND_ABORT | SN_REPLY_ABORT | SN_REPLY_ERROR | SN_REFLECT_ERROR
  * direction SN_TO_LOCAL | SN_TO_GLOBAL (direction of the original packet)
  */
 static void
 TxAbortErrorM(struct libalias *la, struct sctp_nat_msg *sm, struct sctp_nat_assoc *assoc, int sndrply, int direction)
 {
 	int sctp_size = sizeof(struct sctphdr) + sizeof(struct sctp_chunkhdr) + sizeof(struct sctp_error_cause);
 	int ip_size = sizeof(struct ip) + sctp_size;
 	int include_error_cause = 1;
 	char tmp_ip[ip_size]; /* sized for the largest variant (with error cause) */
 	char addrbuf[INET_ADDRSTRLEN];
 
 	if (ntohs(sm->ip_hdr->ip_len) < ip_size) { /* short packet, cannot send error cause */
 		include_error_cause = 0;
 		ip_size = ip_size -  sizeof(struct sctp_error_cause);
 		sctp_size = sctp_size -  sizeof(struct sctp_error_cause);
 	}
 	/* Assign header pointers packet */
 	struct ip* ip = (struct ip *) tmp_ip;
 	struct sctphdr* sctp_hdr = (struct sctphdr *) ((char *) ip + sizeof(*ip));
 	struct sctp_chunkhdr* chunk_hdr = (struct sctp_chunkhdr *) ((char *) sctp_hdr + sizeof(*sctp_hdr));
 	struct sctp_error_cause* error_cause = (struct sctp_error_cause *) ((char *) chunk_hdr + sizeof(*chunk_hdr));
 
 	/* construct ip header */
 	ip->ip_v = sm->ip_hdr->ip_v;
 	ip->ip_hl = 5; /* 5*32 bit words */
 	ip->ip_tos = 0;
 	ip->ip_len = htons(ip_size);
 	ip->ip_id = sm->ip_hdr->ip_id;
 	ip->ip_off = 0;
 	ip->ip_ttl = 255;
 	ip->ip_p = IPPROTO_SCTP;
 	/*
 	  The definitions below should be removed when they make it into the SCTP stack
 	*/
 #define SCTP_MIDDLEBOX_FLAG 0x02
 #define SCTP_NAT_TABLE_COLLISION 0x00b0
 #define SCTP_MISSING_NAT 0x00b1
 	chunk_hdr->chunk_type = (sndrply & SN_TX_ABORT) ? SCTP_ABORT_ASSOCIATION : SCTP_OPERATION_ERROR;
 	chunk_hdr->chunk_flags = SCTP_MIDDLEBOX_FLAG;
 	if (include_error_cause) {
 		error_cause->code = htons((sndrply & SN_REFLECT_ERROR) ? SCTP_MISSING_NAT : SCTP_NAT_TABLE_COLLISION);
 		error_cause->length = htons(sizeof(struct sctp_error_cause));
 		chunk_hdr->chunk_length = htons(sizeof(*chunk_hdr) + sizeof(struct sctp_error_cause));
 	} else {
 		chunk_hdr->chunk_length = htons(sizeof(*chunk_hdr));
 	}
 
 	/* set specific values */
 	switch (sndrply) {
 	case SN_REFLECT_ERROR:
 		chunk_hdr->chunk_flags |= SCTP_HAD_NO_TCB; /* set Tbit */
 		sctp_hdr->v_tag = sm->sctp_hdr->v_tag;
 		break;
 	case SN_REPLY_ERROR:
 		sctp_hdr->v_tag = (direction == SN_TO_LOCAL) ? assoc->g_vtag : assoc->l_vtag ;
 		break;
 	case SN_SEND_ABORT:
 		sctp_hdr->v_tag = sm->sctp_hdr->v_tag;
 		break;
 	case SN_REPLY_ABORT:
 		sctp_hdr->v_tag = sm->sctpchnk.Init->initiate_tag;
 		break;
 	}
 
 	/* Set send/reply values */
 	if (sndrply == SN_SEND_ABORT) { /*pass through NAT */
 		ip->ip_src = (direction == SN_TO_LOCAL) ? sm->ip_hdr->ip_src : assoc->a_addr;
 		ip->ip_dst = (direction == SN_TO_LOCAL) ? assoc->l_addr : sm->ip_hdr->ip_dst;
 		sctp_hdr->src_port = sm->sctp_hdr->src_port;
 		sctp_hdr->dest_port = sm->sctp_hdr->dest_port;
 	} else { /* reply and reflect */
 		ip->ip_src = sm->ip_hdr->ip_dst;
 		ip->ip_dst = sm->ip_hdr->ip_src;
 		sctp_hdr->src_port = sm->sctp_hdr->dest_port;
 		sctp_hdr->dest_port = sm->sctp_hdr->src_port;
 	}
 
 	/*
 	 * Calculate IP header checksum. tmp_ip is an uninitialised stack
 	 * buffer, so ip_sum must be cleared first: the IPv4 header checksum
 	 * is defined over a header whose checksum field is zero.
 	 */
 	ip->ip_sum = 0;
 	ip->ip_sum = in_cksum_hdr(ip);
 
 	/* calculate SCTP header CRC32 */
 	sctp_hdr->checksum = 0;
 	sctp_hdr->checksum = local_sctp_finalize_crc32(calculate_crc32c(0xffffffff, (unsigned char *) sctp_hdr, sctp_size));
 
 	/* Replace the original packet with the freshly built one */
 	memcpy(sm->ip_hdr, ip, ip_size);
 
 	SN_LOG(SN_LOG_EVENT,SctpAliasLog("%s %s 0x%x (->%s:%u vtag=0x%x crc=0x%x)\n",
 	    ((sndrply == SN_SEND_ABORT) ? "Sending" : "Replying"),
 	    ((sndrply & SN_TX_ERROR) ? "ErrorM" : "AbortM"),
 	    (include_error_cause ? ntohs(error_cause->code) : 0),
 	    inet_ntoa_r(ip->ip_dst, INET_NTOA_BUF(addrbuf)),
 	    ntohs(sctp_hdr->dest_port),
 	    ntohl(sctp_hdr->v_tag), ntohl(sctp_hdr->checksum)));
 }
 
 /* ----------------------------------------------------------------------
  *                           PACKET PARSER CODE
  * ----------------------------------------------------------------------
  */
 /** @addtogroup packet_parser
  *
  * These functions parse the SCTP packet and fill a sctp_nat_msg structure
  * with the parsed contents.
  */
 /** @ingroup packet_parser
  * @brief Parses SCTP packets for the key SCTP chunk that will be processed
  *
  * This module parses SCTP packets for the key SCTP chunk that will be processed
  * The module completes the sctp_nat_msg structure and either retrieves the
  * relevant (existing) stored association from the Hash Tables or creates a new
  * association entity with state SN_ID
  *
  * On return sm->sctp_hdr is either NULL (packet too short for an SCTP header,
  * SN_PARSE_ERROR_IPSHL) or points at the SCTP common header. SN_PARSE_OK is
  * only returned with *passoc set to a non-NULL association.
  *
  * The packet is accessed as one contiguous buffer starting at pip; the
  * original authors planned (but did not write) an mbuf based variant.
  *
  * @param la Pointer to the relevant libalias instance
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  * @param pip Pointer to the IP packet to parse
  * @param sm Pointer to sctp message information
  * @param passoc Pointer to the association this SCTP Message belongs to
  *
  * @return SN_PARSE_OK | SN_PARSE_ERROR_*
  */
 static int
 sctp_PktParser(struct libalias *la, int direction, struct ip *pip,
     struct sctp_nat_msg *sm, struct sctp_nat_assoc **passoc)
 {
 	struct sctphdr *sctp_hdr;
 	struct sctp_chunkhdr *chunk_hdr;
 	struct sctp_paramhdr *param_hdr;
 	struct in_addr ipv4addr;
 	int bytes_left; /* bytes left in ip packet */
 	int chunk_length;
 	int chunk_count;
 	int partial_match = 0;
 
 	/*
 	 * Note, that if the VTag is zero, it must be an INIT
 	 * Also, I am only interested in the content of INIT and ADDIP chunks
 	 */
 
 	sm->msg = SN_SCTP_OTHER;/* Initialise to largest value*/
 	sm->chunk_length = 0; /* only care about length for key chunks */
 	sm->ip_hdr = pip;
 	/* remove ip header length from the bytes_left */
 	bytes_left = ntohs(pip->ip_len) - (pip->ip_hl << 2);
 
 	/*
 	 * Check SCTP header length and move to first chunk.
 	 * The comparison is done in signed arithmetic: bytes_left is negative
 	 * when ip_len is smaller than the IP header length, and comparing it
 	 * against an unsigned sizeof would let such a packet through.
 	 */
 	if (bytes_left < (int)sizeof(struct sctphdr)) {
 		sm->sctp_hdr = NULL;
 		return (SN_PARSE_ERROR_IPSHL); /* packet not long enough*/
 	}
 
 	sm->sctp_hdr = sctp_hdr = (struct sctphdr *) ip_next(pip);
 	bytes_left -= sizeof(struct sctphdr);
 
 	/* Check for valid ports (zero valued ports would find partially initialised associations */
 	if (sctp_hdr->src_port == 0 || sctp_hdr->dest_port == 0)
 		return (SN_PARSE_ERROR_PORT);
 
 	/* Check length of first chunk */
 	if (bytes_left < SN_MIN_CHUNK_SIZE) /* malformed chunk - could cause endless loop*/
 		return (SN_PARSE_ERROR_CHHL); /* packet not long enough for this chunk */
 
 	/* First chunk */
 	chunk_hdr = SN_SCTP_FIRSTCHUNK(sctp_hdr);
 
 	chunk_length = SCTP_SIZE32(ntohs(chunk_hdr->chunk_length));
 	if ((chunk_length < SN_MIN_CHUNK_SIZE) || (chunk_length > bytes_left)) /* malformed chunk - could cause endless loop*/
 		return (SN_PARSE_ERROR_CHHL);
 
 	/* Look up the association; the T-bit selects the reflected-vtag lookups */
 	if ((chunk_hdr->chunk_flags & SCTP_HAD_NO_TCB) &&
 	    ((chunk_hdr->chunk_type == SCTP_ABORT_ASSOCIATION) ||
 		(chunk_hdr->chunk_type == SCTP_SHUTDOWN_COMPLETE))) {
 		/* T-Bit set */
 		if (direction == SN_TO_LOCAL)
 			*passoc = FindSctpGlobalT(la,  pip->ip_src, sctp_hdr->v_tag, sctp_hdr->dest_port, sctp_hdr->src_port);
 		else
 			*passoc = FindSctpLocalT(la, pip->ip_dst, sctp_hdr->v_tag, sctp_hdr->dest_port, sctp_hdr->src_port);
 	} else {
 		/* Proper v_tag settings */
 		if (direction == SN_TO_LOCAL)
 			*passoc = FindSctpGlobal(la, pip->ip_src, sctp_hdr->v_tag, sctp_hdr->src_port, sctp_hdr->dest_port, &partial_match);
 		else
 			*passoc = FindSctpLocal(la, pip->ip_src,  pip->ip_dst, sctp_hdr->v_tag, sctp_hdr->src_port, sctp_hdr->dest_port);
 	}
 
 	chunk_count = 1;
 	/* Real packet parsing occurs below */
 	while (IS_SCTP_CONTROL(chunk_hdr)) {
 		switch (chunk_hdr->chunk_type) {
 		case SCTP_INITIATION:
 			if (chunk_length < sizeof(struct sctp_init_chunk)) /* malformed chunk*/
 				return (SN_PARSE_ERROR_CHHL);
 			sm->msg = SN_SCTP_INIT;
 			sm->sctpchnk.Init = (struct sctp_init *) ((char *) chunk_hdr + sizeof(struct sctp_chunkhdr));
 			sm->chunk_length = chunk_length;
 			/* if no existing association, create a new one */
 			if (*passoc == NULL) {
 				if (sctp_hdr->v_tag == 0) { /* Init requires vtag=0 */
 					*passoc = (struct sctp_nat_assoc *) sn_malloc(sizeof(struct sctp_nat_assoc));
 					if (*passoc == NULL) {/* out of resources */
 						return (SN_PARSE_ERROR_AS_MALLOC);
 					}
 					/* Initialize association - sn_malloc initializes memory to zeros */
 					(*passoc)->state = SN_ID;
 					LIST_INIT(&((*passoc)->Gaddr)); /* always initialise to avoid memory problems */
 					(*passoc)->TableRegister = SN_NULL_TBL;
 					return (SN_PARSE_OK);
 				}
 				return (SN_PARSE_ERROR_VTAG);
 			}
 			return (SN_PARSE_ERROR_LOOKUP);
 		case SCTP_INITIATION_ACK:
 			if (chunk_length < sizeof(struct sctp_init_ack_chunk)) /* malformed chunk*/
 				return (SN_PARSE_ERROR_CHHL);
 			sm->msg = SN_SCTP_INITACK;
 			sm->sctpchnk.InitAck = (struct sctp_init_ack *) ((char *) chunk_hdr + sizeof(struct sctp_chunkhdr));
 			sm->chunk_length = chunk_length;
 			return ((*passoc == NULL) ? (SN_PARSE_ERROR_LOOKUP) : (SN_PARSE_OK));
 		case SCTP_ABORT_ASSOCIATION: /* access only minimum sized chunk */
 			sm->msg = SN_SCTP_ABORT;
 			sm->chunk_length = chunk_length;
 			return ((*passoc == NULL) ? (SN_PARSE_ERROR_LOOKUP_ABORT) : (SN_PARSE_OK));
 		case SCTP_SHUTDOWN_ACK:
 			if (chunk_length < sizeof(struct sctp_shutdown_ack_chunk)) /* malformed chunk*/
 				return (SN_PARSE_ERROR_CHHL);
 			if (sm->msg > SN_SCTP_SHUTACK) {
 				sm->msg = SN_SCTP_SHUTACK;
 				sm->chunk_length = chunk_length;
 			}
 			break;
 		case SCTP_SHUTDOWN_COMPLETE:  /* minimum sized chunk */
 			if (sm->msg > SN_SCTP_SHUTCOMP) {
 				sm->msg = SN_SCTP_SHUTCOMP;
 				sm->chunk_length = chunk_length;
 			}
 			return ((*passoc == NULL) ? (SN_PARSE_ERROR_LOOKUP) : (SN_PARSE_OK));
 		case SCTP_ASCONF:
 			if (sm->msg > SN_SCTP_ASCONF) {
 				if (chunk_length < (sizeof(struct  sctp_asconf_chunk) + sizeof(struct  sctp_ipv4addr_param))) /* malformed chunk*/
 					return (SN_PARSE_ERROR_CHHL);
 				/* leave parameter searching to later, if required */
 				param_hdr = (struct sctp_paramhdr *) ((char *) chunk_hdr + sizeof(struct sctp_asconf_chunk)); /*compulsory IP parameter*/
 				if (ntohs(param_hdr->param_type) == SCTP_IPV4_ADDRESS) {
 					if ((*passoc == NULL) && (direction == SN_TO_LOCAL)) { /* AddIP with no association */
 						/* try look up with the ASCONF packet's alternative address */
 						ipv4addr.s_addr = ((struct sctp_ipv4addr_param *) param_hdr)->addr;
 						*passoc = FindSctpGlobal(la, ipv4addr, sctp_hdr->v_tag, sctp_hdr->src_port, sctp_hdr->dest_port, &partial_match);
 					}
 					param_hdr = (struct sctp_paramhdr *)
 						((char *) param_hdr + sizeof(struct sctp_ipv4addr_param)); /*asconf's compulsory address parameter */
 					sm->chunk_length = chunk_length - sizeof(struct  sctp_asconf_chunk) - sizeof(struct  sctp_ipv4addr_param); /* rest of chunk */
 				} else {
 					/* anything that is not an IPv4 address is skipped as an IPv6 address parameter */
 					if (chunk_length < (sizeof(struct  sctp_asconf_chunk) + sizeof(struct  sctp_ipv6addr_param))) /* malformed chunk*/
 						return (SN_PARSE_ERROR_CHHL);
 					param_hdr = (struct sctp_paramhdr *)
 						((char *) param_hdr + sizeof(struct sctp_ipv6addr_param)); /*asconf's compulsory address parameter */
 					sm->chunk_length = chunk_length - sizeof(struct  sctp_asconf_chunk) - sizeof(struct  sctp_ipv6addr_param); /* rest of chunk */
 				}
 				sm->msg = SN_SCTP_ASCONF;
 				sm->sctpchnk.Asconf = param_hdr;
 
 				if (*passoc == NULL) { /* AddIP with no association */
 					*passoc = (struct sctp_nat_assoc *) sn_malloc(sizeof(struct sctp_nat_assoc));
 					if (*passoc == NULL) {/* out of resources */
 						return (SN_PARSE_ERROR_AS_MALLOC);
 					}
 					/* Initialize association  - sn_malloc initializes memory to zeros */
 					(*passoc)->state = SN_ID;
 					LIST_INIT(&((*passoc)->Gaddr)); /* always initialise to avoid memory problems */
 					(*passoc)->TableRegister = SN_NULL_TBL;
 					return (SN_PARSE_OK);
 				}
 			}
 			break;
 		case SCTP_ASCONF_ACK:
 			if (sm->msg > SN_SCTP_ASCONFACK) {
 				if (chunk_length < sizeof(struct  sctp_asconf_ack_chunk)) /* malformed chunk*/
 					return (SN_PARSE_ERROR_CHHL);
 				/* leave parameter searching to later, if required */
 				param_hdr = (struct sctp_paramhdr *) ((char *) chunk_hdr
 				    + sizeof(struct sctp_asconf_ack_chunk));
 				sm->msg = SN_SCTP_ASCONFACK;
 				sm->sctpchnk.Asconf = param_hdr;
 				sm->chunk_length = chunk_length - sizeof(struct sctp_asconf_ack_chunk);
 			}
 			break;
 		default:
 			break; /* do nothing*/
 		}
 
 		/* if no association is found exit - we need to find an Init or AddIP within sysctl_initialising_chunk_proc_limit */
 		if ((*passoc == NULL) && (chunk_count >= sysctl_initialising_chunk_proc_limit))
 			return (SN_PARSE_ERROR_LOOKUP);
 
 		/* finished with this chunk, on to the next chunk*/
 		bytes_left-= chunk_length;
 
 		/* Is this the end of the packet ? */
 		if (bytes_left == 0)
 			return (*passoc == NULL) ? (SN_PARSE_ERROR_LOOKUP) : (SN_PARSE_OK);
 
 		/* Are there enough bytes in packet to at least retrieve length of next chunk ? */
 		if (bytes_left < SN_MIN_CHUNK_SIZE)
 			return (SN_PARSE_ERROR_CHHL);
 
 		chunk_hdr = SN_SCTP_NEXTCHUNK(chunk_hdr);
 
 		/* Is the chunk long enough to not cause endless look and are there enough bytes in packet to read the chunk ? */
 		chunk_length = SCTP_SIZE32(ntohs(chunk_hdr->chunk_length));
 		if ((chunk_length < SN_MIN_CHUNK_SIZE) || (chunk_length > bytes_left))
 			return (SN_PARSE_ERROR_CHHL);
 		/*
 		 * Limit for processing chunks, take what we get. Leave the
 		 * loop rather than returning SN_PARSE_OK directly so that a
 		 * missing association is still reported as a lookup error;
 		 * the caller dereferences the association after SN_PARSE_OK.
 		 */
 		if (++chunk_count > sysctl_chunk_proc_limit)
 			break;
 	}
 
 	if (*passoc == NULL)
 		return (partial_match) ? (SN_PARSE_ERROR_PARTIALLOOKUP) : (SN_PARSE_ERROR_LOOKUP);
 	else
 		return (SN_PARSE_OK);
 }
 
 /** @ingroup packet_parser
  * @brief Extract Vtags from Asconf Chunk
  *
  * GetAsconfVtags scans an Asconf Chunk for the vtags parameter, and then
  * extracts the vtags.
  *
  * GetAsconfVtags is not called from within sctp_PktParser. It is called only
  * from within ID_process when an AddIP has been received.
  *
  * The vtags are copied as found in the packet (no byte order conversion).
  * *l_vtag and *g_vtag are only written when 1 is returned.
  *
  * @param la Pointer to the relevant libalias instance
  * @param sm Pointer to sctp message information
  * @param l_vtag Pointer to the local vtag in the association this SCTP Message belongs to
  * @param g_vtag Pointer to the global vtag in the association this SCTP Message belongs to
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  *
  * @return 1 - success | 0 - fail
  */
 static int
 GetAsconfVtags(struct libalias *la, struct sctp_nat_msg *sm, uint32_t *l_vtag, uint32_t *g_vtag, int direction)
 {
 	/* To be removed when information is in the sctp headers */
 #define SCTP_VTAG_PARAM 0xC007
 	struct sctp_vtag_param {
 		struct sctp_paramhdr ph;/* type=SCTP_VTAG_PARAM */
 		uint32_t local_vtag;
 		uint32_t remote_vtag;
 	} __attribute__((packed));
 
 	struct sctp_vtag_param *vtag_param;
 	struct sctp_paramhdr *param;
 	int bytes_left;
 	int param_size;
 	int param_count;
 
 	param_count = 1;
 	bytes_left = sm->chunk_length;
 	/*
 	 * Nothing can be found in less than a vtag parameter's worth of data;
 	 * bail out before the first parameter header is read so that an empty
 	 * or truncated parameter area is never dereferenced.
 	 */
 	if (bytes_left < SN_VTAG_PARAM_SIZE)
 		return (0);
 	param = sm->sctpchnk.Asconf;
 	param_size = SCTP_SIZE32(ntohs(param->param_length));
 	/* step through Asconf parameters */
 	while((bytes_left >= param_size) && (bytes_left >= SN_VTAG_PARAM_SIZE)) {
 		if (ntohs(param->param_type) == SCTP_VTAG_PARAM) {
 			vtag_param = (struct sctp_vtag_param *) param;
 			switch (direction) {
 				/* The Internet draft is a little ambiguous as to order of these vtags.
 				   We think it is this way around. If we are wrong, the order will need
 				   to be changed. */
 			case SN_TO_GLOBAL:
 				*g_vtag = vtag_param->local_vtag;
 				*l_vtag = vtag_param->remote_vtag;
 				break;
 			case SN_TO_LOCAL:
 				*g_vtag = vtag_param->remote_vtag;
 				*l_vtag = vtag_param->local_vtag;
 				break;
 			default:
 				/* unknown direction: do not claim success with unset outputs */
 				return (0);
 			}
 			return (1); /* found */
 		}
 
 		bytes_left -= param_size;
 		if (bytes_left < SN_MIN_PARAM_SIZE)
 			return (0);
 
 		param = SN_SCTP_NEXTPARAM(param);
 		param_size = SCTP_SIZE32(ntohs(param->param_length));
 		if (++param_count > sysctl_param_proc_limit) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("Parameter parse limit exceeded (GetAsconfVtags)",
 				sm->sctp_hdr->v_tag, sysctl_param_proc_limit, direction));
 			return (0); /* not found limit exceeded*/
 		}
 	}
 	return (0); /* not found */
 }
 
 /** @ingroup packet_parser
  * @brief AddGlobalIPAddresses from Init,InitAck,or AddIP packets
  *
  * AddGlobalIPAddresses scans an SCTP chunk (in sm) for Global IP addresses, and
  * adds them.
  *
  * Packets heading SN_TO_GLOBAL carry no global addresses, so only the
  * packet's destination address is considered. For SN_TO_LOCAL the parameters
  * of an INIT, INIT-ACK or ASCONF chunk are scanned for IPv4 address and AddIP
  * parameters. For an association in state SN_ID the packet's own global
  * address is added first when the message is an INIT or there are no
  * parameters to scan.
  *
  * Each address is stored in a freshly allocated sctp_GlobalAddress. When the
  * address is already in the association's list the new entry is freed again.
  * If allocation fails, tracking is switched off (sysctl_track_global_addresses
  * is set to 0) and the function returns.
  *
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  *
  */
 static void
 AddGlobalIPAddresses(struct sctp_nat_msg *sm, struct sctp_nat_assoc *assoc, int direction)
 {
 	struct sctp_ipv4addr_param *ipv4_param;
 	struct sctp_paramhdr *param = NULL;
 	struct sctp_GlobalAddress *G_Addr;
 	struct in_addr g_addr = {0};
 	int bytes_left = 0;
 	int param_size;
 	int param_count = 1, addr_param_count = 0;
 
 	switch (direction) {
 	case SN_TO_GLOBAL: /* does not contain global addresses */
 		g_addr = sm->ip_hdr->ip_dst;
 		bytes_left = 0; /* force exit */
 		break;
 	case SN_TO_LOCAL:
 		g_addr = sm->ip_hdr->ip_src;
 		switch (sm->msg) {
 		case SN_SCTP_INIT:
 			bytes_left = sm->chunk_length - sizeof(struct sctp_init_chunk);
 			param = (struct sctp_paramhdr *)((char *)sm->sctpchnk.Init + sizeof(struct sctp_init));
 			break;
 		case SN_SCTP_INITACK:
 			bytes_left = sm->chunk_length - sizeof(struct sctp_init_ack_chunk);
 			param = (struct sctp_paramhdr *)((char *)sm->sctpchnk.InitAck + sizeof(struct sctp_init_ack));
 			break;
 		case SN_SCTP_ASCONF:
 			bytes_left = sm->chunk_length;
 			param = sm->sctpchnk.Asconf;
 			break;
 		}
 	}
 	/* param is only dereferenced when there is room for a parameter header */
 	if (bytes_left >= SN_MIN_PARAM_SIZE)
 		param_size = SCTP_SIZE32(ntohs(param->param_length));
 	else
 		param_size = bytes_left+1; /* force skip loop */
 
 	if ((assoc->state == SN_ID) && ((sm->msg == SN_SCTP_INIT) || (bytes_left < SN_MIN_PARAM_SIZE))) {/* add pkt address */
 		G_Addr = (struct sctp_GlobalAddress *) sn_malloc(sizeof(struct sctp_GlobalAddress));
 		if (G_Addr == NULL) {/* out of resources */
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("AddGlobalIPAddress: No resources for adding global address - revert to no tracking",
 				sm->sctp_hdr->v_tag,  0, direction));
 			assoc->num_Gaddr = 0; /* don't track any more for this assoc*/
 			sysctl_track_global_addresses=0;
 			return;
 		}
 		G_Addr->g_addr = g_addr;
 		if (!Add_Global_Address_to_List(assoc, G_Addr)) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("AddGlobalIPAddress: Address already in list",
 				sm->sctp_hdr->v_tag,  assoc->num_Gaddr, direction));
 			sn_free(G_Addr); /* not linked into the list, so it is still ours to free */
 		}
 	}
 
 	/* step through parameters */
 	while((bytes_left >= param_size) && (bytes_left >= sizeof(struct sctp_ipv4addr_param))) {
 		if (assoc->num_Gaddr >= sysctl_track_global_addresses) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("AddGlobalIPAddress: Maximum Number of addresses reached",
 				sm->sctp_hdr->v_tag,  sysctl_track_global_addresses, direction));
 			return;
 		}
 		switch (ntohs(param->param_type)) {
 		case SCTP_ADD_IP_ADDRESS:
 			/*
 			 * The embedded address lies beyond the 8 bytes the loop
 			 * condition guarantees; skip parameters that are too
 			 * short to contain it.
 			 */
 			if (param_size < (int)sizeof(struct sctp_asconf_addrv4_param))
 				break;
 			/* skip to address parameter - leave param_size so bytes left will be calculated properly*/
 			param = (struct sctp_paramhdr *) &((struct sctp_asconf_addrv4_param *) param)->addrp;
 			/* FALLTHROUGH */
 		case SCTP_IPV4_ADDRESS:
 			ipv4_param = (struct sctp_ipv4addr_param *) param;
 			/* add addresses to association */
 			G_Addr = (struct sctp_GlobalAddress *) sn_malloc(sizeof(struct sctp_GlobalAddress));
 			if (G_Addr == NULL) {/* out of resources */
 				SN_LOG(SN_LOG_EVENT,
 				    logsctperror("AddGlobalIPAddress: No resources for adding global address - revert to no tracking",
 					sm->sctp_hdr->v_tag,  0, direction));
 				assoc->num_Gaddr = 0; /* don't track any more for this assoc*/
 				sysctl_track_global_addresses=0;
 				return;
 			}
 			/* add address */
 			addr_param_count++;
 			if ((sm->msg == SN_SCTP_ASCONF) && (ipv4_param->addr == INADDR_ANY)) { /* use packet address */
 				G_Addr->g_addr = g_addr;
 				if (!Add_Global_Address_to_List(assoc, G_Addr)) {
 					SN_LOG(SN_LOG_EVENT,
 					    logsctperror("AddGlobalIPAddress: Address already in list",
 						sm->sctp_hdr->v_tag,  assoc->num_Gaddr, direction));
 					sn_free(G_Addr); /* duplicate - release the unused entry */
 				}
 				return; /*shouldn't be any other addresses if the zero address is given*/
 			} else {
 				G_Addr->g_addr.s_addr = ipv4_param->addr;
 				if (!Add_Global_Address_to_List(assoc, G_Addr)) {
 					SN_LOG(SN_LOG_EVENT,
 					    logsctperror("AddGlobalIPAddress: Address already in list",
 						sm->sctp_hdr->v_tag,  assoc->num_Gaddr, direction));
 					sn_free(G_Addr); /* duplicate - release the unused entry */
 				}
 			}
 		}
 
 		bytes_left -= param_size;
 		if (bytes_left < SN_MIN_PARAM_SIZE)
 			break;
 
 		param = SN_SCTP_NEXTPARAM(param);
 		param_size = SCTP_SIZE32(ntohs(param->param_length));
 		if (++param_count > sysctl_param_proc_limit) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("Parameter parse limit exceeded (AddGlobalIPAddress)",
 				sm->sctp_hdr->v_tag, sysctl_param_proc_limit, direction));
 			break; /* limit exceeded*/
 		}
 	}
 	if (addr_param_count == 0) {
 		SN_LOG(SN_LOG_DETAIL,
 		    logsctperror("AddGlobalIPAddress: no address parameters to add",
 			sm->sctp_hdr->v_tag, assoc->num_Gaddr, direction));
 	}
 }
 
 /**
  * @brief Add_Global_Address_to_List
  *
  * Adds a global IP address to an associations address list, if it is not
  * already there.  The first address added us usually the packet's address, and
  * is most likely to be used, so it is added at the beginning. Subsequent
  * addresses are added after this one.
  *
  * @param assoc Pointer to the association this SCTP Message belongs to
  * @param G_addr Pointer to the global address to add
  *
  * @return 1 - success | 0 - fail
  */
 static int
 Add_Global_Address_to_List(struct sctp_nat_assoc *assoc,  struct sctp_GlobalAddress *G_addr)
 {
 	struct sctp_GlobalAddress *iter_G_Addr = NULL, *first_G_Addr = NULL;
 	first_G_Addr = LIST_FIRST(&(assoc->Gaddr));
 	if (first_G_Addr == NULL) {
 		LIST_INSERT_HEAD(&(assoc->Gaddr), G_addr, list_Gaddr); /* add new address to beginning of list*/
 	} else {
 		LIST_FOREACH(iter_G_Addr, &(assoc->Gaddr), list_Gaddr) {
 			if (G_addr->g_addr.s_addr == iter_G_Addr->g_addr.s_addr)
 				return (0); /* already exists, so don't add */
 		}
 		LIST_INSERT_AFTER(first_G_Addr, G_addr, list_Gaddr); /* add address to end of list*/
 	}
 	assoc->num_Gaddr++;
 	return (1); /* success */
 }
 
 /** @ingroup packet_parser
  * @brief RmGlobalIPAddresses from DelIP packets
  *
  * RmGlobalIPAddresses scans an ASCONF chunk for DelIP parameters to remove the
  * given Global IP addresses from the association. It will not delete the
  * the address if it is a list of one address.
  *
  *
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  *
  */
 static void
 RmGlobalIPAddresses(struct sctp_nat_msg *sm, struct sctp_nat_assoc *assoc, int direction)
 {
 	struct sctp_asconf_addrv4_param *asconf_ipv4_param;
 	struct sctp_paramhdr *param;
 	struct sctp_GlobalAddress *G_Addr, *G_Addr_tmp;
 	int bytes_left;
 	int param_size;
 	int param_count;
 
 	bytes_left = sm->chunk_length;
 	param_count = 1;
 	param = sm->sctpchnk.Asconf;
 	if (bytes_left >= SN_MIN_PARAM_SIZE) {
 		param_size = SCTP_SIZE32(ntohs(param->param_length));
 	} else {
 		SN_LOG(SN_LOG_EVENT,
 		    logsctperror("RmGlobalIPAddress: truncated packet - cannot remove IP addresses",
 			sm->sctp_hdr->v_tag, sysctl_track_global_addresses, direction));
 		return;
 	}
 
 	/* step through Asconf parameters */
 	while((bytes_left >= param_size) && (bytes_left >= sizeof(struct sctp_ipv4addr_param))) {
 		if (ntohs(param->param_type) == SCTP_DEL_IP_ADDRESS) {
 			asconf_ipv4_param = (struct sctp_asconf_addrv4_param *) param;
 			if (asconf_ipv4_param->addrp.addr == INADDR_ANY) { /* remove all bar pkt address */
 				LIST_FOREACH_SAFE(G_Addr, &(assoc->Gaddr), list_Gaddr, G_Addr_tmp) {
 					if (G_Addr->g_addr.s_addr != sm->ip_hdr->ip_src.s_addr) {
 						if (assoc->num_Gaddr > 1) { /* only delete if more than one */
 							LIST_REMOVE(G_Addr, list_Gaddr);
 							sn_free(G_Addr);
 							assoc->num_Gaddr--;
 						} else {
 							SN_LOG(SN_LOG_EVENT,
 							    logsctperror("RmGlobalIPAddress: Request to remove last IP address (didn't)",
 								sm->sctp_hdr->v_tag, assoc->num_Gaddr, direction));
 						}
 					}
 				}
 				return; /*shouldn't be any other addresses if the zero address is given*/
 			} else {
 				LIST_FOREACH_SAFE(G_Addr, &(assoc->Gaddr), list_Gaddr, G_Addr_tmp) {
 					if (G_Addr->g_addr.s_addr == asconf_ipv4_param->addrp.addr) {
 						if (assoc->num_Gaddr > 1) { /* only delete if more than one */
 							LIST_REMOVE(G_Addr, list_Gaddr);
 							sn_free(G_Addr);
 							assoc->num_Gaddr--;
 							break; /* Since add only adds new addresses, there should be no double entries */
 						} else {
 							SN_LOG(SN_LOG_EVENT,
 							    logsctperror("RmGlobalIPAddress: Request to remove last IP address (didn't)",
 								sm->sctp_hdr->v_tag, assoc->num_Gaddr, direction));
 						}
 					}
 				}
 			}
 		}
 		bytes_left -= param_size;
 		if (bytes_left == 0)
 			return;
 		else if (bytes_left < SN_MIN_PARAM_SIZE) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("RmGlobalIPAddress: truncated packet - may not have removed all IP addresses",
 				sm->sctp_hdr->v_tag, sysctl_track_global_addresses, direction));
 			return;
 		}
 
 		param = SN_SCTP_NEXTPARAM(param);
 		param_size = SCTP_SIZE32(ntohs(param->param_length));
 		if (++param_count > sysctl_param_proc_limit) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("Parameter parse limit exceeded (RmGlobalIPAddress)",
 				sm->sctp_hdr->v_tag, sysctl_param_proc_limit, direction));
 			return; /* limit exceeded*/
 		}
 	}
 }
 
 /**  @ingroup packet_parser
  * @brief Decide whether an ASCONF-ACK reports success
  *
  * ASCONF configuration parameters carry correlation IDs that an ASCONF-ACK
  * echoes back. The NAT does not track those IDs; it only looks for an ACK
  * while it is setting up a new association from an AddIP, where no other
  * ASCONF parameters are expected to be outstanding. Any success report found
  * is therefore taken to answer that AddIP.
  *
  * The function returns success immediately when the padded length of the
  * first parameter is 8. Otherwise it steps through the parameters looking for
  * an SCTP_SUCCESS_REPORT, giving up when the remaining bytes cannot hold the
  * next parameter or when more than sysctl_param_proc_limit parameters have
  * been examined.
  *
  * NOTE(review): the first parameter header is read before chunk_length is
  * consulted - confirm the caller guarantees a header is present.
  *
  * @param la Pointer to the relevant libalias instance
  * @param sm Pointer to sctp message information
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  *
  * @return 1 - success | 0 - fail
  */
 static int
 IsASCONFack(struct libalias *la, struct sctp_nat_msg *sm, int direction)
 {
 	struct sctp_paramhdr *cur;
 	int remaining;
 	int cur_len;
 	int seen;
 
 	cur = sm->sctpchnk.Asconf;
 	cur_len = SCTP_SIZE32(ntohs(cur->param_length));
 	if (cur_len == 8)
 		return (1); /* default acknowledgement of everything */
 
 	remaining = sm->chunk_length;
 	if (remaining < cur_len)
 		return (0); /* first parameter does not fit */
 
 	for (seen = 1; remaining >= SN_ASCONFACK_PARAM_SIZE; ) {
 		/* correlation IDs cannot be matched - there should only be one */
 		if (ntohs(cur->param_type) == SCTP_SUCCESS_REPORT)
 			return (1);
 
 		/* move on to the next parameter, if one can still fit */
 		remaining -= cur_len;
 		if (remaining < SN_MIN_PARAM_SIZE)
 			return (0);
 		cur = SN_SCTP_NEXTPARAM(cur);
 
 		cur_len = SCTP_SIZE32(ntohs(cur->param_length));
 		if (remaining < cur_len)
 			return (0);
 
 		if (++seen > sysctl_param_proc_limit) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("Parameter parse limit exceeded (IsASCONFack)",
 				sm->sctp_hdr->v_tag, sysctl_param_proc_limit, direction));
 			return (0); /* limit exceeded, nothing found */
 		}
 	}
 	return (0); /* no success report */
 }
 
 /**  @ingroup packet_parser
  * @brief Report whether an ASCONF carries an AddIP or a DelIP parameter
  *
  * IsADDorDEL steps through the parameters of an ASCONF chunk and returns the
  * type of the first AddIP or DelIP parameter it meets. The scan gives up when
  * the remaining bytes cannot hold the next parameter or when more than
  * sysctl_param_proc_limit parameters have been examined.
  *
  * NOTE(review): the first parameter header is read before chunk_length is
  * consulted - confirm the caller guarantees a header is present.
  *
  * @param la Pointer to the relevant libalias instance
  * @param sm Pointer to sctp message information
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  *
  * @return SCTP_ADD_IP_ADDRESS | SCTP_DEL_IP_ADDRESS | 0 - fail
  */
 static int
 IsADDorDEL(struct libalias *la, struct sctp_nat_msg *sm, int direction)
 {
 	struct sctp_paramhdr *cur;
 	int remaining;
 	int cur_len;
 	int seen;
 
 	cur = sm->sctpchnk.Asconf;
 	cur_len = SCTP_SIZE32(ntohs(cur->param_length));
 
 	remaining = sm->chunk_length;
 	if (remaining < cur_len)
 		return (0); /* first parameter does not fit */
 
 	for (seen = 1; remaining >= SN_ASCONFACK_PARAM_SIZE; ) {
 		switch (ntohs(cur->param_type)) {
 		case SCTP_ADD_IP_ADDRESS:
 			return (SCTP_ADD_IP_ADDRESS);
 		case SCTP_DEL_IP_ADDRESS:
 			return (SCTP_DEL_IP_ADDRESS);
 		default:
 			break; /* some other parameter, keep looking */
 		}
 
 		/* move on to the next parameter, if one can still fit */
 		remaining -= cur_len;
 		if (remaining < SN_MIN_PARAM_SIZE)
 			return (0); /* neither found */
 		cur = SN_SCTP_NEXTPARAM(cur);
 
 		cur_len = SCTP_SIZE32(ntohs(cur->param_length));
 		if (remaining < cur_len)
 			return (0);
 
 		if (++seen > sysctl_param_proc_limit) {
 			SN_LOG(SN_LOG_EVENT,
 			    logsctperror("Parameter parse limit exceeded IsADDorDEL)",
 				sm->sctp_hdr->v_tag, sysctl_param_proc_limit, direction));
 			return (0); /* limit exceeded, nothing found */
 		}
 	}
 	return (0); /* neither found */
 }
 
 /* ----------------------------------------------------------------------
  *                            STATE MACHINE CODE
  * ----------------------------------------------------------------------
  */
 /** @addtogroup state_machine
  *
  * The SCTP NAT State Machine functions will:
  * - Process an already parsed packet
  * - Use the existing NAT Hash Tables
  * - Determine the next state for the association
  * - Update the NAT Hash Tables and Timer Queues
  * - Return the appropriate action to take with the packet
  */
 /** @ingroup state_machine
  * @brief Dispatch an SCTP message to the handler for the association state
  *
  * This is the base of the state machine: it selects the per-state processing
  * function from assoc->state and returns that function's verdict. In the Idle
  * state, any verdict other than SN_NAT_PKT also marks the association for
  * removal (SN_RM). A state with no handler yields SN_PROCESSING_ERROR.
  *
  * @param la Pointer to the relevant libalias instance
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  *
  * @return SN_DROP_PKT | SN_NAT_PKT | SN_REPLY_ABORT | SN_REPLY_ERROR | SN_PROCESSING_ERROR
  */
 static int
 ProcessSctpMsg(struct libalias *la, int direction, struct sctp_nat_msg *sm, struct sctp_nat_assoc *assoc)
 {
 	int verdict = SN_PROCESSING_ERROR;
 
 	switch (assoc->state) {
 	case SN_ID: /* Idle */
 		verdict = ID_process(la, direction, assoc, sm);
 		if (verdict != SN_NAT_PKT)
 			assoc->state = SN_RM; /* Mark for removal */
 		break;
 	case SN_INi: /* Initialising - Init */
 		verdict = INi_process(la, direction, assoc, sm);
 		break;
 	case SN_INa: /* Initialising - AddIP */
 		verdict = INa_process(la, direction, assoc, sm);
 		break;
 	case SN_UP: /* Association UP */
 		verdict = UP_process(la, direction, assoc, sm);
 		break;
 	case SN_CL: /* Association Closing */
 		verdict = CL_process(la, direction, assoc, sm);
 		break;
 	default: /* no handler for this state */
 		break;
 	}
 	return (verdict);
 }
 
 /** @ingroup state_machine
  * @brief Process SCTP message while in the Idle state
  *
  * This function looks for an Incoming INIT or AddIP message.
  *
  * All other SCTP messages are invalid when in SN_ID, and are dropped.
  *
  * @param la Pointer to the relevant libalias instance
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  *
  * @return SN_NAT_PKT | SN_DROP_PKT | SN_REPLY_ABORT | SN_REPLY_ERROR
  */
 static int
 ID_process(struct libalias *la, int direction, struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm)
 {
 	switch (sm->msg) {
 	case SN_SCTP_ASCONF:           /* a packet containing an ASCONF chunk with ADDIP */
 		if (!sysctl_accept_global_ootb_addip && (direction == SN_TO_LOCAL))
 			return (SN_DROP_PKT);
 		/* if this Asconf packet does not contain the Vtag parameters it is of no use in Idle state */
 		if (!GetAsconfVtags(la, sm, &(assoc->l_vtag), &(assoc->g_vtag), direction))
 			return (SN_DROP_PKT);
 		/* FALLTHROUGH */
 	case SN_SCTP_INIT:            /* a packet containing an INIT chunk or an ASCONF AddIP */
 		if (sysctl_track_global_addresses)
 			AddGlobalIPAddresses(sm, assoc, direction);
 		switch (direction) {
 		case SN_TO_GLOBAL:
 			assoc->l_addr = sm->ip_hdr->ip_src;
 			assoc->a_addr = FindAliasAddress(la, assoc->l_addr);
 			assoc->l_port = sm->sctp_hdr->src_port;
 			assoc->g_port = sm->sctp_hdr->dest_port;
 			if (sm->msg == SN_SCTP_INIT)
 				assoc->g_vtag = sm->sctpchnk.Init->initiate_tag;
 			if (AddSctpAssocGlobal(la, assoc)) /* DB clash: need to add dst address */
 				return ((sm->msg == SN_SCTP_INIT) ? SN_REPLY_ABORT : SN_REPLY_ERROR);
 			if (sm->msg == SN_SCTP_ASCONF) {
 				if (AddSctpAssocLocal(la, assoc, sm->ip_hdr->ip_dst)) /* DB clash */
 					return (SN_REPLY_ERROR);
 				assoc->TableRegister |= SN_WAIT_TOLOCAL; /* wait for tolocal ack */
 			}
 		break;
 		case SN_TO_LOCAL:
 			assoc->l_addr = FindSctpRedirectAddress(la, sm);
 			assoc->a_addr = sm->ip_hdr->ip_dst;
 			assoc->l_port = sm->sctp_hdr->dest_port;
 			assoc->g_port = sm->sctp_hdr->src_port;
 			if (sm->msg == SN_SCTP_INIT)
 				assoc->l_vtag = sm->sctpchnk.Init->initiate_tag;
 			if (AddSctpAssocLocal(la, assoc, sm->ip_hdr->ip_src)) /* DB clash */
 				return ((sm->msg == SN_SCTP_INIT) ? SN_REPLY_ABORT : SN_REPLY_ERROR);
 			if (sm->msg == SN_SCTP_ASCONF) {
 				if (AddSctpAssocGlobal(la, assoc)) /* DB clash: need to add src address */
 					return (SN_REPLY_ERROR);
 				assoc->TableRegister |= SN_WAIT_TOGLOBAL; /* wait for toglobal ack */
 			}
 			break;
 		}
 		assoc->state = (sm->msg == SN_SCTP_INIT) ? SN_INi : SN_INa;
 		assoc->exp = SN_I_T(la);
 		sctp_AddTimeOut(la,assoc);
 		return (SN_NAT_PKT);
 	default: /* Any other type of SCTP message is not valid in Idle */
 		return (SN_DROP_PKT);
 	}
 	return (SN_DROP_PKT);/* shouldn't get here very bad: log, drop and hope for the best */
 }
 
 /** @ingroup state_machine
  * @brief Process SCTP message while waiting for an INIT-ACK message
  *
  * Three messages are acted on in this state; everything else is dropped:
  * - a resent INIT resets the timeout to SN_I_T(la);
  * - an ABORT marks the association for removal;
  * - an INIT-ACK records the peer's initiate tag, enters the association in
  *   the remaining look-up table (local for SN_TO_LOCAL, global for
  *   SN_TO_GLOBAL) and moves it to SN_UP. A table clash marks the association
  *   for removal and returns SN_SEND_ABORT.
  *
  * @param la Pointer to the relevant libalias instance
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  *
  * @return SN_NAT_PKT | SN_DROP_PKT | SN_SEND_ABORT
  */
 static int
 INi_process(struct libalias *la, int direction, struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm)
 {
 	if (sm->msg == SN_SCTP_INIT) { /* retransmitted INIT */
 		sctp_ResetTimeOut(la, assoc, SN_I_T(la));
 		return (SN_NAT_PKT);
 	}
 	if (sm->msg == SN_SCTP_ABORT) {
 		assoc->state = SN_RM; /* Mark for removal */
 		return (SN_NAT_PKT);
 	}
 	if (sm->msg != SN_SCTP_INITACK)
 		return (SN_DROP_PKT);
 
 	/* INIT-ACK: complete the table registration for this direction */
 	if (direction == SN_TO_LOCAL) {
 		if (assoc->num_Gaddr) /* tracking global addresses for this association */
 			AddGlobalIPAddresses(sm, assoc, direction);
 		assoc->l_vtag = sm->sctpchnk.Init->initiate_tag;
 		if (AddSctpAssocLocal(la, assoc, sm->ip_hdr->ip_src)) { /* DB clash */
 			assoc->state = SN_RM; /* Mark for removal */
 			return (SN_SEND_ABORT);
 		}
 	} else if (direction == SN_TO_GLOBAL) {
 		assoc->l_addr = sm->ip_hdr->ip_src; /* Only if not set in Init! */
 		assoc->g_vtag = sm->sctpchnk.Init->initiate_tag;
 		if (AddSctpAssocGlobal(la, assoc)) { /* DB clash */
 			assoc->state = SN_RM; /* Mark for removal */
 			return (SN_SEND_ABORT);
 		}
 	}
 
 	assoc->state = SN_UP; /* association established for NAT */
 	sctp_ResetTimeOut(la,assoc, SN_U_T(la));
 	return (SN_NAT_PKT);
 }
 
 /** @ingroup state_machine
  * @brief Process SCTP message while waiting for an AddIp-ACK message
  *
  * Three messages are acted on in this state; everything else is dropped:
  * - a resent ASCONF resets the timeout to SN_I_T(la);
  * - an ABORT marks the association for removal;
  * - an ASCONF-ACK is dropped if it travels in a direction the association is
  *   not waiting on. Otherwise, when IsASCONFack() reports success the wait
  *   flags are cleared and the association moves to SN_UP; when it does not,
  *   the association is marked for removal. The packet is forwarded in both
  *   cases.
  *
  * @param la Pointer to the relevant libalias instance
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  *
  * @return SN_NAT_PKT | SN_DROP_PKT
  */
 static int
 INa_process(struct libalias *la, int direction,struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm)
 {
 	if (sm->msg == SN_SCTP_ASCONF) { /* resent ASCONF */
 		sctp_ResetTimeOut(la,assoc, SN_I_T(la));
 		return (SN_NAT_PKT);
 	}
 	if (sm->msg == SN_SCTP_ABORT) {
 		assoc->state = SN_RM; /* Mark for removal */
 		return (SN_NAT_PKT);
 	}
 	if (sm->msg != SN_SCTP_ASCONFACK)
 		return (SN_DROP_PKT);
 
 	/* the ACK must come from the side we are waiting on */
 	if (direction == SN_TO_LOCAL) {
 		if (!(assoc->TableRegister & SN_WAIT_TOLOCAL))
 			return (SN_DROP_PKT); /* wrong direction */
 	} else if (direction == SN_TO_GLOBAL) {
 		if (!(assoc->TableRegister & SN_WAIT_TOGLOBAL))
 			return (SN_DROP_PKT); /* wrong direction */
 	}
 
 	if (!IsASCONFack(la,sm,direction)) {
 		assoc->state = SN_RM; /* Mark for removal */
 		return (SN_NAT_PKT);
 	}
 
 	assoc->TableRegister &= SN_BOTH_TBL; /* remove wait flags */
 	assoc->state = SN_UP; /* association established for NAT */
 	sctp_ResetTimeOut(la,assoc, SN_U_T(la));
 	return (SN_NAT_PKT);
 }
 
 /** @ingroup state_machine
  * @brief Process SCTP messages while association is UP redirecting packets
  *
  * While in the SN_UP state, all packets for the particular association
  * are passed. Only a SHUT-ACK or an ABORT will cause a change of state:
  * a SHUT-ACK moves the association to SN_CL and resets its timeout to
  * SN_C_T(la); an ABORT marks the association for removal (SN_RM).
  *
  * An ASCONF travelling towards the local side, for an association whose
  * global address list is not empty (num_Gaddr != 0), is inspected with
  * IsADDorDEL() and the list is updated through AddGlobalIPAddresses() or
  * RmGlobalIPAddresses(). The ASCONF is then treated like any other message:
  * the timeout is reset to SN_U_T(la) and the packet is forwarded.
  *
  * @param la Pointer to the relevant libalias instance
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  *
  * @return SN_NAT_PKT | SN_DROP_PKT (every case of the switch returns
  *         SN_NAT_PKT; the trailing SN_DROP_PKT is a safety net only)
  */
 static int
 UP_process(struct libalias *la, int direction, struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm)
 {
 	switch (sm->msg) {
 	case SN_SCTP_SHUTACK:         /* a packet containing a SHUTDOWN-ACK chunk */
 		/* association starts closing; switch to the closing timeout */
 		assoc->state = SN_CL;
 		sctp_ResetTimeOut(la,assoc, SN_C_T(la));
 		return (SN_NAT_PKT);
 	case SN_SCTP_ABORT:           /* a packet containing an ABORT chunk */
 		assoc->state = SN_RM;/* Mark for removal*/
 		return (SN_NAT_PKT);
 	case SN_SCTP_ASCONF:           /* a packet containing an ASCONF chunk*/
 		/* only ASCONFs from the global side update the tracked global address list */
 		if ((direction == SN_TO_LOCAL) && assoc->num_Gaddr) /*If tracking global addresses for this association & from global side */
 			switch (IsADDorDEL(la,sm,direction)) {
 			case SCTP_ADD_IP_ADDRESS:
 				AddGlobalIPAddresses(sm, assoc, direction);
 				break;
 			case SCTP_DEL_IP_ADDRESS:
 				RmGlobalIPAddresses(sm, assoc, direction);
 				break;
 			}
-		/* fall through to default */
+		/* FALLTHROUGH */
 	default:
 		/* any traffic keeps the association alive for another SN_U_T(la) */
 		sctp_ResetTimeOut(la,assoc, SN_U_T(la));
 		return (SN_NAT_PKT);  /* forward packet */
 	}
 	return (SN_DROP_PKT);/* shouldn't get here very bad: log, drop and hope for the best */
 }
 
 /** @ingroup state_machine
  * @brief Process SCTP message while association is in the process of closing
  *
  * Only SHUT-COMP, SHUT-ACK and ABORT are acted on in this state; all other
  * packets are dropped.
  * - SHUT-COMP: when sysctl_holddown_timer is positive the association stays
  *   in SN_CL with its timeout reset to SN_X_T(la); otherwise it is marked for
  *   removal.
  * - SHUT-ACK: the association stays in SN_CL and the timeout is reset to
  *   SN_C_T(la).
  * - ABORT: the association is marked for removal.
  *
  * @param la Pointer to the relevant libalias instance
  * @param direction SN_TO_LOCAL | SN_TO_GLOBAL
  * @param sm Pointer to sctp message information
  * @param assoc Pointer to the association this SCTP Message belongs to
  *
  * @return SN_NAT_PKT | SN_DROP_PKT
  */
 static int
 CL_process(struct libalias *la, int direction,struct sctp_nat_assoc *assoc, struct sctp_nat_msg *sm)
 {
 	if (sm->msg == SN_SCTP_SHUTCOMP) {
 		if (sysctl_holddown_timer > 0) {
 			/* stay in Close state so that Tbit packets can still pass */
 			assoc->state = SN_CL;
 			sctp_ResetTimeOut(la, assoc, SN_X_T(la));
 		} else {
 			assoc->state = SN_RM; /* Mark for removal */
 		}
 		return (SN_NAT_PKT);
 	}
 
 	if (sm->msg == SN_SCTP_SHUTACK) {
 		assoc->state = SN_CL; /* Stay in Close state until timeout */
 		sctp_ResetTimeOut(la, assoc, SN_C_T(la));
 		return (SN_NAT_PKT);
 	}
 
 	if (sm->msg == SN_SCTP_ABORT) {
 		assoc->state = SN_RM; /* Mark for removal */
 		return (SN_NAT_PKT);
 	}
 
 	return (SN_DROP_PKT); /* nothing else is permitted while closing */
 }
 
 /* ----------------------------------------------------------------------
  *                           HASH TABLE CODE
  * ----------------------------------------------------------------------
  */
 /** @addtogroup Hash
  *
  * The Hash functions facilitate searching the NAT Hash Tables for associations
  * as well as adding/removing associations from the table(s).
  */
 /** @ingroup Hash
  * @brief Find the SCTP association given the local address, port and vtag
  *
  * Searches the local look-up table bucket selected by <l_vtag, l_port> for an
  * association whose local vtag, local port, global port and local address all
  * match. If the matching association tracks global addresses (num_Gaddr is
  * non-zero), g_addr must also be present in its global address list;
  * otherwise the association matches regardless of g_addr.
  *
  * A zero l_vtag never matches.
  *
  * @param la Pointer to the relevant libalias instance
  * @param l_addr local address
  * @param g_addr global address
  * @param l_vtag local Vtag
  * @param l_port local Port
  * @param g_port global Port
  *
  * @return pointer to association or NULL
  */
 static struct sctp_nat_assoc *
 FindSctpLocal(struct libalias *la, struct in_addr l_addr, struct in_addr g_addr, uint32_t l_vtag, uint16_t l_port, uint16_t g_port)
 {
 	struct sctp_nat_assoc *entry;
 	struct sctp_GlobalAddress *known;
 	u_int bucket;
 
 	if (l_vtag == 0) /* an init packet, vtag==0 */
 		return (NULL);
 
 	bucket = SN_TABLE_HASH(l_vtag, l_port, la->sctpNatTableSize);
 	LIST_FOREACH(entry, &la->sctpTableLocal[bucket], list_L) {
 		if ((entry->l_vtag != l_vtag) || (entry->l_port != l_port) ||
 		    (entry->g_port != g_port) ||
 		    (entry->l_addr.s_addr != l_addr.s_addr))
 			continue;
 
 		/* not tracking global addresses: the tuple alone decides */
 		if (entry->num_Gaddr == 0)
 			return (entry);
 
 		LIST_FOREACH(known, &(entry->Gaddr), list_Gaddr) {
 			if (known->g_addr.s_addr == g_addr.s_addr)
 				return (entry);
 		}
 	}
 	return (NULL);
 }
 
 /** @ingroup Hash
  * @brief Check for Global Clash
  *
  * Searches the global look-up table bucket selected by Cassoc's
  * <g_vtag, g_port> for an association with the same global vtag, global port
  * and local port. Such an association clashes if it does not track global
  * addresses, or if it shares at least one global address with Cassoc.
  *
  * A zero g_vtag in Cassoc never clashes.
  *
  * @param la Pointer to the relevant libalias instance
  * @param Cassoc association being checked for a clash
  *
  * @return pointer to association or NULL
  */
 static struct sctp_nat_assoc *
 FindSctpGlobalClash(struct libalias *la, struct sctp_nat_assoc *Cassoc)
 {
 	struct sctp_nat_assoc *entry;
 	struct sctp_GlobalAddress *theirs;
 	struct sctp_GlobalAddress *ours;
 	u_int bucket;
 
 	if (Cassoc->g_vtag == 0) /* an init packet, vtag==0 */
 		return (NULL);
 
 	bucket = SN_TABLE_HASH(Cassoc->g_vtag, Cassoc->g_port, la->sctpNatTableSize);
 	LIST_FOREACH(entry, &la->sctpTableGlobal[bucket], list_G) {
 		if ((entry->g_vtag != Cassoc->g_vtag) ||
 		    (entry->g_port != Cassoc->g_port) ||
 		    (entry->l_port != Cassoc->l_port))
 			continue;
 
 		/* existing entry accepts any global address: always a clash */
 		if (entry->num_Gaddr == 0)
 			return (entry);
 
 		/* otherwise a clash needs one global address in common */
 		LIST_FOREACH(theirs, &(Cassoc->Gaddr), list_Gaddr) {
 			LIST_FOREACH(ours, &(entry->Gaddr), list_Gaddr) {
 				if (ours->g_addr.s_addr == theirs->g_addr.s_addr)
 					return (entry);
 			}
 		}
 	}
 	return (NULL);
 }
 
 /** @ingroup Hash
  * @brief Find the SCTP association given the global port and vtag
  *
  * Searches the global look-up table bucket selected by <g_vtag, g_port> for an
  * association whose global vtag, global port and local port match. If the
  * association tracks global addresses, g_addr must also be in its global
  * address list; otherwise it matches regardless of g_addr.
  *
  * *partial_match is cleared on entry and set to 1 as soon as any association
  * matches on vtag and ports, whether or not the address also matches. If the
  * NAT is tracking global IP addresses for this association, the NAT may
  * respond with an ERRORM to request the missing address to be added.
  *
  * A zero g_vtag never matches.
  *
  * @param la Pointer to the relevant libalias instance
  * @param g_addr global address
  * @param g_vtag global vtag
  * @param g_port global port
  * @param l_port local port
  * @param partial_match set to 1 when vtag and ports matched, else 0
  *
  * @return pointer to association or NULL
  */
 static struct sctp_nat_assoc *
 FindSctpGlobal(struct libalias *la, struct in_addr g_addr, uint32_t g_vtag, uint16_t g_port, uint16_t l_port, int *partial_match)
 {
 	struct sctp_nat_assoc *entry;
 	struct sctp_GlobalAddress *known;
 	u_int bucket;
 
 	*partial_match = 0;
 	if (g_vtag == 0) /* an init packet, vtag==0 */
 		return (NULL);
 
 	bucket = SN_TABLE_HASH(g_vtag, g_port, la->sctpNatTableSize);
 	LIST_FOREACH(entry, &la->sctpTableGlobal[bucket], list_G) {
 		if ((entry->g_vtag != g_vtag) || (entry->g_port != g_port) ||
 		    (entry->l_port != l_port))
 			continue;
 
 		/* everything but (possibly) the global address agrees */
 		*partial_match = 1;
 		if (entry->num_Gaddr == 0)
 			return (entry);
 
 		LIST_FOREACH(known, &(entry->Gaddr), list_Gaddr) {
 			if (known->g_addr.s_addr == g_addr.s_addr)
 				return (entry);
 		}
 	}
 	return (NULL);
 }
 
 /** @ingroup Hash
  * @brief Find the SCTP association for a T-Flag message (given the global port and local vtag)
  *
  * Walks the sctpTableGlobal bucket selected by <l_vtag, g_port> and compares
  * l_vtag against each association's g_vtag, together with both ports.
  * - An association that tracks global addresses is returned at once if
  *   g_addr is in its global address list.
  * - Associations that do not track global addresses are only candidates: the
  *   candidate is returned when the walk ends with exactly one of them, and
  *   NULL is returned as soon as a second one is met, because it is then
  *   unknown which local address to send to.
  *
  * A zero l_vtag never matches.
  *
  * @param la Pointer to the relevant libalias instance
  * @param g_addr global address
  * @param l_vtag local Vtag
  * @param g_port global Port
  * @param l_port local Port
  *
  * @return pointer to association or NULL
  */
 static struct sctp_nat_assoc *
 FindSctpLocalT(struct libalias *la, struct in_addr g_addr, uint32_t l_vtag, uint16_t g_port, uint16_t l_port)
 {
 	struct sctp_nat_assoc *entry;
 	struct sctp_nat_assoc *candidate = NULL;
 	struct sctp_GlobalAddress *known;
 	u_int bucket;
 
 	if (l_vtag == 0) /* an init packet, vtag==0 */
 		return (NULL);
 
 	bucket = SN_TABLE_HASH(l_vtag, g_port, la->sctpNatTableSize);
 	LIST_FOREACH(entry, &la->sctpTableGlobal[bucket], list_G) {
 		if ((entry->g_vtag != l_vtag) || (entry->g_port != g_port) ||
 		    (entry->l_port != l_port))
 			continue;
 
 		if (entry->num_Gaddr) {
 			LIST_FOREACH(known, &(entry->Gaddr), list_Gaddr) {
 				if (known->g_addr.s_addr == g_addr.s_addr)
 					return (entry); /* full match */
 			}
 			continue;
 		}
 
 		/* a second address-less match makes the result ambiguous */
 		if (candidate != NULL)
 			return (NULL);
 		candidate = entry;
 	}
 	return (candidate);
 }
 
 /** @ingroup Hash
  * @brief Find the SCTP association for a T-Flag message (given the local port and global vtag)
  *
  * Walks the sctpTableLocal bucket selected by <g_vtag, l_port> and compares
  * g_vtag against each association's l_vtag, together with both ports. If the
  * matching association tracks global addresses, g_addr must also be in its
  * global address list; otherwise it matches regardless of g_addr.
  *
  * A zero g_vtag never matches.
  *
  * @param la Pointer to the relevant libalias instance
  * @param g_addr global address
  * @param g_vtag global vtag
  * @param l_port local port
  * @param g_port global port
  *
  * @return pointer to association or NULL
  */
 static struct sctp_nat_assoc *
 FindSctpGlobalT(struct libalias *la, struct in_addr g_addr, uint32_t g_vtag, uint16_t l_port, uint16_t g_port)
 {
 	struct sctp_nat_assoc *entry;
 	struct sctp_GlobalAddress *known;
 	u_int bucket;
 
 	if (g_vtag == 0) /* an init packet, vtag==0 */
 		return (NULL);
 
 	bucket = SN_TABLE_HASH(g_vtag, l_port, la->sctpNatTableSize);
 	LIST_FOREACH(entry, &la->sctpTableLocal[bucket], list_L) {
 		if ((entry->l_vtag != g_vtag) || (entry->l_port != l_port) ||
 		    (entry->g_port != g_port))
 			continue;
 
 		if (entry->num_Gaddr == 0)
 			return (entry);
 
 		LIST_FOREACH(known, &(entry->Gaddr), list_Gaddr) {
 			if (known->g_addr.s_addr == g_addr.s_addr)
 				return (entry);
 		}
 	}
 	return (NULL);
 }
 
 /** @ingroup Hash
  * @brief  Add the sctp association information to the local look up table
  *
  * Searches the local look-up table for an existing association with the same
  * details. If a match exists and is ONLY in the local look-up table then this
  * is a repeated INIT packet, we need to remove this association from the
  * look-up table and add the new association
  *
  * The new association is added to the head of the list and state is updated
  *
  * @param la Pointer to the relevant libalias instance
  * @param assoc pointer to sctp association
  * @param g_addr global address
  *
  * @return SN_ADD_OK | SN_ADD_CLASH
  */
 static int
 AddSctpAssocLocal(struct libalias *la, struct sctp_nat_assoc *assoc, struct in_addr g_addr)
 {
 	struct sctp_nat_assoc *found;
 
 	LIBALIAS_LOCK_ASSERT(la);
 	found = FindSctpLocal(la, assoc->l_addr, g_addr, assoc->l_vtag, assoc->l_port, assoc->g_port);
 	/*
 	 * Note that if a different global address initiated this Init,
 	 * ie it wasn't resent as presumed:
 	 *  - the local receiver if receiving it for the first time will establish
 	 *    an association with the new global host
 	 *  - if receiving an init from a different global address after sending a
 	 *    lost initack it will send an initack to the new global host, the first
 	 *    association attempt will then be blocked if retried.
 	 */
 	if (found != NULL) {
 		if ((found->TableRegister == SN_LOCAL_TBL) && (found->g_port == assoc->g_port)) { /* resent message */
 			RmSctpAssoc(la, found);
 			sctp_RmTimeOut(la, found);
 			freeGlobalAddressList(found);
 			sn_free(found);
 		} else
 			return (SN_ADD_CLASH);
 	}
 
 	LIST_INSERT_HEAD(&la->sctpTableLocal[SN_TABLE_HASH(assoc->l_vtag, assoc->l_port, la->sctpNatTableSize)],
 	    assoc, list_L);
 	assoc->TableRegister |= SN_LOCAL_TBL;
 	la->sctpLinkCount++; //increment link count
 
 	if (assoc->TableRegister == SN_BOTH_TBL) {
 		/* libalias log -- controlled by libalias */
 		if (la->packetAliasMode & PKT_ALIAS_LOG)
 			SctpShowAliasStats(la);
 
 		SN_LOG(SN_LOG_INFO, logsctpassoc(assoc, "^"));
 	}
 
 	return (SN_ADD_OK);
 }
 
 /** @ingroup Hash
  * @brief  Add the sctp association information to the global look up table
  *
  * Searches the global look-up table for an existing association with the same
  * details. If a match exists and is ONLY in the global look-up table then this
  * is a repeated INIT packet, we need to remove this association from the
  * look-up table and add the new association
  *
  * The new association is added to the head of the list and state is updated
  *
  * @param la Pointer to the relevant libalias instance
  * @param assoc pointer to sctp association
  *
  * @return SN_ADD_OK | SN_ADD_CLASH
  */
 static int
 AddSctpAssocGlobal(struct libalias *la, struct sctp_nat_assoc *assoc)
 {
 	struct sctp_nat_assoc *found;
 
 	LIBALIAS_LOCK_ASSERT(la);
 	found = FindSctpGlobalClash(la, assoc);
 	if (found != NULL) {
 		if ((found->TableRegister == SN_GLOBAL_TBL) &&
 		    (found->l_addr.s_addr == assoc->l_addr.s_addr) &&
 		    (found->l_port == assoc->l_port)) { /* resent message */
 			RmSctpAssoc(la, found);
 			sctp_RmTimeOut(la, found);
 			freeGlobalAddressList(found);
 			sn_free(found);
 		} else
 			return (SN_ADD_CLASH);
 	}
 
 	LIST_INSERT_HEAD(&la->sctpTableGlobal[SN_TABLE_HASH(assoc->g_vtag, assoc->g_port, la->sctpNatTableSize)],
 	    assoc, list_G);
 	assoc->TableRegister |= SN_GLOBAL_TBL;
 	la->sctpLinkCount++; //increment link count
 
 	if (assoc->TableRegister == SN_BOTH_TBL) {
 		/* libalias log -- controlled by libalias */
 		if (la->packetAliasMode & PKT_ALIAS_LOG)
 			SctpShowAliasStats(la);
 
 		SN_LOG(SN_LOG_INFO, logsctpassoc(assoc, "^"));
 	}
 
 	return (SN_ADD_OK);
 }
 
 /** @ingroup Hash
  * @brief Remove the sctp association information from the look up table
  *
  * Unlinks the association from each look-up table (local and global) it is
  * registered in, clearing the matching TableRegister flag and decrementing
  * the link count once per table. An association that was in both tables is
  * logged before it is unlinked. A NULL association is logged and ignored.
  *
  * NOTE: The calling code is responsible for freeing memory allocated to the
  *       association structure itself
  *
  * NOTE: The association is NOT removed from the timer queue
  *
  * @param la Pointer to the relevant libalias instance
  * @param assoc pointer to sctp association
  */
 static void
 RmSctpAssoc(struct libalias *la, struct sctp_nat_assoc *assoc)
 {
 	if (assoc == NULL) {
 		/* very bad, log and die*/
 		SN_LOG(SN_LOG_LOW,
 		    logsctperror("ERROR: alias_sctp:RmSctpAssoc(NULL)\n", 0, 0, SN_TO_NODIR));
 		return;
 	}
 
 	/* an association in both tables was fully up and is now closing */
 	if (assoc->TableRegister == SN_BOTH_TBL) {
 		SN_LOG(SN_LOG_INFO, logsctpassoc(assoc, "$"));
 	}
 
 	LIBALIAS_LOCK_ASSERT(la);
 
 	if (assoc->TableRegister & SN_LOCAL_TBL) {
 		assoc->TableRegister ^= SN_LOCAL_TBL;
 		la->sctpLinkCount -= 1; /* one table link fewer */
 		LIST_REMOVE(assoc, list_L);
 	}
 
 	if (assoc->TableRegister & SN_GLOBAL_TBL) {
 		assoc->TableRegister ^= SN_GLOBAL_TBL;
 		la->sctpLinkCount -= 1; /* one table link fewer */
 		LIST_REMOVE(assoc, list_G);
 	}
 
 	/* the association itself is left allocated for the caller */
 	/* libalias logging -- controlled by libalias log definition */
 	if (la->packetAliasMode & PKT_ALIAS_LOG)
 		SctpShowAliasStats(la);
 }
 
 /**
  * @ingroup Hash
  * @brief  free the Global Address List memory
  *
  * freeGlobalAddressList unlinks and frees every entry of an association's
  * global IP address list and resets num_Gaddr to zero, so that neither the
  * list head nor the counter refers to freed entries afterwards.
  *
  * The association structure itself is not freed.
  *
  * @param assoc association whose global address list is released
  */
 static void freeGlobalAddressList(struct sctp_nat_assoc *assoc)
 {
 	struct sctp_GlobalAddress *entry;
 
 	/* pop from the head until the list is empty */
 	while ((entry = LIST_FIRST(&(assoc->Gaddr))) != NULL) {
 		LIST_REMOVE(entry, list_Gaddr);
 		sn_free(entry);
 	}
 	assoc->num_Gaddr = 0;
 }
 /* ----------------------------------------------------------------------
  *                            TIMER QUEUE CODE
  * ----------------------------------------------------------------------
  */
 /** @addtogroup Timer
  *
  * The timer queue management functions are designed to operate efficiently with
  * a minimum of interaction with the queues.
  *
  * Once a timeout is set in the queue it will not be altered in the queue unless
  * it has to be changed to a shorter time (usually only for aborts and closing).
  * On a queue timeout, the real expiry time is checked, and if it is later than
  * the queue slot's time it is requeued (O(1)) at that later time. This is
  * especially important
  * for normal packets sent during an association. When a timer expires, it is
  * updated to its new expiration time if necessary, or processed as a
  * timeout. This means that while in UP state, the timing queue is only altered
  * every U_T (every few minutes) for a particular association.
  */
 /** @ingroup Timer
  * @brief Add an association timeout to the timer queue
  *
  * Computes the queue slot for assoc->exp relative to the queue's current
  * time (loc_time) and position (cur_loc), wrapping once past the end of the
  * queue, then inserts the association at the head of that slot and records
  * the slot in assoc->exp_loc.
  *
  * NOTE(review): only a single wrap is applied, so this presumably relies on
  * the expiry lying within one queue length of loc_time - confirm.
  *
  * @param la Pointer to the relevant libalias instance
  * @param assoc pointer to sctp association
  */
 static void
 sctp_AddTimeOut(struct libalias *la, struct sctp_nat_assoc *assoc)
 {
 	int slot;
 
 	LIBALIAS_LOCK_ASSERT(la);
 	slot = assoc->exp - la->sctpNatTimer.loc_time + la->sctpNatTimer.cur_loc;
 	if (!(slot < SN_TIMER_QUEUE_SIZE))
 		slot -= SN_TIMER_QUEUE_SIZE; /* wrap around the circular queue */
 	assoc->exp_loc = slot;
 	LIST_INSERT_HEAD(&la->sctpNatTimer.TimerQ[slot], assoc, timer_Q);
 }
 
 /** @ingroup Timer
  * @brief Remove an association from timer queue
  *
  * Unlinks the association from the timer queue slot it is currently linked
  * into. The association is not freed and its stored expiry fields are not
  * modified by this function.
  *
  * @param la Pointer to the relevant libalias instance (used here only for the
  *           lock assertion)
  * @param assoc pointer to sctp association; NOTE(review): presumably it must
  *           currently be linked on a timer queue slot -- confirm with callers
  */
 static void
 sctp_RmTimeOut(struct libalias *la, struct sctp_nat_assoc *assoc)
 {
 	LIBALIAS_LOCK_ASSERT(la);
 	LIST_REMOVE(assoc, timer_Q);/* unlink via the entry's own links; O(1), no slot lookup */
 }
 
 /** @ingroup Timer
  * @brief Change the expiry time of an association
  *
  * The stored expiry time is always replaced by @p newexp. The queue entry is
  * only moved (removed and re-inserted) when the new expiry is earlier than the
  * one previously stored; a later expiry leaves the entry where it is, to be
  * re-queued when its current slot is processed.
  *
  * @param la Pointer to the relevant libalias instance
  * @param assoc pointer to sctp association
  * @param newexp New expiration time
  */
 static void
 sctp_ResetTimeOut(struct libalias *la, struct sctp_nat_assoc *assoc, int newexp)
 {
 	/* Decide before overwriting exp: only an earlier expiry needs a move. */
 	int requeue = (newexp < assoc->exp);

 	if (requeue)
 		sctp_RmTimeOut(la, assoc);
 	assoc->exp = newexp;
 	if (requeue)
 		sctp_AddTimeOut(la, assoc);
 }
 
 /** @ingroup Timer
  * @brief Process the timer queue up to the current time
  *
  * Advances through the timer queue one slot per time step, from the last
  * processed position until the queue time has passed LibAliasTime. Every
  * association found in a visited slot is unlinked from that slot and then
  * either:
  * - re-queued at its real expiry position, if its expiry time is still in the
  *   future, or
  * - logged as expired, removed from the NAT tables and freed together with
  *   its global address list.
  *
  * @param la  Pointer to the relevant libalias instance
  */
 void
 sctp_CheckTimers(struct libalias *la)
 {
 	struct sctp_nat_assoc *assoc;

 	LIBALIAS_LOCK_ASSERT(la);
 	while (LibAliasTime >= la->sctpNatTimer.loc_time) {
 		/* Drain the slot that belongs to the current queue time. */
 		while ((assoc = LIST_FIRST(
 		    &la->sctpNatTimer.TimerQ[la->sctpNatTimer.cur_loc])) != NULL) {
 			LIST_REMOVE(assoc, timer_Q);
 			if (LibAliasTime < assoc->exp) {
 				/* expiry was pushed back since queuing: reschedule */
 				sctp_AddTimeOut(la, assoc);
 				continue;
 			}
 			/* state expired */
 			SN_LOG(((assoc->state == SN_CL) ? (SN_LOG_DEBUG) : (SN_LOG_INFO)),
 			    logsctperror("Timer Expired", assoc->g_vtag, assoc->state, SN_TO_NODIR));
 			RmSctpAssoc(la, assoc);
 			freeGlobalAddressList(assoc);
 			sn_free(assoc);
 		}
 		/* Step the queue time and slot index, wrapping the index. */
 		la->sctpNatTimer.loc_time++;
 		la->sctpNatTimer.cur_loc++;
 		if (la->sctpNatTimer.cur_loc >= SN_TIMER_QUEUE_SIZE)
 			la->sctpNatTimer.cur_loc = 0;
 	}
 }
 
 /* ----------------------------------------------------------------------
  *                              LOGGING CODE
  * ----------------------------------------------------------------------
  */
 /** @addtogroup Logging
  *
  * The logging functions provide logging of different items ranging from logging
  * a simple message, through logging an association details to logging the
  * current state of the NAT tables
  */
 /** @ingroup Logging
  * @brief Log an sctp nat error line
  *
  * Emits one line of the form "->D msg (vt=VTAG) ERR", where D is 'L' for
  * packets heading to the local side, 'G' for packets heading to the global
  * side and '*' for any other direction value.
  *
  * @param errormsg Error message to be logged
  * @param vtag Current Vtag (converted with ntohl() before printing)
  * @param error Error number
  * @param direction Direction of packet
  */
 static void
 logsctperror(char *errormsg, uint32_t vtag, int error, int direction)
 {
 	char dir = '*';

 	if (direction == SN_TO_LOCAL)
 		dir = 'L';
 	else if (direction == SN_TO_GLOBAL)
 		dir = 'G';

 	SctpAliasLog("->%c %s (vt=%u) %d\n", dir, errormsg, ntohl(vtag), error);
 }
 
 /** @ingroup Logging
  * @brief Log the result of parsing a packet
  *
  * Prints "Parsed: <direction> <message type>". Unknown directions print an
  * empty direction string; unknown message types print "***ERROR***".
  *
  * @param direction Direction of packet
  * @param sm Pointer to sctp message information
  */
 static void
 logsctpparse(int direction, struct sctp_nat_msg *sm)
 {
 	char *where = "";
 	char *what = "***ERROR***";

 	if (direction == SN_TO_LOCAL)
 		where = "TO_LOCAL -";
 	else if (direction == SN_TO_GLOBAL)
 		where = "TO_GLOBAL -";

 	switch (sm->msg) {
 	case SN_SCTP_INIT:	what = "Init";		break;
 	case SN_SCTP_INITACK:	what = "InitAck";	break;
 	case SN_SCTP_ABORT:	what = "Abort";		break;
 	case SN_SCTP_SHUTACK:	what = "ShutAck";	break;
 	case SN_SCTP_SHUTCOMP:	what = "ShutComp";	break;
 	case SN_SCTP_ASCONF:	what = "Asconf";	break;
 	case SN_SCTP_ASCONFACK:	what = "AsconfAck";	break;
 	case SN_SCTP_OTHER:	what = "Other";		break;
 	default:
 		/* keep the "***ERROR***" marker */
 		break;
 	}
 	SctpAliasLog("Parsed: %s %s\n", where, what);
 }
 
 /** @ingroup Logging
  * @brief Log an SCTP association's details
  *
  * Prints one summary line (state, expiry, local address, vtags, ports and
  * table register) followed by one line per entry of the association's global
  * address list.
  *
  * @param assoc pointer to sctp association
  * @param s String printed in front of "Assoc:" on the summary line
  */
 static void logsctpassoc(struct sctp_nat_assoc *assoc, char *s)
 {
 	struct sctp_GlobalAddress *ga;
 	char *state_name = "***ERROR***";
 	char addrbuf[INET_ADDRSTRLEN];

 	switch (assoc->state) {
 	case SN_ID:	state_name = "ID ";	break;
 	case SN_INi:	state_name = "INi ";	break;
 	case SN_INa:	state_name = "INa ";	break;
 	case SN_UP:	state_name = "UP ";	break;
 	case SN_CL:	state_name = "CL ";	break;
 	case SN_RM:	state_name = "RM ";	break;
 	default:
 		/* unknown state: keep the "***ERROR***" marker */
 		break;
 	}

 	SctpAliasLog("%sAssoc: %s exp=%u la=%s lv=%u lp=%u gv=%u gp=%u tbl=%d\n",
 	    s, state_name, assoc->exp, inet_ntoa_r(assoc->l_addr, addrbuf),
 	    ntohl(assoc->l_vtag), ntohs(assoc->l_port),
 	    ntohl(assoc->g_vtag), ntohs(assoc->g_port),
 	    assoc->TableRegister);

 	/* list global addresses; addrbuf is reused for every entry */
 	for (ga = LIST_FIRST(&(assoc->Gaddr)); ga != NULL;
 	    ga = LIST_NEXT(ga, list_Gaddr)) {
 		SctpAliasLog("\t\tga=%s\n",
 		    inet_ntoa_r(ga->g_addr, addrbuf));
 	}
 }
 
 /** @ingroup Logging
  * @brief Dump the global lookup table to the log
  *
  * Writes a "G->" header and then logs every association linked into each
  * bucket of the global table, in bucket order.
  *
  * @param la Pointer to the relevant libalias instance
  */
 static void logSctpGlobal(struct libalias *la)
 {
 	struct sctp_nat_assoc *entry;
 	u_int bucket;

 	SctpAliasLog("G->\n");
 	for (bucket = 0; bucket < la->sctpNatTableSize; bucket++) {
 		for (entry = LIST_FIRST(&la->sctpTableGlobal[bucket]);
 		    entry != NULL; entry = LIST_NEXT(entry, list_G)) {
 			logsctpassoc(entry, " ");
 		}
 	}
 }
 
 /** @ingroup Logging
  * @brief Dump the local lookup table to the log
  *
  * Writes an "L->" header and then logs every association linked into each
  * bucket of the local table, in bucket order.
  *
  * @param la Pointer to the relevant libalias instance
  */
 static void logSctpLocal(struct libalias *la)
 {
 	struct sctp_nat_assoc *entry;
 	u_int bucket;

 	SctpAliasLog("L->\n");
 	for (bucket = 0; bucket < la->sctpNatTableSize; bucket++) {
 		for (entry = LIST_FIRST(&la->sctpTableLocal[bucket]);
 		    entry != NULL; entry = LIST_NEXT(entry, list_L)) {
 			logsctpassoc(entry, " ");
 		}
 	}
 }
 
 /** @ingroup Logging
  * @brief Output timer queue to log
  *
  * Writes a "t->" header and then, for every slot of the timer queue, logs each
  * association linked into that slot. Each association line is prefixed with
  * " l=<slot index> " so the queue position is visible in the log.
  *
  * @param la Pointer to the relevant libalias instance
  */
 static void logTimerQ(struct libalias *la)
 {
 	/*
 	 * Scratch space for the per-line prefix. Kept on the stack (rather than
 	 * function-static) so calls on different libalias instances never share
 	 * the buffer; the prefix is consumed by logsctpassoc() before the next
 	 * one is formatted.
 	 */
 	char buf[50];
 	u_int i;
 	struct sctp_nat_assoc *assoc = NULL;

 	SctpAliasLog("t->\n");
 	for (i = 0; i < SN_TIMER_QUEUE_SIZE; i++) {
 		LIST_FOREACH(assoc, &la->sctpNatTimer.TimerQ[i], timer_Q) {
 			snprintf(buf, sizeof(buf), " l=%u ", i);
 			logsctpassoc(assoc, buf);
 		}
 	}
 }
 
 /** @ingroup Logging
  * @brief Sctp NAT logging function
  *
  * This function is based on a similar function in alias_db.c
  *
  * Two variants are compiled depending on _KERNEL:
  * - with _KERNEL defined, the message is formatted into a local buffer of
  *   LIBALIAS_BUF_SIZE bytes and handed to log() with priority
  *   LOG_SECURITY | LOG_INFO, prefixed with "alias_sctp: ";
  * - otherwise the message is written to the given stdio stream, which is
  *   flushed after every message.
  *
  * @param stream (non-_KERNEL variant only) stdio stream to write to
  * @param format printf type string
  * @param ... arguments consumed by @p format
  */
 #ifdef _KERNEL
 static void
 SctpAliasLog(const char *format, ...)
 {
 	char buffer[LIBALIAS_BUF_SIZE];
 	va_list ap;
 	va_start(ap, format);
 	/* vsnprintf limits the write to the buffer size */
 	vsnprintf(buffer, LIBALIAS_BUF_SIZE, format, ap);
 	va_end(ap);
 	/* pass the text as a "%s" argument, never as the format string itself */
 	log(LOG_SECURITY | LOG_INFO, "alias_sctp: %s", buffer);
 }
 #else
 static void
 SctpAliasLog(FILE *stream, const char *format, ...)
 {
 	va_list ap;
 
 	va_start(ap, format);
 	vfprintf(stream, format, ap);
 	va_end(ap);
 	/* flush after each message */
 	fflush(stream);
 }
 #endif
diff --git a/sys/netinet/sctp_output.c b/sys/netinet/sctp_output.c
index fdea88002194..5b4fbb28e089 100644
--- a/sys/netinet/sctp_output.c
+++ b/sys/netinet/sctp_output.c
@@ -1,13842 +1,13842 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 2001-2008, by Cisco Systems, Inc. All rights reserved.
  * Copyright (c) 2008-2012, by Randall Stewart. All rights reserved.
  * Copyright (c) 2008-2012, by Michael Tuexen. All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are met:
  *
  * a) Redistributions of source code must retain the above copyright notice,
  *    this list of conditions and the following disclaimer.
  *
  * b) Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in
  *    the documentation and/or other materials provided with the distribution.
  *
  * c) Neither the name of Cisco Systems, Inc. nor the names of its
  *    contributors may be used to endorse or promote products derived
  *    from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
  * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  * THE POSSIBILITY OF SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <netinet/sctp_os.h>
 #include <sys/proc.h>
 #include <netinet/sctp_var.h>
 #include <netinet/sctp_sysctl.h>
 #include <netinet/sctp_header.h>
 #include <netinet/sctp_pcb.h>
 #include <netinet/sctputil.h>
 #include <netinet/sctp_output.h>
 #include <netinet/sctp_uio.h>
 #include <netinet/sctputil.h>
 #include <netinet/sctp_auth.h>
 #include <netinet/sctp_timer.h>
 #include <netinet/sctp_asconf.h>
 #include <netinet/sctp_indata.h>
 #include <netinet/sctp_bsd_addr.h>
 #include <netinet/sctp_input.h>
 #include <netinet/sctp_crc32.h>
 #include <netinet/sctp_kdtrace.h>
 #if defined(INET) || defined(INET6)
 #include <netinet/udp.h>
 #endif
 #include <netinet/udp_var.h>
 #include <machine/in_cksum.h>
 
 /* Number of gap slots carried by each sack_track entry. */
 #define SCTP_MAX_GAPS_INARRAY 4
 /*
  * One precomputed description of the runs of set bits in an 8-bit value;
  * sack_array below holds one such entry for every possible byte.
  */
 struct sack_track {
 	uint8_t right_edge;	/* mergeable on the right edge; in sack_array: 1 when bit 0 of the index is set */
 	uint8_t left_edge;	/* mergeable on the left edge; in sack_array: 1 when bit 7 of the index is set */
 	uint8_t num_entries;	/* number of leading gaps[] slots in use (0..SCTP_MAX_GAPS_INARRAY) */
 	uint8_t spare;		/* always 0 in sack_array; presumably padding */
 	struct sctp_gap_ack_block gaps[SCTP_MAX_GAPS_INARRAY];	/* in sack_array: {first bit, last bit} of each run, lowest run first */
 };
 
 /*
  * Bit-run lookup table: one entry per possible 8-bit value (the index is
  * given in the trailing comment of each line).
  *
  * Entry layout: {right_edge, left_edge, num_entries, spare, {gaps...}}
  *  - right_edge  is 1 when bit 0 of the index is set,
  *  - left_edge   is 1 when bit 7 of the index is set,
  *  - num_entries is the number of runs of consecutive set bits,
  *  - gaps[]      lists those runs, lowest bit first, as
  *                {first bit, last bit}; unused slots are {0, 0}.
  *
  * Example: 0x0b = 00001011b has the runs 0..1 and 3..3, hence
  * {1, 0, 2, 0, {{0, 1}, {3, 3}, {0, 0}, {0, 0}}}.
  */
 const struct sack_track sack_array[256] = {
 	{0, 0, 0, 0, {{0, 0}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x00 */
 	{1, 0, 1, 0, {{0, 0}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x01 */
 	{0, 0, 1, 0, {{1, 1}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x02 */
 	{1, 0, 1, 0, {{0, 1}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x03 */
 	{0, 0, 1, 0, {{2, 2}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x04 */
 	{1, 0, 2, 0, {{0, 0}, {2, 2}, {0, 0}, {0, 0}}},	/* 0x05 */
 	{0, 0, 1, 0, {{1, 2}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x06 */
 	{1, 0, 1, 0, {{0, 2}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x07 */
 	{0, 0, 1, 0, {{3, 3}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x08 */
 	{1, 0, 2, 0, {{0, 0}, {3, 3}, {0, 0}, {0, 0}}},	/* 0x09 */
 	{0, 0, 2, 0, {{1, 1}, {3, 3}, {0, 0}, {0, 0}}},	/* 0x0a */
 	{1, 0, 2, 0, {{0, 1}, {3, 3}, {0, 0}, {0, 0}}},	/* 0x0b */
 	{0, 0, 1, 0, {{2, 3}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x0c */
 	{1, 0, 2, 0, {{0, 0}, {2, 3}, {0, 0}, {0, 0}}},	/* 0x0d */
 	{0, 0, 1, 0, {{1, 3}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x0e */
 	{1, 0, 1, 0, {{0, 3}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x0f */
 	{0, 0, 1, 0, {{4, 4}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x10 */
 	{1, 0, 2, 0, {{0, 0}, {4, 4}, {0, 0}, {0, 0}}},	/* 0x11 */
 	{0, 0, 2, 0, {{1, 1}, {4, 4}, {0, 0}, {0, 0}}},	/* 0x12 */
 	{1, 0, 2, 0, {{0, 1}, {4, 4}, {0, 0}, {0, 0}}},	/* 0x13 */
 	{0, 0, 2, 0, {{2, 2}, {4, 4}, {0, 0}, {0, 0}}},	/* 0x14 */
 	{1, 0, 3, 0, {{0, 0}, {2, 2}, {4, 4}, {0, 0}}},	/* 0x15 */
 	{0, 0, 2, 0, {{1, 2}, {4, 4}, {0, 0}, {0, 0}}},	/* 0x16 */
 	{1, 0, 2, 0, {{0, 2}, {4, 4}, {0, 0}, {0, 0}}},	/* 0x17 */
 	{0, 0, 1, 0, {{3, 4}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x18 */
 	{1, 0, 2, 0, {{0, 0}, {3, 4}, {0, 0}, {0, 0}}},	/* 0x19 */
 	{0, 0, 2, 0, {{1, 1}, {3, 4}, {0, 0}, {0, 0}}},	/* 0x1a */
 	{1, 0, 2, 0, {{0, 1}, {3, 4}, {0, 0}, {0, 0}}},	/* 0x1b */
 	{0, 0, 1, 0, {{2, 4}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x1c */
 	{1, 0, 2, 0, {{0, 0}, {2, 4}, {0, 0}, {0, 0}}},	/* 0x1d */
 	{0, 0, 1, 0, {{1, 4}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x1e */
 	{1, 0, 1, 0, {{0, 4}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x1f */
 	{0, 0, 1, 0, {{5, 5}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x20 */
 	{1, 0, 2, 0, {{0, 0}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x21 */
 	{0, 0, 2, 0, {{1, 1}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x22 */
 	{1, 0, 2, 0, {{0, 1}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x23 */
 	{0, 0, 2, 0, {{2, 2}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x24 */
 	{1, 0, 3, 0, {{0, 0}, {2, 2}, {5, 5}, {0, 0}}},	/* 0x25 */
 	{0, 0, 2, 0, {{1, 2}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x26 */
 	{1, 0, 2, 0, {{0, 2}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x27 */
 	{0, 0, 2, 0, {{3, 3}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x28 */
 	{1, 0, 3, 0, {{0, 0}, {3, 3}, {5, 5}, {0, 0}}},	/* 0x29 */
 	{0, 0, 3, 0, {{1, 1}, {3, 3}, {5, 5}, {0, 0}}},	/* 0x2a */
 	{1, 0, 3, 0, {{0, 1}, {3, 3}, {5, 5}, {0, 0}}},	/* 0x2b */
 	{0, 0, 2, 0, {{2, 3}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x2c */
 	{1, 0, 3, 0, {{0, 0}, {2, 3}, {5, 5}, {0, 0}}},	/* 0x2d */
 	{0, 0, 2, 0, {{1, 3}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x2e */
 	{1, 0, 2, 0, {{0, 3}, {5, 5}, {0, 0}, {0, 0}}},	/* 0x2f */
 	{0, 0, 1, 0, {{4, 5}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x30 */
 	{1, 0, 2, 0, {{0, 0}, {4, 5}, {0, 0}, {0, 0}}},	/* 0x31 */
 	{0, 0, 2, 0, {{1, 1}, {4, 5}, {0, 0}, {0, 0}}},	/* 0x32 */
 	{1, 0, 2, 0, {{0, 1}, {4, 5}, {0, 0}, {0, 0}}},	/* 0x33 */
 	{0, 0, 2, 0, {{2, 2}, {4, 5}, {0, 0}, {0, 0}}},	/* 0x34 */
 	{1, 0, 3, 0, {{0, 0}, {2, 2}, {4, 5}, {0, 0}}},	/* 0x35 */
 	{0, 0, 2, 0, {{1, 2}, {4, 5}, {0, 0}, {0, 0}}},	/* 0x36 */
 	{1, 0, 2, 0, {{0, 2}, {4, 5}, {0, 0}, {0, 0}}},	/* 0x37 */
 	{0, 0, 1, 0, {{3, 5}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x38 */
 	{1, 0, 2, 0, {{0, 0}, {3, 5}, {0, 0}, {0, 0}}},	/* 0x39 */
 	{0, 0, 2, 0, {{1, 1}, {3, 5}, {0, 0}, {0, 0}}},	/* 0x3a */
 	{1, 0, 2, 0, {{0, 1}, {3, 5}, {0, 0}, {0, 0}}},	/* 0x3b */
 	{0, 0, 1, 0, {{2, 5}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x3c */
 	{1, 0, 2, 0, {{0, 0}, {2, 5}, {0, 0}, {0, 0}}},	/* 0x3d */
 	{0, 0, 1, 0, {{1, 5}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x3e */
 	{1, 0, 1, 0, {{0, 5}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x3f */
 	{0, 0, 1, 0, {{6, 6}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x40 */
 	{1, 0, 2, 0, {{0, 0}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x41 */
 	{0, 0, 2, 0, {{1, 1}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x42 */
 	{1, 0, 2, 0, {{0, 1}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x43 */
 	{0, 0, 2, 0, {{2, 2}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x44 */
 	{1, 0, 3, 0, {{0, 0}, {2, 2}, {6, 6}, {0, 0}}},	/* 0x45 */
 	{0, 0, 2, 0, {{1, 2}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x46 */
 	{1, 0, 2, 0, {{0, 2}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x47 */
 	{0, 0, 2, 0, {{3, 3}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x48 */
 	{1, 0, 3, 0, {{0, 0}, {3, 3}, {6, 6}, {0, 0}}},	/* 0x49 */
 	{0, 0, 3, 0, {{1, 1}, {3, 3}, {6, 6}, {0, 0}}},	/* 0x4a */
 	{1, 0, 3, 0, {{0, 1}, {3, 3}, {6, 6}, {0, 0}}},	/* 0x4b */
 	{0, 0, 2, 0, {{2, 3}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x4c */
 	{1, 0, 3, 0, {{0, 0}, {2, 3}, {6, 6}, {0, 0}}},	/* 0x4d */
 	{0, 0, 2, 0, {{1, 3}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x4e */
 	{1, 0, 2, 0, {{0, 3}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x4f */
 	{0, 0, 2, 0, {{4, 4}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x50 */
 	{1, 0, 3, 0, {{0, 0}, {4, 4}, {6, 6}, {0, 0}}},	/* 0x51 */
 	{0, 0, 3, 0, {{1, 1}, {4, 4}, {6, 6}, {0, 0}}},	/* 0x52 */
 	{1, 0, 3, 0, {{0, 1}, {4, 4}, {6, 6}, {0, 0}}},	/* 0x53 */
 	{0, 0, 3, 0, {{2, 2}, {4, 4}, {6, 6}, {0, 0}}},	/* 0x54 */
 	{1, 0, 4, 0, {{0, 0}, {2, 2}, {4, 4}, {6, 6}}},	/* 0x55 */
 	{0, 0, 3, 0, {{1, 2}, {4, 4}, {6, 6}, {0, 0}}},	/* 0x56 */
 	{1, 0, 3, 0, {{0, 2}, {4, 4}, {6, 6}, {0, 0}}},	/* 0x57 */
 	{0, 0, 2, 0, {{3, 4}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x58 */
 	{1, 0, 3, 0, {{0, 0}, {3, 4}, {6, 6}, {0, 0}}},	/* 0x59 */
 	{0, 0, 3, 0, {{1, 1}, {3, 4}, {6, 6}, {0, 0}}},	/* 0x5a */
 	{1, 0, 3, 0, {{0, 1}, {3, 4}, {6, 6}, {0, 0}}},	/* 0x5b */
 	{0, 0, 2, 0, {{2, 4}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x5c */
 	{1, 0, 3, 0, {{0, 0}, {2, 4}, {6, 6}, {0, 0}}},	/* 0x5d */
 	{0, 0, 2, 0, {{1, 4}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x5e */
 	{1, 0, 2, 0, {{0, 4}, {6, 6}, {0, 0}, {0, 0}}},	/* 0x5f */
 	{0, 0, 1, 0, {{5, 6}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x60 */
 	{1, 0, 2, 0, {{0, 0}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x61 */
 	{0, 0, 2, 0, {{1, 1}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x62 */
 	{1, 0, 2, 0, {{0, 1}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x63 */
 	{0, 0, 2, 0, {{2, 2}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x64 */
 	{1, 0, 3, 0, {{0, 0}, {2, 2}, {5, 6}, {0, 0}}},	/* 0x65 */
 	{0, 0, 2, 0, {{1, 2}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x66 */
 	{1, 0, 2, 0, {{0, 2}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x67 */
 	{0, 0, 2, 0, {{3, 3}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x68 */
 	{1, 0, 3, 0, {{0, 0}, {3, 3}, {5, 6}, {0, 0}}},	/* 0x69 */
 	{0, 0, 3, 0, {{1, 1}, {3, 3}, {5, 6}, {0, 0}}},	/* 0x6a */
 	{1, 0, 3, 0, {{0, 1}, {3, 3}, {5, 6}, {0, 0}}},	/* 0x6b */
 	{0, 0, 2, 0, {{2, 3}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x6c */
 	{1, 0, 3, 0, {{0, 0}, {2, 3}, {5, 6}, {0, 0}}},	/* 0x6d */
 	{0, 0, 2, 0, {{1, 3}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x6e */
 	{1, 0, 2, 0, {{0, 3}, {5, 6}, {0, 0}, {0, 0}}},	/* 0x6f */
 	{0, 0, 1, 0, {{4, 6}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x70 */
 	{1, 0, 2, 0, {{0, 0}, {4, 6}, {0, 0}, {0, 0}}},	/* 0x71 */
 	{0, 0, 2, 0, {{1, 1}, {4, 6}, {0, 0}, {0, 0}}},	/* 0x72 */
 	{1, 0, 2, 0, {{0, 1}, {4, 6}, {0, 0}, {0, 0}}},	/* 0x73 */
 	{0, 0, 2, 0, {{2, 2}, {4, 6}, {0, 0}, {0, 0}}},	/* 0x74 */
 	{1, 0, 3, 0, {{0, 0}, {2, 2}, {4, 6}, {0, 0}}},	/* 0x75 */
 	{0, 0, 2, 0, {{1, 2}, {4, 6}, {0, 0}, {0, 0}}},	/* 0x76 */
 	{1, 0, 2, 0, {{0, 2}, {4, 6}, {0, 0}, {0, 0}}},	/* 0x77 */
 	{0, 0, 1, 0, {{3, 6}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x78 */
 	{1, 0, 2, 0, {{0, 0}, {3, 6}, {0, 0}, {0, 0}}},	/* 0x79 */
 	{0, 0, 2, 0, {{1, 1}, {3, 6}, {0, 0}, {0, 0}}},	/* 0x7a */
 	{1, 0, 2, 0, {{0, 1}, {3, 6}, {0, 0}, {0, 0}}},	/* 0x7b */
 	{0, 0, 1, 0, {{2, 6}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x7c */
 	{1, 0, 2, 0, {{0, 0}, {2, 6}, {0, 0}, {0, 0}}},	/* 0x7d */
 	{0, 0, 1, 0, {{1, 6}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x7e */
 	{1, 0, 1, 0, {{0, 6}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x7f */
 	{0, 1, 1, 0, {{7, 7}, {0, 0}, {0, 0}, {0, 0}}},	/* 0x80 */
 	{1, 1, 2, 0, {{0, 0}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x81 */
 	{0, 1, 2, 0, {{1, 1}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x82 */
 	{1, 1, 2, 0, {{0, 1}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x83 */
 	{0, 1, 2, 0, {{2, 2}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x84 */
 	{1, 1, 3, 0, {{0, 0}, {2, 2}, {7, 7}, {0, 0}}},	/* 0x85 */
 	{0, 1, 2, 0, {{1, 2}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x86 */
 	{1, 1, 2, 0, {{0, 2}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x87 */
 	{0, 1, 2, 0, {{3, 3}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x88 */
 	{1, 1, 3, 0, {{0, 0}, {3, 3}, {7, 7}, {0, 0}}},	/* 0x89 */
 	{0, 1, 3, 0, {{1, 1}, {3, 3}, {7, 7}, {0, 0}}},	/* 0x8a */
 	{1, 1, 3, 0, {{0, 1}, {3, 3}, {7, 7}, {0, 0}}},	/* 0x8b */
 	{0, 1, 2, 0, {{2, 3}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x8c */
 	{1, 1, 3, 0, {{0, 0}, {2, 3}, {7, 7}, {0, 0}}},	/* 0x8d */
 	{0, 1, 2, 0, {{1, 3}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x8e */
 	{1, 1, 2, 0, {{0, 3}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x8f */
 	{0, 1, 2, 0, {{4, 4}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x90 */
 	{1, 1, 3, 0, {{0, 0}, {4, 4}, {7, 7}, {0, 0}}},	/* 0x91 */
 	{0, 1, 3, 0, {{1, 1}, {4, 4}, {7, 7}, {0, 0}}},	/* 0x92 */
 	{1, 1, 3, 0, {{0, 1}, {4, 4}, {7, 7}, {0, 0}}},	/* 0x93 */
 	{0, 1, 3, 0, {{2, 2}, {4, 4}, {7, 7}, {0, 0}}},	/* 0x94 */
 	{1, 1, 4, 0, {{0, 0}, {2, 2}, {4, 4}, {7, 7}}},	/* 0x95 */
 	{0, 1, 3, 0, {{1, 2}, {4, 4}, {7, 7}, {0, 0}}},	/* 0x96 */
 	{1, 1, 3, 0, {{0, 2}, {4, 4}, {7, 7}, {0, 0}}},	/* 0x97 */
 	{0, 1, 2, 0, {{3, 4}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x98 */
 	{1, 1, 3, 0, {{0, 0}, {3, 4}, {7, 7}, {0, 0}}},	/* 0x99 */
 	{0, 1, 3, 0, {{1, 1}, {3, 4}, {7, 7}, {0, 0}}},	/* 0x9a */
 	{1, 1, 3, 0, {{0, 1}, {3, 4}, {7, 7}, {0, 0}}},	/* 0x9b */
 	{0, 1, 2, 0, {{2, 4}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x9c */
 	{1, 1, 3, 0, {{0, 0}, {2, 4}, {7, 7}, {0, 0}}},	/* 0x9d */
 	{0, 1, 2, 0, {{1, 4}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x9e */
 	{1, 1, 2, 0, {{0, 4}, {7, 7}, {0, 0}, {0, 0}}},	/* 0x9f */
 	{0, 1, 2, 0, {{5, 5}, {7, 7}, {0, 0}, {0, 0}}},	/* 0xa0 */
 	{1, 1, 3, 0, {{0, 0}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xa1 */
 	{0, 1, 3, 0, {{1, 1}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xa2 */
 	{1, 1, 3, 0, {{0, 1}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xa3 */
 	{0, 1, 3, 0, {{2, 2}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xa4 */
 	{1, 1, 4, 0, {{0, 0}, {2, 2}, {5, 5}, {7, 7}}},	/* 0xa5 */
 	{0, 1, 3, 0, {{1, 2}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xa6 */
 	{1, 1, 3, 0, {{0, 2}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xa7 */
 	{0, 1, 3, 0, {{3, 3}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xa8 */
 	{1, 1, 4, 0, {{0, 0}, {3, 3}, {5, 5}, {7, 7}}},	/* 0xa9 */
 	{0, 1, 4, 0, {{1, 1}, {3, 3}, {5, 5}, {7, 7}}},	/* 0xaa */
 	{1, 1, 4, 0, {{0, 1}, {3, 3}, {5, 5}, {7, 7}}},	/* 0xab */
 	{0, 1, 3, 0, {{2, 3}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xac */
 	{1, 1, 4, 0, {{0, 0}, {2, 3}, {5, 5}, {7, 7}}},	/* 0xad */
 	{0, 1, 3, 0, {{1, 3}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xae */
 	{1, 1, 3, 0, {{0, 3}, {5, 5}, {7, 7}, {0, 0}}},	/* 0xaf */
 	{0, 1, 2, 0, {{4, 5}, {7, 7}, {0, 0}, {0, 0}}},	/* 0xb0 */
 	{1, 1, 3, 0, {{0, 0}, {4, 5}, {7, 7}, {0, 0}}},	/* 0xb1 */
 	{0, 1, 3, 0, {{1, 1}, {4, 5}, {7, 7}, {0, 0}}},	/* 0xb2 */
 	{1, 1, 3, 0, {{0, 1}, {4, 5}, {7, 7}, {0, 0}}},	/* 0xb3 */
 	{0, 1, 3, 0, {{2, 2}, {4, 5}, {7, 7}, {0, 0}}},	/* 0xb4 */
 	{1, 1, 4, 0, {{0, 0}, {2, 2}, {4, 5}, {7, 7}}},	/* 0xb5 */
 	{0, 1, 3, 0, {{1, 2}, {4, 5}, {7, 7}, {0, 0}}},	/* 0xb6 */
 	{1, 1, 3, 0, {{0, 2}, {4, 5}, {7, 7}, {0, 0}}},	/* 0xb7 */
 	{0, 1, 2, 0, {{3, 5}, {7, 7}, {0, 0}, {0, 0}}},	/* 0xb8 */
 	{1, 1, 3, 0, {{0, 0}, {3, 5}, {7, 7}, {0, 0}}},	/* 0xb9 */
 	{0, 1, 3, 0, {{1, 1}, {3, 5}, {7, 7}, {0, 0}}},	/* 0xba */
 	{1, 1, 3, 0, {{0, 1}, {3, 5}, {7, 7}, {0, 0}}},	/* 0xbb */
 	{0, 1, 2, 0, {{2, 5}, {7, 7}, {0, 0}, {0, 0}}},	/* 0xbc */
 	{1, 1, 3, 0, {{0, 0}, {2, 5}, {7, 7}, {0, 0}}},	/* 0xbd */
 	{0, 1, 2, 0, {{1, 5}, {7, 7}, {0, 0}, {0, 0}}},	/* 0xbe */
 	{1, 1, 2, 0, {{0, 5}, {7, 7}, {0, 0}, {0, 0}}},	/* 0xbf */
 	{0, 1, 1, 0, {{6, 7}, {0, 0}, {0, 0}, {0, 0}}},	/* 0xc0 */
 	{1, 1, 2, 0, {{0, 0}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xc1 */
 	{0, 1, 2, 0, {{1, 1}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xc2 */
 	{1, 1, 2, 0, {{0, 1}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xc3 */
 	{0, 1, 2, 0, {{2, 2}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xc4 */
 	{1, 1, 3, 0, {{0, 0}, {2, 2}, {6, 7}, {0, 0}}},	/* 0xc5 */
 	{0, 1, 2, 0, {{1, 2}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xc6 */
 	{1, 1, 2, 0, {{0, 2}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xc7 */
 	{0, 1, 2, 0, {{3, 3}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xc8 */
 	{1, 1, 3, 0, {{0, 0}, {3, 3}, {6, 7}, {0, 0}}},	/* 0xc9 */
 	{0, 1, 3, 0, {{1, 1}, {3, 3}, {6, 7}, {0, 0}}},	/* 0xca */
 	{1, 1, 3, 0, {{0, 1}, {3, 3}, {6, 7}, {0, 0}}},	/* 0xcb */
 	{0, 1, 2, 0, {{2, 3}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xcc */
 	{1, 1, 3, 0, {{0, 0}, {2, 3}, {6, 7}, {0, 0}}},	/* 0xcd */
 	{0, 1, 2, 0, {{1, 3}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xce */
 	{1, 1, 2, 0, {{0, 3}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xcf */
 	{0, 1, 2, 0, {{4, 4}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xd0 */
 	{1, 1, 3, 0, {{0, 0}, {4, 4}, {6, 7}, {0, 0}}},	/* 0xd1 */
 	{0, 1, 3, 0, {{1, 1}, {4, 4}, {6, 7}, {0, 0}}},	/* 0xd2 */
 	{1, 1, 3, 0, {{0, 1}, {4, 4}, {6, 7}, {0, 0}}},	/* 0xd3 */
 	{0, 1, 3, 0, {{2, 2}, {4, 4}, {6, 7}, {0, 0}}},	/* 0xd4 */
 	{1, 1, 4, 0, {{0, 0}, {2, 2}, {4, 4}, {6, 7}}},	/* 0xd5 */
 	{0, 1, 3, 0, {{1, 2}, {4, 4}, {6, 7}, {0, 0}}},	/* 0xd6 */
 	{1, 1, 3, 0, {{0, 2}, {4, 4}, {6, 7}, {0, 0}}},	/* 0xd7 */
 	{0, 1, 2, 0, {{3, 4}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xd8 */
 	{1, 1, 3, 0, {{0, 0}, {3, 4}, {6, 7}, {0, 0}}},	/* 0xd9 */
 	{0, 1, 3, 0, {{1, 1}, {3, 4}, {6, 7}, {0, 0}}},	/* 0xda */
 	{1, 1, 3, 0, {{0, 1}, {3, 4}, {6, 7}, {0, 0}}},	/* 0xdb */
 	{0, 1, 2, 0, {{2, 4}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xdc */
 	{1, 1, 3, 0, {{0, 0}, {2, 4}, {6, 7}, {0, 0}}},	/* 0xdd */
 	{0, 1, 2, 0, {{1, 4}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xde */
 	{1, 1, 2, 0, {{0, 4}, {6, 7}, {0, 0}, {0, 0}}},	/* 0xdf */
 	{0, 1, 1, 0, {{5, 7}, {0, 0}, {0, 0}, {0, 0}}},	/* 0xe0 */
 	{1, 1, 2, 0, {{0, 0}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xe1 */
 	{0, 1, 2, 0, {{1, 1}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xe2 */
 	{1, 1, 2, 0, {{0, 1}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xe3 */
 	{0, 1, 2, 0, {{2, 2}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xe4 */
 	{1, 1, 3, 0, {{0, 0}, {2, 2}, {5, 7}, {0, 0}}},	/* 0xe5 */
 	{0, 1, 2, 0, {{1, 2}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xe6 */
 	{1, 1, 2, 0, {{0, 2}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xe7 */
 	{0, 1, 2, 0, {{3, 3}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xe8 */
 	{1, 1, 3, 0, {{0, 0}, {3, 3}, {5, 7}, {0, 0}}},	/* 0xe9 */
 	{0, 1, 3, 0, {{1, 1}, {3, 3}, {5, 7}, {0, 0}}},	/* 0xea */
 	{1, 1, 3, 0, {{0, 1}, {3, 3}, {5, 7}, {0, 0}}},	/* 0xeb */
 	{0, 1, 2, 0, {{2, 3}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xec */
 	{1, 1, 3, 0, {{0, 0}, {2, 3}, {5, 7}, {0, 0}}},	/* 0xed */
 	{0, 1, 2, 0, {{1, 3}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xee */
 	{1, 1, 2, 0, {{0, 3}, {5, 7}, {0, 0}, {0, 0}}},	/* 0xef */
 	{0, 1, 1, 0, {{4, 7}, {0, 0}, {0, 0}, {0, 0}}},	/* 0xf0 */
 	{1, 1, 2, 0, {{0, 0}, {4, 7}, {0, 0}, {0, 0}}},	/* 0xf1 */
 	{0, 1, 2, 0, {{1, 1}, {4, 7}, {0, 0}, {0, 0}}},	/* 0xf2 */
 	{1, 1, 2, 0, {{0, 1}, {4, 7}, {0, 0}, {0, 0}}},	/* 0xf3 */
 	{0, 1, 2, 0, {{2, 2}, {4, 7}, {0, 0}, {0, 0}}},	/* 0xf4 */
 	{1, 1, 3, 0, {{0, 0}, {2, 2}, {4, 7}, {0, 0}}},	/* 0xf5 */
 	{0, 1, 2, 0, {{1, 2}, {4, 7}, {0, 0}, {0, 0}}},	/* 0xf6 */
 	{1, 1, 2, 0, {{0, 2}, {4, 7}, {0, 0}, {0, 0}}},	/* 0xf7 */
 	{0, 1, 1, 0, {{3, 7}, {0, 0}, {0, 0}, {0, 0}}},	/* 0xf8 */
 	{1, 1, 2, 0, {{0, 0}, {3, 7}, {0, 0}, {0, 0}}},	/* 0xf9 */
 	{0, 1, 2, 0, {{1, 1}, {3, 7}, {0, 0}, {0, 0}}},	/* 0xfa */
 	{1, 1, 2, 0, {{0, 1}, {3, 7}, {0, 0}, {0, 0}}},	/* 0xfb */
 	{0, 1, 1, 0, {{2, 7}, {0, 0}, {0, 0}, {0, 0}}},	/* 0xfc */
 	{1, 1, 2, 0, {{0, 0}, {2, 7}, {0, 0}, {0, 0}}},	/* 0xfd */
 	{0, 1, 1, 0, {{1, 7}, {0, 0}, {0, 0}, {0, 0}}},	/* 0xfe */
 	{1, 1, 1, 0, {{0, 7}, {0, 0}, {0, 0}, {0, 0}}}	/* 0xff */
 };
 
 /*
  * Decide whether an interface address may be used under the given scoping
  * rules. Returns 1 when the address is in scope and 0 otherwise.
  *
  * An address is rejected when:
  *  - it sits on a loopback interface and loopback scope is off;
  *  - its family is not enabled in the scope (or is neither AF_INET nor
  *    AF_INET6, or support for that family is not compiled in);
  *  - IPv4: it is the unspecified address, or it is private while IPv4 local
  *    scope is off;
  *  - IPv6: it is flagged unusable, unspecified, link-local (always), or
  *    site-local while site scope is off.
  *
  * When do_update is non-zero the IPv6 path refreshes the cached interface
  * address flags before testing them.
  */
 int
 sctp_is_address_in_scope(struct sctp_ifa *ifa,
     struct sctp_scoping *scope,
     int do_update)
 {
 	/* skip loopback if not in scope */
 	if ((scope->loopback_scope == 0) &&
 	    (ifa->ifn_p) && SCTP_IFN_IS_IFT_LOOP(ifa->ifn_p)) {
 		return (0);
 	}
 	switch (ifa->address.sa.sa_family) {
 #ifdef INET
 	case AF_INET:
 		{
 			struct sockaddr_in *sin;

 			if (!scope->ipv4_addr_legal) {
 				return (0);
 			}
 			sin = &ifa->address.sin;
 			if (sin->sin_addr.s_addr == 0) {
 				/* not in scope , unspecified */
 				return (0);
 			}
 			if ((scope->ipv4_local_scope == 0) &&
 			    (IN4_ISPRIVATE_ADDRESS(&sin->sin_addr))) {
 				/* private address not in scope */
 				return (0);
 			}
 			break;
 		}
 #endif
 #ifdef INET6
 	case AF_INET6:
 		{
 			struct sockaddr_in6 *sin6;

 			if (!scope->ipv6_addr_legal) {
 				return (0);
 			}
 			/*
 			 * Must update the flags,  bummer, which means any
 			 * IFA locks must now be applied HERE <->
 			 */
 			if (do_update) {
 				sctp_gather_internal_ifa_flags(ifa);
 			}
 			if (ifa->localifa_flags & SCTP_ADDR_IFA_UNUSEABLE) {
 				return (0);
 			}
 			/* ok to use deprecated addresses? */
 			sin6 = &ifa->address.sin6;
 			if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) {
 				/* skip unspecified addresses */
 				return (0);
 			}
 			/* link-local is rejected regardless of any scope flag */
 			if (IN6_IS_ADDR_LINKLOCAL(&sin6->sin6_addr)) {
 				return (0);
 			}
 			if ((scope->site_scope == 0) &&
 			    (IN6_IS_ADDR_SITELOCAL(&sin6->sin6_addr))) {
 				return (0);
 			}
 			break;
 		}
 #endif
 	default:
 		return (0);
 	}
 	return (1);
 }
 
 /*
  * Append one IPv4 or IPv6 address parameter describing ifa to the mbuf
  * chain that starts at m.
  *
  * When m itself has enough trailing space the parameter is written there;
  * otherwise the chain is walked to its last mbuf and a newly allocated
  * mbuf is linked behind it to hold the parameter.
  *
  * Returns the mbuf that received the parameter.  For an address family
  * that is not compiled in, or when the allocation fails, m is returned
  * and nothing is added.  When len is not NULL, *len is increased by the
  * parameter length on success only.
  */
 static struct mbuf *
 sctp_add_addr_to_mbuf(struct mbuf *m, struct sctp_ifa *ifa, uint16_t *len)
 {
 #if defined(INET) || defined(INET6)
 	struct sctp_paramhdr *paramh;
 	struct mbuf *mret;
 	uint16_t plen;
 #endif
 
 	/* Work out the parameter size; bail out on unsupported families. */
 	switch (ifa->address.sa.sa_family) {
 #ifdef INET
 	case AF_INET:
 		plen = (uint16_t)sizeof(struct sctp_ipv4addr_param);
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		plen = (uint16_t)sizeof(struct sctp_ipv6addr_param);
 		break;
 #endif
 	default:
 		return (m);
 	}
 #if defined(INET) || defined(INET6)
 	/* Only m itself is checked for room, not the tail of its chain. */
 	if (M_TRAILINGSPACE(m) >= plen) {
 		/* easy side we just drop it on the end */
 		paramh = (struct sctp_paramhdr *)(SCTP_BUF_AT(m, SCTP_BUF_LEN(m)));
 		mret = m;
 	} else {
 		/* Need more space */
 		mret = m;
 		while (SCTP_BUF_NEXT(mret) != NULL) {
 			mret = SCTP_BUF_NEXT(mret);
 		}
 		/*
 		 * NOTE(review): the new mbuf's length is only incremented
 		 * by plen below, so it is presumably 0 when it comes back
 		 * from sctp_get_mbuf_for_msg() -- confirm.
 		 */
 		SCTP_BUF_NEXT(mret) = sctp_get_mbuf_for_msg(plen, 0, M_NOWAIT, 1, MT_DATA);
 		if (SCTP_BUF_NEXT(mret) == NULL) {
 			/* We are hosed, can't add more addresses */
 			return (m);
 		}
 		mret = SCTP_BUF_NEXT(mret);
 		paramh = mtod(mret, struct sctp_paramhdr *);
 	}
 	/* now add the parameter */
 	switch (ifa->address.sa.sa_family) {
 #ifdef INET
 	case AF_INET:
 		{
 			struct sctp_ipv4addr_param *ipv4p;
 			struct sockaddr_in *sin;
 
 			sin = &ifa->address.sin;
 			ipv4p = (struct sctp_ipv4addr_param *)paramh;
 			/* type and length go on the wire in network order */
 			paramh->param_type = htons(SCTP_IPV4_ADDRESS);
 			paramh->param_length = htons(plen);
 			ipv4p->addr = sin->sin_addr.s_addr;
 			SCTP_BUF_LEN(mret) += plen;
 			break;
 		}
 #endif
 #ifdef INET6
 	case AF_INET6:
 		{
 			struct sctp_ipv6addr_param *ipv6p;
 			struct sockaddr_in6 *sin6;
 
 			sin6 = &ifa->address.sin6;
 			ipv6p = (struct sctp_ipv6addr_param *)paramh;
 			/* type and length go on the wire in network order */
 			paramh->param_type = htons(SCTP_IPV6_ADDRESS);
 			paramh->param_length = htons(plen);
 			memcpy(ipv6p->addr, &sin6->sin6_addr,
 			    sizeof(ipv6p->addr));
 			/* clear embedded scope in the address */
 			in6_clearscope((struct in6_addr *)ipv6p->addr);
 			SCTP_BUF_LEN(mret) += plen;
 			break;
 		}
 #endif
 	default:
 		/* not reachable after the first switch; kept for safety */
 		return (m);
 	}
 	/* Account for the new parameter in the caller's running length. */
 	if (len != NULL) {
 		*len += plen;
 	}
 	return (mret);
 #endif
 }
 
 /*
  * Append the endpoint's usable local addresses, as address parameters, to
  * the chunk under construction in m_at.
  *
  * inp           endpoint whose addresses are listed; its default VRF and
  *               jail credentials are used.
  * stcb          association used for the restricted-address check in the
  *               bound-all case (sctp_is_addr_restricted() accepts NULL).
  * scope         scoping rules each address must satisfy.
  * m_at          mbuf currently being filled.
  * cnt_inits_to  starting value of the address counter.
  * padding_len,
  * chunk_len     optional; when both are non-NULL and *padding_len is
  *               non-zero, the pending padding is zero-filled and folded
  *               into *chunk_len before the first address is appended.
  *               *chunk_len is then grown by every parameter added.
  *
  * Both branches make two passes: the first counts eligible addresses and
  * the second emits them, but only when the count is greater than one, so
  * that a single-address endpoint lets the packet source dictate its
  * address (NAT friendliness).
  *
  * Returns the mbuf that received the last parameter, or m_at unchanged
  * when nothing was added.  The address read lock is held for the whole
  * walk.
  */
 struct mbuf *
 sctp_add_addresses_to_i_ia(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
     struct sctp_scoping *scope,
     struct mbuf *m_at, int cnt_inits_to,
     uint16_t *padding_len, uint16_t *chunk_len)
 {
 	struct sctp_vrf *vrf = NULL;
 	int cnt, limit_out = 0, total_count;
 	uint32_t vrf_id;
 
 	vrf_id = inp->def_vrf_id;
 	SCTP_IPI_ADDR_RLOCK();
 	vrf = sctp_find_vrf(vrf_id);
 	if (vrf == NULL) {
 		SCTP_IPI_ADDR_RUNLOCK();
 		return (m_at);
 	}
 	if (inp->sctp_flags & SCTP_PCB_FLAGS_BOUNDALL) {
 		struct sctp_ifa *sctp_ifap;
 		struct sctp_ifn *sctp_ifnp;
 
 		cnt = cnt_inits_to;
 		if (vrf->total_ifa_count > SCTP_COUNT_LIMIT) {
 			/*
 			 * Too many addresses to count: go straight to the
 			 * emit pass in limited mode.
 			 */
 			limit_out = 1;
 			cnt = SCTP_ADDRESS_LIMIT;
 			goto skip_count;
 		}
 		/* Pass 1: count the eligible addresses. */
 		LIST_FOREACH(sctp_ifnp, &vrf->ifnlist, next_ifn) {
 			if ((scope->loopback_scope == 0) &&
 			    SCTP_IFN_IS_IFT_LOOP(sctp_ifnp)) {
 				/*
 				 * Skip loopback devices if loopback_scope
 				 * not set
 				 */
 				continue;
 			}
 			LIST_FOREACH(sctp_ifap, &sctp_ifnp->ifalist, next_ifa) {
 #ifdef INET
 				if ((sctp_ifap->address.sa.sa_family == AF_INET) &&
 				    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 				    &sctp_ifap->address.sin.sin_addr) != 0)) {
 					continue;
 				}
 #endif
 #ifdef INET6
 				if ((sctp_ifap->address.sa.sa_family == AF_INET6) &&
 				    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 				    &sctp_ifap->address.sin6.sin6_addr) != 0)) {
 					continue;
 				}
 #endif
 				if (sctp_is_addr_restricted(stcb, sctp_ifap)) {
 					continue;
 				}
 				if (sctp_is_address_in_scope(sctp_ifap, scope, 1) == 0) {
 					continue;
 				}
 				cnt++;
 				if (cnt > SCTP_ADDRESS_LIMIT) {
 					break;
 				}
 			}
 			if (cnt > SCTP_ADDRESS_LIMIT) {
 				break;
 			}
 		}
 skip_count:
 		if (cnt > 1) {
 			/* Pass 2: emit the eligible addresses. */
 			total_count = 0;
 			LIST_FOREACH(sctp_ifnp, &vrf->ifnlist, next_ifn) {
 				/* cnt now counts addresses on this interface */
 				cnt = 0;
 				if ((scope->loopback_scope == 0) &&
 				    SCTP_IFN_IS_IFT_LOOP(sctp_ifnp)) {
 					/*
 					 * Skip loopback devices if
 					 * loopback_scope not set
 					 */
 					continue;
 				}
 				LIST_FOREACH(sctp_ifap, &sctp_ifnp->ifalist, next_ifa) {
 #ifdef INET
 					if ((sctp_ifap->address.sa.sa_family == AF_INET) &&
 					    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 					    &sctp_ifap->address.sin.sin_addr) != 0)) {
 						continue;
 					}
 #endif
 #ifdef INET6
 					if ((sctp_ifap->address.sa.sa_family == AF_INET6) &&
 					    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 					    &sctp_ifap->address.sin6.sin6_addr) != 0)) {
 						continue;
 					}
 #endif
 					if (sctp_is_addr_restricted(stcb, sctp_ifap)) {
 						continue;
 					}
 					if (sctp_is_address_in_scope(sctp_ifap,
 					    scope, 0) == 0) {
 						continue;
 					}
 					/* flush pending padding before the first address */
 					if ((chunk_len != NULL) &&
 					    (padding_len != NULL) &&
 					    (*padding_len > 0)) {
 						memset(mtod(m_at, caddr_t)+*chunk_len, 0, *padding_len);
 						SCTP_BUF_LEN(m_at) += *padding_len;
 						*chunk_len += *padding_len;
 						*padding_len = 0;
 					}
 					m_at = sctp_add_addr_to_mbuf(m_at, sctp_ifap, chunk_len);
 					if (limit_out) {
 						cnt++;
 						total_count++;
 						if (cnt >= 2) {
 							/*
 							 * two from each
 							 * address
 							 */
 							break;
 						}
 						if (total_count > SCTP_ADDRESS_LIMIT) {
 							/* No more addresses */
 							break;
 						}
 					}
 				}
 				if (limit_out &&
 				    (total_count > SCTP_ADDRESS_LIMIT)) {
 					/*
 					 * The overall cap has been reached.
 					 * Leaving only the inner loop would
 					 * let every remaining interface add
 					 * one more address, so stop walking
 					 * the interfaces as well.
 					 */
 					break;
 				}
 			}
 		}
 	} else {
 		struct sctp_laddr *laddr;
 
 		cnt = cnt_inits_to;
 		/* First, how many ? */
 		LIST_FOREACH(laddr, &inp->sctp_addr_list, sctp_nxt_addr) {
 			if (laddr->ifa == NULL) {
 				continue;
 			}
 			if (laddr->ifa->localifa_flags & SCTP_BEING_DELETED)
 				/*
 				 * Address being deleted by the system, dont
 				 * list.
 				 */
 				continue;
 			if (laddr->action == SCTP_DEL_IP_ADDRESS) {
 				/*
 				 * Address being deleted on this ep don't
 				 * list.
 				 */
 				continue;
 			}
 			if (sctp_is_address_in_scope(laddr->ifa,
 			    scope, 1) == 0) {
 				continue;
 			}
 			cnt++;
 		}
 		/*
 		 * To get through a NAT we only list addresses if we have
 		 * more than one. That way if you just bind a single address
 		 * we let the source of the init dictate our address.
 		 */
 		if (cnt > 1) {
 			cnt = cnt_inits_to;
 			LIST_FOREACH(laddr, &inp->sctp_addr_list, sctp_nxt_addr) {
 				if (laddr->ifa == NULL) {
 					continue;
 				}
 				if (laddr->ifa->localifa_flags & SCTP_BEING_DELETED) {
 					continue;
 				}
 				if (laddr->action == SCTP_DEL_IP_ADDRESS) {
 					/*
 					 * Being deleted on this ep: the
 					 * counting pass above skipped it, so
 					 * it must not be listed here either.
 					 */
 					continue;
 				}
 				if (sctp_is_address_in_scope(laddr->ifa,
 				    scope, 0) == 0) {
 					continue;
 				}
 				/* flush pending padding before the first address */
 				if ((chunk_len != NULL) &&
 				    (padding_len != NULL) &&
 				    (*padding_len > 0)) {
 					memset(mtod(m_at, caddr_t)+*chunk_len, 0, *padding_len);
 					SCTP_BUF_LEN(m_at) += *padding_len;
 					*chunk_len += *padding_len;
 					*padding_len = 0;
 				}
 				m_at = sctp_add_addr_to_mbuf(m_at, laddr->ifa, chunk_len);
 				cnt++;
 				if (cnt >= SCTP_ADDRESS_LIMIT) {
 					break;
 				}
 			}
 		}
 	}
 	SCTP_IPI_ADDR_RUNLOCK();
 	return (m_at);
 }
 
 /*
  * Decide whether ifa is a "preferred" source address for a destination
  * described by dest_is_loop / dest_is_priv (a destination that is neither
  * is treated as global).  Returns ifa when it is preferred and NULL when
  * it is not, or when its family differs from fam.
  *
  * With L = loopback, P = private, G = global the outcome is:
  *
  *   dest L:  src L yes,  src P yes (v4) / no (v6),  src G yes (v4) / no (v6)
  *   dest P:  src L no,   src P yes,                 src G no
  *   dest G:  src L no,   src P no,                  src G yes
  *
  * IPv6 addresses flagged SCTP_ADDR_IFA_UNUSEABLE are never preferred.
  */
 static struct sctp_ifa *
 sctp_is_ifa_addr_preferred(struct sctp_ifa *ifa,
     uint8_t dest_is_loop,
     uint8_t dest_is_priv,
     sa_family_t fam)
 {
 	uint8_t dest_is_global;
 
 	if (ifa->address.sa.sa_family != fam) {
 		/* wrong address family, nothing to consider */
 		return (NULL);
 	}
 	/* a destination that is neither private nor loopback is global */
 	dest_is_global = ((dest_is_priv == 0) && (dest_is_loop == 0)) ? 1 : 0;
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "Is destination preferred:");
 	SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, &ifa->address.sa);
 #ifdef INET6
 	if (fam == AF_INET6) {
 		/* unusable (e.g. deprecated) addresses are not preferred */
 		if (ifa->localifa_flags & SCTP_ADDR_IFA_UNUSEABLE) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "NO:1\n");
 			return (NULL);
 		}
 		/* v6 only: private (non-loopback) source to a loopback dest */
 		if (dest_is_loop && ifa->src_is_priv && !ifa->src_is_loop) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "NO:2\n");
 			return (NULL);
 		}
 		/* v6 only: global source to a loopback dest */
 		if (dest_is_loop && ifa->src_is_glob) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "NO:3\n");
 			return (NULL);
 		}
 	}
 #endif
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "src_loop:%d src_priv:%d src_glob:%d\n",
 	    ifa->src_is_loop, ifa->src_is_priv, ifa->src_is_glob);
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "dest_loop:%d dest_priv:%d dest_glob:%d\n",
 	    dest_is_loop, dest_is_priv, dest_is_global);
 
 	/*
 	 * The remaining rules are grouped by destination scope; a private
 	 * destination and a global destination exclude each other.
 	 */
 	if (dest_is_priv) {
 		if (ifa->src_is_loop) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "NO:4\n");
 			return (NULL);
 		}
 		if (ifa->src_is_glob) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "NO:5\n");
 			return (NULL);
 		}
 	}
 	if (dest_is_global) {
 		if (ifa->src_is_loop) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "NO:6\n");
 			return (NULL);
 		}
 		if (ifa->src_is_priv) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "NO:7\n");
 			return (NULL);
 		}
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "YES\n");
 	return (ifa);
 }
 
 /*
  * Decide whether ifa is an "acceptable" source address for a destination
  * described by dest_is_loop / dest_is_priv (a destination that is neither
  * is treated as global).  This is looser than the preferred test: to
  * allow for NAT, a private source towards a global destination (and a
  * global source towards a private one) is let through.
  *
  * Returns ifa when acceptable; NULL when not, or when the family of ifa
  * differs from fam.
  *
  * With L = loopback, P = private, G = global the outcome is:
  *
  *   dest L:  src L yes,  src P yes (v4) / no (v6),  src G yes
  *   dest P:  src L no,   src P yes,                 src G yes (may not work)
  *   dest G:  src L no,   src P yes (may not work),  src G yes
  *
  * IPv6 addresses flagged SCTP_ADDR_IFA_UNUSEABLE are never acceptable.
  */
 static struct sctp_ifa *
 sctp_is_ifa_addr_acceptable(struct sctp_ifa *ifa,
     uint8_t dest_is_loop,
     uint8_t dest_is_priv,
     sa_family_t fam)
 {
 	uint8_t dest_is_global;
 
 	if (ifa->address.sa.sa_family != fam) {
 		/* wrong address family, nothing to consider */
 		SCTPDBG(SCTP_DEBUG_OUTPUT3, "ifa_fam:%d fam:%d\n",
 		    ifa->address.sa.sa_family, fam);
 		return (NULL);
 	}
 	SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT3, &ifa->address.sa);
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "dst_is_loop:%d dest_is_priv:%d\n",
 	    dest_is_loop, dest_is_priv);
 	/* a destination that is neither loopback nor private is global */
 	dest_is_global = ((dest_is_loop == 0) && (dest_is_priv == 0)) ? 1 : 0;
 #ifdef INET6
 	if (fam == AF_INET6) {
 		/* unusable (e.g. deprecated) addresses are rejected */
 		if (ifa->localifa_flags & SCTP_ADDR_IFA_UNUSEABLE) {
 			return (NULL);
 		}
 		/* special case: link-local source to a loopback dest */
 		if (ifa->src_is_priv && dest_is_loop) {
 			return (NULL);
 		}
 	}
 #endif
 	/* A loopback source is only good for a loopback destination. */
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "ifa->src_is_loop:%d dest_is_priv:%d\n",
 	    ifa->src_is_loop,
 	    dest_is_priv);
 	if (dest_is_priv && (ifa->src_is_loop == 1)) {
 		return (NULL);
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "ifa->src_is_loop:%d dest_is_glob:%d\n",
 	    ifa->src_is_loop,
 	    dest_is_global);
 	if (dest_is_global && (ifa->src_is_loop == 1)) {
 		return (NULL);
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "address is acceptable\n");
 	return (ifa);
 }
 
 /*
  * Report whether ifa is on the association's restricted-address list.
  * Returns 1 when it is, 0 when it is not or when there is no association
  * (stcb == NULL).  List entries without an ifa are logged and skipped.
  */
 int
 sctp_is_addr_restricted(struct sctp_tcb *stcb, struct sctp_ifa *ifa)
 {
 	struct sctp_laddr *entry;
 
 	if (stcb != NULL) {
 		LIST_FOREACH(entry, &stcb->asoc.sctp_restricted_addrs, sctp_nxt_addr) {
 			if (entry->ifa != NULL) {
 				if (entry->ifa == ifa) {
 					/* found it on the restricted list */
 					return (1);
 				}
 			} else {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "%s: NULL ifa\n",
 				    __func__);
 			}
 		}
 	}
 	/* no association, or not on its list: unrestricted */
 	return (0);
 }
 
 /*
  * Report whether ifa is bound to the endpoint inp with no action pending
  * on its list entry.  Returns 1 when such an entry exists, otherwise 0
  * (including when ifa is NULL).  List entries without an ifa are logged
  * and skipped.
  */
 int
 sctp_is_addr_in_ep(struct sctp_inpcb *inp, struct sctp_ifa *ifa)
 {
 	struct sctp_laddr *entry;
 
 	if (ifa != NULL) {
 		LIST_FOREACH(entry, &inp->sctp_addr_list, sctp_nxt_addr) {
 			if (entry->ifa != NULL) {
 				/* match on pointer identity, idle entries only */
 				if ((entry->ifa == ifa) && entry->action == 0) {
 					return (1);
 				}
 			} else {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "%s: NULL ifa\n",
 				    __func__);
 			}
 		}
 	}
 	return (0);
 }
 
 /*
  * Choose a source address for an endpoint that is bound to specific
  * addresses, using only the endpoint's own address list (no association
  * is consulted).
  *
  * The search runs in three steps and stops at the first hit:
  *   1. a preferred address on the interface the route emits on that is
  *      also bound to the endpoint;
  *   2. a preferred address anywhere on the endpoint's bound list;
  *   3. an acceptable address anywhere on the endpoint's bound list.
  * Steps 2 and 3 start at inp->next_addr_touse and wrap around to the head
  * of the list once.
  *
  * non_asoc_addr_ok is only looked at in step 1, where a zero value makes
  * addresses flagged SCTP_ADDR_DEFER_USE ineligible.
  *
  * Returns the chosen address with its refcount incremented, or NULL when
  * the VRF is unknown or no bound address qualifies.
  */
 static struct sctp_ifa *
 sctp_choose_boundspecific_inp(struct sctp_inpcb *inp,
     sctp_route_t *ro,
     uint32_t vrf_id,
     int non_asoc_addr_ok,
     uint8_t dest_is_priv,
     uint8_t dest_is_loop,
     sa_family_t fam)
 {
 	struct sctp_laddr *laddr, *starting_point;
 	void *ifn;
 	int resettotop = 0;
 	struct sctp_ifn *sctp_ifn;
 	struct sctp_ifa *sctp_ifa, *sifa;
 	struct sctp_vrf *vrf;
 	uint32_t ifn_index;
 
 	/* The VRF is only checked for existence here. */
 	vrf = sctp_find_vrf(vrf_id);
 	if (vrf == NULL)
 		return (NULL);
 
 	/* Map the route's outgoing interface to its SCTP interface entry. */
 	ifn = SCTP_GET_IFN_VOID_FROM_ROUTE(ro);
 	ifn_index = SCTP_GET_IF_INDEX_FROM_ROUTE(ro);
 	sctp_ifn = sctp_find_ifn(ifn, ifn_index);
 	/*
 	 * first question, is the ifn we will emit on in our list, if so, we
 	 * want such an address. Note that we first looked for a preferred
 	 * address.
 	 */
 	if (sctp_ifn) {
 		/* is a preferred one on the interface we route out? */
 		LIST_FOREACH(sctp_ifa, &sctp_ifn->ifalist, next_ifa) {
 #ifdef INET
 			/* skip IPv4 addresses the jail check rejects */
 			if ((sctp_ifa->address.sa.sa_family == AF_INET) &&
 			    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin.sin_addr) != 0)) {
 				continue;
 			}
 #endif
 #ifdef INET6
 			/* skip IPv6 addresses the jail check rejects */
 			if ((sctp_ifa->address.sa.sa_family == AF_INET6) &&
 			    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin6.sin6_addr) != 0)) {
 				continue;
 			}
 #endif
 			if ((sctp_ifa->localifa_flags & SCTP_ADDR_DEFER_USE) &&
 			    (non_asoc_addr_ok == 0))
 				continue;
 			sifa = sctp_is_ifa_addr_preferred(sctp_ifa,
 			    dest_is_loop,
 			    dest_is_priv, fam);
 			if (sifa == NULL)
 				continue;
 			/* it must also be one of the endpoint's bound addresses */
 			if (sctp_is_addr_in_ep(inp, sifa)) {
 				atomic_add_int(&sifa->refcount, 1);
 				return (sifa);
 			}
 		}
 	}
 	/*
 	 * ok, now we now need to find one on the list of the addresses. We
 	 * can't get one on the emitting interface so let's find first a
 	 * preferred one. If not that an acceptable one otherwise... we
 	 * return NULL.
 	 */
 	/* remember where we started so the acceptable pass can restart there */
 	starting_point = inp->next_addr_touse;
 once_again:
 	if (inp->next_addr_touse == NULL) {
 		inp->next_addr_touse = LIST_FIRST(&inp->sctp_addr_list);
 		/* we are scanning from the head, no further wrap needed */
 		resettotop = 1;
 	}
 	for (laddr = inp->next_addr_touse; laddr;
 	    laddr = LIST_NEXT(laddr, sctp_nxt_addr)) {
 		if (laddr->ifa == NULL) {
 			/* address has been removed */
 			continue;
 		}
 		if (laddr->action == SCTP_DEL_IP_ADDRESS) {
 			/* address is being deleted */
 			continue;
 		}
 		sifa = sctp_is_ifa_addr_preferred(laddr->ifa, dest_is_loop,
 		    dest_is_priv, fam);
 		if (sifa == NULL)
 			continue;
 		atomic_add_int(&sifa->refcount, 1);
 		return (sifa);
 	}
 	if (resettotop == 0) {
 		/* started mid-list: wrap around and scan from the head once */
 		inp->next_addr_touse = NULL;
 		goto once_again;
 	}
 
 	/* No preferred address: rewind and repeat with the looser test. */
 	inp->next_addr_touse = starting_point;
 	resettotop = 0;
 once_again_too:
 	if (inp->next_addr_touse == NULL) {
 		inp->next_addr_touse = LIST_FIRST(&inp->sctp_addr_list);
 		resettotop = 1;
 	}
 
 	/* ok, what about an acceptable address in the inp */
 	for (laddr = inp->next_addr_touse; laddr;
 	    laddr = LIST_NEXT(laddr, sctp_nxt_addr)) {
 		if (laddr->ifa == NULL) {
 			/* address has been removed */
 			continue;
 		}
 		if (laddr->action == SCTP_DEL_IP_ADDRESS) {
 			/* address is being deleted */
 			continue;
 		}
 		sifa = sctp_is_ifa_addr_acceptable(laddr->ifa, dest_is_loop,
 		    dest_is_priv, fam);
 		if (sifa == NULL)
 			continue;
 		atomic_add_int(&sifa->refcount, 1);
 		return (sifa);
 	}
 	if (resettotop == 0) {
 		/* started mid-list: wrap around and scan from the head once */
 		inp->next_addr_touse = NULL;
 		goto once_again_too;
 	}
 
 	/*
 	 * no address bound can be a source for the destination we are in
 	 * trouble
 	 */
 	return (NULL);
 }
 
 /*
  * Choose a source address for an association whose endpoint is bound to
  * specific addresses.
  *
  * The search runs in four steps and stops at the first hit:
  *   1. a preferred address on the emitting interface that is bound to the
  *      endpoint;
  *   2. an acceptable address on the emitting interface that is bound to
  *      the endpoint;
  *   3. a preferred address anywhere on the endpoint's bound list;
  *   4. an acceptable address anywhere on the endpoint's bound list.
  * Steps 3 and 4 start at stcb->asoc.last_used_address, wrap around to the
  * head of the list once, and record the chosen list entry back into
  * last_used_address.
  *
  * In every step an address on the association's restricted list is
  * rejected, unless non_asoc_addr_ok is set and sctp_is_addr_pending()
  * reports it as pending.  In steps 1 and 2 a zero non_asoc_addr_ok also
  * rules out addresses flagged SCTP_ADDR_DEFER_USE.
  *
  * Returns the chosen address with its refcount incremented, or NULL when
  * the VRF is unknown or nothing qualifies.
  *
  * NOTE(review): stcb is dereferenced without a NULL check from step 3 on;
  * callers presumably always pass a valid association -- confirm.
  */
 static struct sctp_ifa *
 sctp_choose_boundspecific_stcb(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     sctp_route_t *ro,
     uint32_t vrf_id,
     uint8_t dest_is_priv,
     uint8_t dest_is_loop,
     int non_asoc_addr_ok,
     sa_family_t fam)
 {
 	struct sctp_laddr *laddr, *starting_point;
 	void *ifn;
 	struct sctp_ifn *sctp_ifn;
 	struct sctp_ifa *sctp_ifa, *sifa;
 	uint8_t start_at_beginning = 0;
 	struct sctp_vrf *vrf;
 	uint32_t ifn_index;
 
 	/*
 	 * first question, is the ifn we will emit on in our list, if so, we
 	 * want that one.
 	 */
 	/* The VRF is only checked for existence here. */
 	vrf = sctp_find_vrf(vrf_id);
 	if (vrf == NULL)
 		return (NULL);
 
 	/* Map the route's outgoing interface to its SCTP interface entry. */
 	ifn = SCTP_GET_IFN_VOID_FROM_ROUTE(ro);
 	ifn_index = SCTP_GET_IF_INDEX_FROM_ROUTE(ro);
 	sctp_ifn = sctp_find_ifn(ifn, ifn_index);
 
 	/*
 	 * first question, is the ifn we will emit on in our list?  If so,
 	 * we want that one. First we look for a preferred. Second, we go
 	 * for an acceptable.
 	 */
 	if (sctp_ifn) {
 		/* first try for a preferred address on the ep */
 		LIST_FOREACH(sctp_ifa, &sctp_ifn->ifalist, next_ifa) {
 #ifdef INET
 			/* skip IPv4 addresses the jail check rejects */
 			if ((sctp_ifa->address.sa.sa_family == AF_INET) &&
 			    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin.sin_addr) != 0)) {
 				continue;
 			}
 #endif
 #ifdef INET6
 			/* skip IPv6 addresses the jail check rejects */
 			if ((sctp_ifa->address.sa.sa_family == AF_INET6) &&
 			    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin6.sin6_addr) != 0)) {
 				continue;
 			}
 #endif
 			if ((sctp_ifa->localifa_flags & SCTP_ADDR_DEFER_USE) && (non_asoc_addr_ok == 0))
 				continue;
 			if (sctp_is_addr_in_ep(inp, sctp_ifa)) {
 				sifa = sctp_is_ifa_addr_preferred(sctp_ifa, dest_is_loop, dest_is_priv, fam);
 				if (sifa == NULL)
 					continue;
 				/*
 				 * Restricted addresses are out, unless the
 				 * caller allows non-association addresses
 				 * and this one is pending.
 				 */
 				if (((non_asoc_addr_ok == 0) &&
 				    (sctp_is_addr_restricted(stcb, sifa))) ||
 				    (non_asoc_addr_ok &&
 				    (sctp_is_addr_restricted(stcb, sifa)) &&
 				    (!sctp_is_addr_pending(stcb, sifa)))) {
 					/* on the no-no list */
 					continue;
 				}
 				atomic_add_int(&sifa->refcount, 1);
 				return (sifa);
 			}
 		}
 		/* next try for an acceptable address on the ep */
 		LIST_FOREACH(sctp_ifa, &sctp_ifn->ifalist, next_ifa) {
 #ifdef INET
 			/* skip IPv4 addresses the jail check rejects */
 			if ((sctp_ifa->address.sa.sa_family == AF_INET) &&
 			    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin.sin_addr) != 0)) {
 				continue;
 			}
 #endif
 #ifdef INET6
 			/* skip IPv6 addresses the jail check rejects */
 			if ((sctp_ifa->address.sa.sa_family == AF_INET6) &&
 			    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin6.sin6_addr) != 0)) {
 				continue;
 			}
 #endif
 			if ((sctp_ifa->localifa_flags & SCTP_ADDR_DEFER_USE) && (non_asoc_addr_ok == 0))
 				continue;
 			if (sctp_is_addr_in_ep(inp, sctp_ifa)) {
 				sifa = sctp_is_ifa_addr_acceptable(sctp_ifa, dest_is_loop, dest_is_priv, fam);
 				if (sifa == NULL)
 					continue;
 				/* same restricted/pending rule as above */
 				if (((non_asoc_addr_ok == 0) &&
 				    (sctp_is_addr_restricted(stcb, sifa))) ||
 				    (non_asoc_addr_ok &&
 				    (sctp_is_addr_restricted(stcb, sifa)) &&
 				    (!sctp_is_addr_pending(stcb, sifa)))) {
 					/* on the no-no list */
 					continue;
 				}
 				atomic_add_int(&sifa->refcount, 1);
 				return (sifa);
 			}
 		}
 	}
 	/*
 	 * if we can't find one like that then we must look at all addresses
 	 * bound to pick one at first preferable then secondly acceptable.
 	 */
 	/* remember where we started so the acceptable pass can restart there */
 	starting_point = stcb->asoc.last_used_address;
 sctp_from_the_top:
 	if (stcb->asoc.last_used_address == NULL) {
 		/* we are scanning from the head, no further wrap needed */
 		start_at_beginning = 1;
 		stcb->asoc.last_used_address = LIST_FIRST(&inp->sctp_addr_list);
 	}
 	/* search beginning with the last used address */
 	for (laddr = stcb->asoc.last_used_address; laddr;
 	    laddr = LIST_NEXT(laddr, sctp_nxt_addr)) {
 		if (laddr->ifa == NULL) {
 			/* address has been removed */
 			continue;
 		}
 		if (laddr->action == SCTP_DEL_IP_ADDRESS) {
 			/* address is being deleted */
 			continue;
 		}
 		sifa = sctp_is_ifa_addr_preferred(laddr->ifa, dest_is_loop, dest_is_priv, fam);
 		if (sifa == NULL)
 			continue;
 		if (((non_asoc_addr_ok == 0) &&
 		    (sctp_is_addr_restricted(stcb, sifa))) ||
 		    (non_asoc_addr_ok &&
 		    (sctp_is_addr_restricted(stcb, sifa)) &&
 		    (!sctp_is_addr_pending(stcb, sifa)))) {
 			/* on the no-no list */
 			continue;
 		}
 		/* record the list entry we picked for the next search */
 		stcb->asoc.last_used_address = laddr;
 		atomic_add_int(&sifa->refcount, 1);
 		return (sifa);
 	}
 	if (start_at_beginning == 0) {
 		/* started mid-list: wrap around and scan from the head once */
 		stcb->asoc.last_used_address = NULL;
 		goto sctp_from_the_top;
 	}
 	/* now try for any higher scope than the destination */
 	stcb->asoc.last_used_address = starting_point;
 	start_at_beginning = 0;
 sctp_from_the_top2:
 	if (stcb->asoc.last_used_address == NULL) {
 		start_at_beginning = 1;
 		stcb->asoc.last_used_address = LIST_FIRST(&inp->sctp_addr_list);
 	}
 	/* search beginning with the last used address */
 	for (laddr = stcb->asoc.last_used_address; laddr;
 	    laddr = LIST_NEXT(laddr, sctp_nxt_addr)) {
 		if (laddr->ifa == NULL) {
 			/* address has been removed */
 			continue;
 		}
 		if (laddr->action == SCTP_DEL_IP_ADDRESS) {
 			/* address is being deleted */
 			continue;
 		}
 		sifa = sctp_is_ifa_addr_acceptable(laddr->ifa, dest_is_loop,
 		    dest_is_priv, fam);
 		if (sifa == NULL)
 			continue;
 		if (((non_asoc_addr_ok == 0) &&
 		    (sctp_is_addr_restricted(stcb, sifa))) ||
 		    (non_asoc_addr_ok &&
 		    (sctp_is_addr_restricted(stcb, sifa)) &&
 		    (!sctp_is_addr_pending(stcb, sifa)))) {
 			/* on the no-no list */
 			continue;
 		}
 		/* record the list entry we picked for the next search */
 		stcb->asoc.last_used_address = laddr;
 		atomic_add_int(&sifa->refcount, 1);
 		return (sifa);
 	}
 	if (start_at_beginning == 0) {
 		/* started mid-list: wrap around and scan from the head once */
 		stcb->asoc.last_used_address = NULL;
 		goto sctp_from_the_top2;
 	}
 	/* nothing bound to the endpoint can serve as a source */
 	return (NULL);
 }
 
 /*
  * Walk the addresses of interface ifn and return the addr_wanted'th
  * (0-based) one that qualifies as a preferred source for the destination
  * of route ro.  If fewer eligible addresses exist, NULL is returned.
  *
  * An address is eligible when it passes the jail check, is not deferred
  * (unless non_asoc_addr_ok is set), is preferred for the destination
  * scope and, for IPv6, additionally:
  *   - is not a loopback+private source towards a loopback destination;
  *   - shares the scope id of the destination when both are link-local.
  * When an association is supplied the address must also match the
  * next hop if the base mobility feature is on, be in the association's
  * scope, and not be restricted (a restricted address is still allowed
  * when non_asoc_addr_ok is set and the address is pending).
  *
  * The refcount of the returned address is not touched here.
  */
 static struct sctp_ifa *
 sctp_select_nth_preferred_addr_from_ifn_boundall(struct sctp_ifn *ifn,
     struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     int non_asoc_addr_ok,
     uint8_t dest_is_loop,
     uint8_t dest_is_priv,
     int addr_wanted,
     sa_family_t fam,
     sctp_route_t *ro)
 {
 	struct sctp_ifa *cand, *pref;
 	int eligible_seen = 0;
 #ifdef INET6
 	struct sockaddr_in6 dst6, src6;
 
 	/* Work on a copy of the destination with its scope id recovered. */
 	if (fam == AF_INET6) {
 		memcpy(&dst6, &ro->ro_dst, sizeof(struct sockaddr_in6));
 		(void)sa6_recoverscope(&dst6);
 	}
 #endif				/* INET6 */
 	LIST_FOREACH(cand, &ifn->ifalist, next_ifa) {
 #ifdef INET
 		/* skip IPv4 addresses the jail check rejects */
 		if ((cand->address.sa.sa_family == AF_INET) &&
 		    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 		    &cand->address.sin.sin_addr) != 0)) {
 			continue;
 		}
 #endif
 #ifdef INET6
 		/* skip IPv6 addresses the jail check rejects */
 		if ((cand->address.sa.sa_family == AF_INET6) &&
 		    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 		    &cand->address.sin6.sin6_addr) != 0)) {
 			continue;
 		}
 #endif
 		if ((non_asoc_addr_ok == 0) &&
 		    (cand->localifa_flags & SCTP_ADDR_DEFER_USE)) {
 			continue;
 		}
 		pref = sctp_is_ifa_addr_preferred(cand, dest_is_loop,
 		    dest_is_priv, fam);
 		if (pref == NULL) {
 			continue;
 		}
 #ifdef INET6
 		if (fam == AF_INET6) {
 			/*
 			 * fe80::1 must not be the source towards ::1: it is
 			 * not listed to the peer, which would answer with
 			 * an abort.
 			 */
 			if (dest_is_loop &&
 			    pref->src_is_loop && pref->src_is_priv) {
 				continue;
 			}
 			/*
 			 * Link-local source and destination have to live in
 			 * the same scope.
 			 */
 			if (IN6_IS_ADDR_LINKLOCAL(&pref->address.sin6.sin6_addr) &&
 			    IN6_IS_ADDR_LINKLOCAL(&dst6.sin6_addr)) {
 				memcpy(&src6, &pref->address.sin6, sizeof(struct sockaddr_in6));
 				(void)sa6_recoverscope(&src6);
 				if (dst6.sin6_scope_id != src6.sin6_scope_id) {
 					continue;
 				}
 			}
 			/*
 			 * With mobility an interface may carry both its
 			 * previous and its new IPv6 address; only take the
 			 * one that matches the next hop.
 			 */
 			if (stcb &&
 			    sctp_is_mobility_feature_on(stcb->sctp_ep, SCTP_MOBILITY_BASE) &&
 			    (sctp_v6src_match_nexthop(&pref->address.sin6, ro) == 0)) {
 				continue;
 			}
 		}
 #endif				/* INET6 */
 #ifdef INET
 		/* Likewise avoid a topologically incorrect IPv4 address. */
 		if (stcb && fam == AF_INET &&
 		    sctp_is_mobility_feature_on(stcb->sctp_ep, SCTP_MOBILITY_BASE) &&
 		    (sctp_v4src_match_nexthop(pref, ro) == 0)) {
 			continue;
 		}
 #endif
 		if (stcb) {
 			if (sctp_is_address_in_scope(cand, &stcb->asoc.scope, 0) == 0) {
 				continue;
 			}
 			/*
 			 * A restricted address (probably not yet added) is
 			 * only usable when non-association addresses are
 			 * allowed and it is pending.
 			 */
 			if (sctp_is_addr_restricted(stcb, pref) &&
 			    ((non_asoc_addr_ok == 0) ||
 			    (!sctp_is_addr_pending(stcb, pref)))) {
 				continue;
 			}
 		}
 		/* eligible: hand it out once enough have been passed over */
 		if (eligible_seen >= addr_wanted) {
 			return (pref);
 		}
 		eligible_seen++;
 	}
 	return (NULL);
 }
 
 /*
  * Count the addresses on interface ifn that qualify as a preferred source
  * for a destination described by dest_is_loop / dest_is_priv and family
  * fam.
  *
  * An address is counted when it passes the jail check for the endpoint's
  * credentials, is not deferred (unless non_asoc_addr_ok is set) and is
  * preferred for the destination scope.  When an association is supplied
  * it must also be in the association's scope and not be restricted (a
  * restricted address still counts when non_asoc_addr_ok is set and the
  * address is pending).
  *
  * The IPv6 jail check is applied whether or not an association exists,
  * the same way the IPv4 check is and the same way
  * sctp_select_nth_preferred_addr_from_ifn_boundall() does it; otherwise
  * the count could include addresses the selection step always rejects.
  *
  * Returns the number of eligible addresses.
  */
 static int
 sctp_count_num_preferred_boundall(struct sctp_ifn *ifn,
     struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     int non_asoc_addr_ok,
     uint8_t dest_is_loop,
     uint8_t dest_is_priv,
     sa_family_t fam)
 {
 	struct sctp_ifa *ifa, *sifa;
 	int num_eligible_addr = 0;
 
 	LIST_FOREACH(ifa, &ifn->ifalist, next_ifa) {
 #ifdef INET
 		/* skip IPv4 addresses the jail check rejects */
 		if ((ifa->address.sa.sa_family == AF_INET) &&
 		    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 		    &ifa->address.sin.sin_addr) != 0)) {
 			continue;
 		}
 #endif
 #ifdef INET6
 		/* skip IPv6 addresses the jail check rejects */
 		if ((ifa->address.sa.sa_family == AF_INET6) &&
 		    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 		    &ifa->address.sin6.sin6_addr) != 0)) {
 			continue;
 		}
 #endif
 		if ((ifa->localifa_flags & SCTP_ADDR_DEFER_USE) &&
 		    (non_asoc_addr_ok == 0)) {
 			continue;
 		}
 		sifa = sctp_is_ifa_addr_preferred(ifa, dest_is_loop,
 		    dest_is_priv, fam);
 		if (sifa == NULL) {
 			continue;
 		}
 		if (stcb) {
 			if (sctp_is_address_in_scope(ifa, &stcb->asoc.scope, 0) == 0) {
 				continue;
 			}
 			if (((non_asoc_addr_ok == 0) &&
 			    (sctp_is_addr_restricted(stcb, sifa))) ||
 			    (non_asoc_addr_ok &&
 			    (sctp_is_addr_restricted(stcb, sifa)) &&
 			    (!sctp_is_addr_pending(stcb, sifa)))) {
 				/*
 				 * It is restricted for some reason..
 				 * probably not yet added.
 				 */
 				continue;
 			}
 		}
 		num_eligible_addr++;
 	}
 	return (num_eligible_addr);
 }
 
 static struct sctp_ifa *
 sctp_choose_boundall(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     struct sctp_nets *net,
     sctp_route_t *ro,
     uint32_t vrf_id,
     uint8_t dest_is_priv,
     uint8_t dest_is_loop,
     int non_asoc_addr_ok,
     sa_family_t fam)
 {
 	int cur_addr_num = 0, num_preferred = 0;
 	void *ifn;
 	struct sctp_ifn *sctp_ifn, *looked_at = NULL, *emit_ifn;
 	struct sctp_ifa *sctp_ifa, *sifa;
 	uint32_t ifn_index;
 	struct sctp_vrf *vrf;
 #ifdef INET
 	int retried = 0;
 #endif
 
 	/*-
 	 * For boundall we can use any address in the association.
 	 * If non_asoc_addr_ok is set we can use any address (at least in
 	 * theory). So we look for preferred addresses first. If we find one,
 	 * we use it. Otherwise we next try to get an address on the
 	 * interface, which we should be able to do (unless non_asoc_addr_ok
 	 * is false and we are routed out that way). In these cases where we
 	 * can't use the address of the interface we go through all the
 	 * ifn's looking for an address we can use and fill that in. Punting
 	 * means we send back address 0, which will probably cause problems
 	 * actually since then IP will fill in the address of the route ifn,
 	 * which means we probably already rejected it.. i.e. here comes an
 	 * abort :-<.
 	 */
 	vrf = sctp_find_vrf(vrf_id);
 	if (vrf == NULL)
 		return (NULL);
 
 	ifn = SCTP_GET_IFN_VOID_FROM_ROUTE(ro);
 	ifn_index = SCTP_GET_IF_INDEX_FROM_ROUTE(ro);
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "ifn from route:%p ifn_index:%d\n", ifn, ifn_index);
 	emit_ifn = looked_at = sctp_ifn = sctp_find_ifn(ifn, ifn_index);
 	if (sctp_ifn == NULL) {
 		/* ?? We don't have this guy ?? */
 		SCTPDBG(SCTP_DEBUG_OUTPUT2, "No ifn emit interface?\n");
 		goto bound_all_plan_b;
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "ifn_index:%d name:%s is emit interface\n",
 	    ifn_index, sctp_ifn->ifn_name);
 
 	if (net) {
 		cur_addr_num = net->indx_of_eligible_next_to_use;
 	}
 	num_preferred = sctp_count_num_preferred_boundall(sctp_ifn,
 	    inp, stcb,
 	    non_asoc_addr_ok,
 	    dest_is_loop,
 	    dest_is_priv, fam);
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "Found %d preferred source addresses for intf:%s\n",
 	    num_preferred, sctp_ifn->ifn_name);
 	if (num_preferred == 0) {
 		/*
 		 * no eligible addresses, we must use some other interface
 		 * address if we can find one.
 		 */
 		goto bound_all_plan_b;
 	}
 	/*
 	 * Ok we have num_eligible_addr set with how many we can use, this
 	 * may vary from call to call due to addresses being deprecated
 	 * etc..
 	 */
 	if (cur_addr_num >= num_preferred) {
 		cur_addr_num = 0;
 	}
 	/*
 	 * select the nth address from the list (where cur_addr_num is the
 	 * nth) and 0 is the first one, 1 is the second one etc...
 	 */
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "cur_addr_num:%d\n", cur_addr_num);
 
 	sctp_ifa = sctp_select_nth_preferred_addr_from_ifn_boundall(sctp_ifn, inp, stcb, non_asoc_addr_ok, dest_is_loop,
 	    dest_is_priv, cur_addr_num, fam, ro);
 
 	/* if sctp_ifa is NULL something changed??, fall to plan b. */
 	if (sctp_ifa) {
 		atomic_add_int(&sctp_ifa->refcount, 1);
 		if (net) {
 			/* save off where the next one we will want */
 			net->indx_of_eligible_next_to_use = cur_addr_num + 1;
 		}
 		return (sctp_ifa);
 	}
 	/*
 	 * plan_b: Look at all interfaces and find a preferred address. If
 	 * no preferred fall through to plan_c.
 	 */
 bound_all_plan_b:
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "Trying Plan B\n");
 	LIST_FOREACH(sctp_ifn, &vrf->ifnlist, next_ifn) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT2, "Examine interface %s\n",
 		    sctp_ifn->ifn_name);
 		if (dest_is_loop == 0 && SCTP_IFN_IS_IFT_LOOP(sctp_ifn)) {
 			/* wrong base scope */
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "skip\n");
 			continue;
 		}
 		if ((sctp_ifn == looked_at) && looked_at) {
 			/* already looked at this guy */
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "already seen\n");
 			continue;
 		}
 		num_preferred = sctp_count_num_preferred_boundall(sctp_ifn, inp, stcb, non_asoc_addr_ok,
 		    dest_is_loop, dest_is_priv, fam);
 		SCTPDBG(SCTP_DEBUG_OUTPUT2,
 		    "Found ifn:%p %d preferred source addresses\n",
 		    ifn, num_preferred);
 		if (num_preferred == 0) {
 			/* None on this interface. */
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "No preferred -- skipping to next\n");
 			continue;
 		}
 		SCTPDBG(SCTP_DEBUG_OUTPUT2,
 		    "num preferred:%d on interface:%p cur_addr_num:%d\n",
 		    num_preferred, (void *)sctp_ifn, cur_addr_num);
 
 		/*
 		 * Ok we have num_eligible_addr set with how many we can
 		 * use, this may vary from call to call due to addresses
 		 * being deprecated etc..
 		 */
 		if (cur_addr_num >= num_preferred) {
 			cur_addr_num = 0;
 		}
 		sifa = sctp_select_nth_preferred_addr_from_ifn_boundall(sctp_ifn, inp, stcb, non_asoc_addr_ok, dest_is_loop,
 		    dest_is_priv, cur_addr_num, fam, ro);
 		if (sifa == NULL)
 			continue;
 		if (net) {
 			net->indx_of_eligible_next_to_use = cur_addr_num + 1;
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "we selected %d\n",
 			    cur_addr_num);
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "Source:");
 			SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, &sifa->address.sa);
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "Dest:");
 			SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, &net->ro._l_addr.sa);
 		}
 		atomic_add_int(&sifa->refcount, 1);
 		return (sifa);
 	}
 #ifdef INET
 again_with_private_addresses_allowed:
 #endif
 	/* plan_c: do we have an acceptable address on the emit interface */
 	sifa = NULL;
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "Trying Plan C: find acceptable on interface\n");
 	if (emit_ifn == NULL) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT2, "Jump to Plan D - no emit_ifn\n");
 		goto plan_d;
 	}
 	LIST_FOREACH(sctp_ifa, &emit_ifn->ifalist, next_ifa) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT2, "ifa:%p\n", (void *)sctp_ifa);
 #ifdef INET
 		if ((sctp_ifa->address.sa.sa_family == AF_INET) &&
 		    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 		    &sctp_ifa->address.sin.sin_addr) != 0)) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "Jailed\n");
 			continue;
 		}
 #endif
 #ifdef INET6
 		if ((sctp_ifa->address.sa.sa_family == AF_INET6) &&
 		    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 		    &sctp_ifa->address.sin6.sin6_addr) != 0)) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "Jailed\n");
 			continue;
 		}
 #endif
 		if ((sctp_ifa->localifa_flags & SCTP_ADDR_DEFER_USE) &&
 		    (non_asoc_addr_ok == 0)) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "Defer\n");
 			continue;
 		}
 		sifa = sctp_is_ifa_addr_acceptable(sctp_ifa, dest_is_loop,
 		    dest_is_priv, fam);
 		if (sifa == NULL) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "IFA not acceptable\n");
 			continue;
 		}
 		if (stcb) {
 			if (sctp_is_address_in_scope(sifa, &stcb->asoc.scope, 0) == 0) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT2, "NOT in scope\n");
 				sifa = NULL;
 				continue;
 			}
 			if (((non_asoc_addr_ok == 0) &&
 			    (sctp_is_addr_restricted(stcb, sifa))) ||
 			    (non_asoc_addr_ok &&
 			    (sctp_is_addr_restricted(stcb, sifa)) &&
 			    (!sctp_is_addr_pending(stcb, sifa)))) {
 				/*
 				 * It is restricted for some reason..
 				 * probably not yet added.
 				 */
 				SCTPDBG(SCTP_DEBUG_OUTPUT2, "Its restricted\n");
 				sifa = NULL;
 				continue;
 			}
 		}
 		atomic_add_int(&sifa->refcount, 1);
 		goto out;
 	}
 plan_d:
 	/*
 	 * plan_d: We are in trouble. No preferred address on the emit
 	 * interface. And not even a preferred address on all interfaces. Go
 	 * out and see if we can find an acceptable address somewhere
 	 * amongst all interfaces.
 	 */
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "Trying Plan D looked_at is %p\n", (void *)looked_at);
 	LIST_FOREACH(sctp_ifn, &vrf->ifnlist, next_ifn) {
 		if (dest_is_loop == 0 && SCTP_IFN_IS_IFT_LOOP(sctp_ifn)) {
 			/* wrong base scope */
 			continue;
 		}
 		LIST_FOREACH(sctp_ifa, &sctp_ifn->ifalist, next_ifa) {
 #ifdef INET
 			if ((sctp_ifa->address.sa.sa_family == AF_INET) &&
 			    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin.sin_addr) != 0)) {
 				continue;
 			}
 #endif
 #ifdef INET6
 			if ((sctp_ifa->address.sa.sa_family == AF_INET6) &&
 			    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 			    &sctp_ifa->address.sin6.sin6_addr) != 0)) {
 				continue;
 			}
 #endif
 			if ((sctp_ifa->localifa_flags & SCTP_ADDR_DEFER_USE) &&
 			    (non_asoc_addr_ok == 0))
 				continue;
 			sifa = sctp_is_ifa_addr_acceptable(sctp_ifa,
 			    dest_is_loop,
 			    dest_is_priv, fam);
 			if (sifa == NULL)
 				continue;
 			if (stcb) {
 				if (sctp_is_address_in_scope(sifa, &stcb->asoc.scope, 0) == 0) {
 					sifa = NULL;
 					continue;
 				}
 				if (((non_asoc_addr_ok == 0) &&
 				    (sctp_is_addr_restricted(stcb, sifa))) ||
 				    (non_asoc_addr_ok &&
 				    (sctp_is_addr_restricted(stcb, sifa)) &&
 				    (!sctp_is_addr_pending(stcb, sifa)))) {
 					/*
 					 * It is restricted for some
 					 * reason.. probably not yet added.
 					 */
 					sifa = NULL;
 					continue;
 				}
 			}
 			goto out;
 		}
 	}
 #ifdef INET
 	if (stcb) {
 		if ((retried == 0) && (stcb->asoc.scope.ipv4_local_scope == 0)) {
 			stcb->asoc.scope.ipv4_local_scope = 1;
 			retried = 1;
 			goto again_with_private_addresses_allowed;
 		} else if (retried == 1) {
 			stcb->asoc.scope.ipv4_local_scope = 0;
 		}
 	}
 #endif
 out:
 #ifdef INET
 	if (sifa) {
 		if (retried == 1) {
 			LIST_FOREACH(sctp_ifn, &vrf->ifnlist, next_ifn) {
 				if (dest_is_loop == 0 && SCTP_IFN_IS_IFT_LOOP(sctp_ifn)) {
 					/* wrong base scope */
 					continue;
 				}
 				LIST_FOREACH(sctp_ifa, &sctp_ifn->ifalist, next_ifa) {
 					struct sctp_ifa *tmp_sifa;
 
 #ifdef INET
 					if ((sctp_ifa->address.sa.sa_family == AF_INET) &&
 					    (prison_check_ip4(inp->ip_inp.inp.inp_cred,
 					    &sctp_ifa->address.sin.sin_addr) != 0)) {
 						continue;
 					}
 #endif
 #ifdef INET6
 					if ((sctp_ifa->address.sa.sa_family == AF_INET6) &&
 					    (prison_check_ip6(inp->ip_inp.inp.inp_cred,
 					    &sctp_ifa->address.sin6.sin6_addr) != 0)) {
 						continue;
 					}
 #endif
 					if ((sctp_ifa->localifa_flags & SCTP_ADDR_DEFER_USE) &&
 					    (non_asoc_addr_ok == 0))
 						continue;
 					tmp_sifa = sctp_is_ifa_addr_acceptable(sctp_ifa,
 					    dest_is_loop,
 					    dest_is_priv, fam);
 					if (tmp_sifa == NULL) {
 						continue;
 					}
 					if (tmp_sifa == sifa) {
 						continue;
 					}
 					if (stcb) {
 						if (sctp_is_address_in_scope(tmp_sifa,
 						    &stcb->asoc.scope, 0) == 0) {
 							continue;
 						}
 						if (((non_asoc_addr_ok == 0) &&
 						    (sctp_is_addr_restricted(stcb, tmp_sifa))) ||
 						    (non_asoc_addr_ok &&
 						    (sctp_is_addr_restricted(stcb, tmp_sifa)) &&
 						    (!sctp_is_addr_pending(stcb, tmp_sifa)))) {
 							/*
 							 * It is restricted
 							 * for some reason..
 							 * probably not yet
 							 * added.
 							 */
 							continue;
 						}
 					}
 					if ((tmp_sifa->address.sin.sin_family == AF_INET) &&
 					    (IN4_ISPRIVATE_ADDRESS(&(tmp_sifa->address.sin.sin_addr)))) {
 						sctp_add_local_addr_restricted(stcb, tmp_sifa);
 					}
 				}
 			}
 		}
 		atomic_add_int(&sifa->refcount, 1);
 	}
 #endif
 	return (sifa);
 }
 
 /*
  * Pick the local source address to use when sending towards the destination
  * stored in ro->ro_dst.
  *
  * If ro has no next hop yet, one is looked up with SCTP_RTALLOC(); NULL is
  * returned when there still is none afterwards.  Otherwise the destination
  * is classified as loopback and/or private (IPv4) / link-local (IPv6) and,
  * between SCTP_IPI_ADDR_RLOCK() and SCTP_IPI_ADDR_RUNLOCK(), the choice is
  * delegated to the bound-all or the matching bound-specific selector.
  * Whatever that selector returns is handed back unchanged.
  *
  * stcb may be NULL, and so may net.  When net is given and the destination
  * is a loopback address, net->addr_is_local is set.
  */
 struct sctp_ifa *
 sctp_source_address_selection(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     sctp_route_t *ro,
     struct sctp_nets *net,
     int non_asoc_addr_ok, uint32_t vrf_id)
 {
 #ifdef INET6
 	struct sockaddr_in6 *to6 = (struct sockaddr_in6 *)&ro->ro_dst;
 #endif
 #ifdef INET
 	struct sockaddr_in *to = (struct sockaddr_in *)&ro->ro_dst;
 #endif
 	struct sctp_ifa *picked;
 	sa_family_t fam;
 	uint8_t dest_is_loop = 0;
 	uint8_t dest_is_priv = 0;
 
 	/**
 	 * Rules:
 	 * - Find the route if needed, cache it if possible.
 	 * - Look at the interface address in the route. Is it in the bound
 	 *   list? If so we have the best source.
 	 * - If not we must rotate amongst the addresses.
 	 *
 	 * Caveats and issues
 	 *
 	 * Do we need to pay attention to scope? We can have a private address
 	 * or a global address we are sourcing or sending to. So if we draw
 	 * it out:
 	 *
 	 * For V4
 	 * ------------------------------------------
 	 *      source     *      dest  *  result
 	 * ------------------------------------------
 	 * <a>  Private    *    Global  *  NAT
 	 * ------------------------------------------
 	 * <b>  Private    *    Private *  No problem
 	 * ------------------------------------------
 	 * <c>  Global     *    Private *  Huh, how will this work?
 	 * ------------------------------------------
 	 * <d>  Global     *    Global  *  No problem
 	 * ------------------------------------------
 	 *
 	 * For V6
 	 * ------------------------------------------
 	 *      source     *      dest  *  result
 	 * ------------------------------------------
 	 * <a>  Linklocal  *    Global  *
 	 * ------------------------------------------
 	 * <b>  Linklocal  * Linklocal  *  No problem
 	 * ------------------------------------------
 	 * <c>  Global     * Linklocal  *  Huh, how will this work?
 	 * ------------------------------------------
 	 * <d>  Global     *    Global  *  No problem
 	 * ------------------------------------------
 	 *
 	 * And then we add to that what happens if there are multiple
 	 * addresses assigned to an interface. Remember the ifa on an ifn is
 	 * a linked list of addresses, so one interface can have more than
 	 * one IP address. What happens if we have both a private and a
 	 * global address? Do we then use the context of the destination to
 	 * sort out which one is best? And what about NATs: sending P->G may
 	 * get you a NAT translation, or should you select the G that is on
 	 * the interface in preference?
 	 *
 	 * Decisions:
 	 *
 	 * - Count the number of addresses on the interface.
 	 * - If it is one, no problem except case <c>.
 	 *   For <a> we will assume a NAT out there.
 	 * - If there is more than one, then we need to worry about scope P
 	 *   or G. We should prefer G -> G and P -> P if possible.
 	 *   Then as a secondary fall back to mixed types, G->P being a last
 	 *   ditch one.
 	 * - The above all works for bound all, but for bound specific we
 	 *   need to use the same concept but instead only consider the bound
 	 *   addresses. If the bound set is NOT assigned to the interface
 	 *   then we must use rotation amongst the bound addresses.
 	 */
 	if (ro->ro_nh == NULL) {
 		/* Need a route to cache. */
 		SCTP_RTALLOC(ro, vrf_id, inp->fibnum);
 		if (ro->ro_nh == NULL) {
 			return (NULL);
 		}
 	}
 
 	/* Work out the scope of the destination. */
 	fam = ro->ro_dst.sa_family;
 	switch (fam) {
 #ifdef INET
 	case AF_INET:
 		/* Scope based on outbound address */
 		if (IN4_ISLOOPBACK_ADDRESS(&to->sin_addr)) {
 			dest_is_loop = 1;
 			if (net != NULL) {
 				/* mark it as local */
 				net->addr_is_local = 1;
 			}
 		} else if (IN4_ISPRIVATE_ADDRESS(&to->sin_addr)) {
 			dest_is_priv = 1;
 		}
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		/*
 		 * Scope based on outbound address. A loopback address,
 		 * i.e. "::1" OR "fe80::1%lo0", gives loopback scope; in
 		 * that case dest_is_priv (link local addresses) is not
 		 * used.
 		 */
 		if (IN6_IS_ADDR_LOOPBACK(&to6->sin6_addr) ||
 		    SCTP_ROUTE_IS_REAL_LOOP(ro)) {
 			dest_is_loop = 1;
 			if (net != NULL) {
 				/* mark it as local */
 				net->addr_is_local = 1;
 			}
 		} else if (IN6_IS_ADDR_LINKLOCAL(&to6->sin6_addr)) {
 			dest_is_priv = 1;
 		}
 		break;
 #endif
 	default:
 		break;
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "Select source addr for:");
 	SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, (struct sockaddr *)&ro->ro_dst);
 
 	SCTP_IPI_ADDR_RLOCK();
 	if (inp->sctp_flags & SCTP_PCB_FLAGS_BOUNDALL) {
 		/* Bound all case */
 		picked = sctp_choose_boundall(inp, stcb, net, ro, vrf_id,
 		    dest_is_priv, dest_is_loop,
 		    non_asoc_addr_ok, fam);
 	} else if (stcb) {
 		/* Subset bound case, association available */
 		picked = sctp_choose_boundspecific_stcb(inp, stcb, ro,
 		    vrf_id, dest_is_priv,
 		    dest_is_loop,
 		    non_asoc_addr_ok, fam);
 	} else {
 		/* Subset bound case, endpoint only */
 		picked = sctp_choose_boundspecific_inp(inp, ro, vrf_id,
 		    non_asoc_addr_ok,
 		    dest_is_priv,
 		    dest_is_loop, fam);
 	}
 	SCTP_IPI_ADDR_RUNLOCK();
 	return (picked);
 }
 
 /*
  * Look through the control messages in control for SCTP ancillary data of
  * type c_type and copy it to data, which provides room for cpsize bytes.
  *
  * A control message whose type equals c_type is copied out verbatim (the
  * first cpsize bytes of its payload) and ends the search.  When c_type is
  * SCTP_SNDRCV, SCTP_SNDINFO, SCTP_PRINFO and SCTP_AUTHINFO messages are
  * accepted as well: data is then treated as a struct sctp_sndrcvinfo, zeroed
  * before the first such message is applied, and the fields of each message
  * are folded into it while the scan continues.
  *
  * Returns true if data was filled in from at least one control message.  A
  * truncated or undersized control message stops the scan; whatever was found
  * up to that point is still reported.
  */
 static bool
 sctp_find_cmsg(int c_type, void *data, struct mbuf *control, size_t cpsize)
 {
 	struct sctp_sndrcvinfo *sndrcvinfo;
 	struct sctp_authinfo authinfo;
 	struct sctp_prinfo prinfo;
 	struct sctp_sndinfo sndinfo;
 	struct cmsghdr cmh;
 	int tot_len, rem_len, cmsg_data_len, cmsg_data_off, off;
 	bool found;
 
 	found = false;
 	sndrcvinfo = (struct sctp_sndrcvinfo *)data;
 	tot_len = SCTP_BUF_LEN(control);
 	for (off = 0; off < tot_len; off += CMSG_ALIGN(cmh.cmsg_len)) {
 		rem_len = tot_len - off;
 		if (rem_len < (int)CMSG_ALIGN(sizeof(cmh))) {
 			/* There is not enough room for one more. */
 			return (found);
 		}
 		m_copydata(control, off, sizeof(cmh), (caddr_t)&cmh);
 		if (cmh.cmsg_len < CMSG_ALIGN(sizeof(cmh))) {
 			/* We don't have a complete CMSG header. */
 			return (found);
 		}
 		if ((cmh.cmsg_len > INT_MAX) || ((int)cmh.cmsg_len > rem_len)) {
 			/* We don't have the complete CMSG. */
 			return (found);
 		}
 		cmsg_data_len = (int)cmh.cmsg_len - CMSG_ALIGN(sizeof(cmh));
 		cmsg_data_off = off + CMSG_ALIGN(sizeof(cmh));
 
 		if (cmh.cmsg_level != IPPROTO_SCTP) {
 			/* Not ours, move on to the next control message. */
 			continue;
 		}
 		if (c_type == cmh.cmsg_type) {
 			/* It is exactly what we want. Copy it out. */
 			if ((cpsize > INT_MAX) ||
 			    (cmsg_data_len < (int)cpsize)) {
 				return (found);
 			}
 			m_copydata(control, cmsg_data_off, (int)cpsize, (caddr_t)data);
 			return (true);
 		}
 		if ((c_type != SCTP_SNDRCV) ||
 		    ((cmh.cmsg_type != SCTP_SNDINFO) &&
 		    (cmh.cmsg_type != SCTP_PRINFO) &&
 		    (cmh.cmsg_type != SCTP_AUTHINFO))) {
 			/* Nothing that can contribute to the request. */
 			continue;
 		}
 
 		/*
 		 * An SCTP_SNDRCV request is assembled from the newer
 		 * per-aspect control messages; start from a clean slate
 		 * before the first one is merged in.
 		 */
 		if (!found) {
 			if (cpsize < sizeof(struct sctp_sndrcvinfo)) {
 				return (found);
 			}
 			memset(sndrcvinfo, 0, sizeof(struct sctp_sndrcvinfo));
 		}
 		switch (cmh.cmsg_type) {
 		case SCTP_SNDINFO:
 			if (cmsg_data_len < (int)sizeof(struct sctp_sndinfo)) {
 				return (found);
 			}
 			m_copydata(control, cmsg_data_off, sizeof(struct sctp_sndinfo), (caddr_t)&sndinfo);
 			sndrcvinfo->sinfo_stream = sndinfo.snd_sid;
 			sndrcvinfo->sinfo_flags = sndinfo.snd_flags;
 			sndrcvinfo->sinfo_ppid = sndinfo.snd_ppid;
 			sndrcvinfo->sinfo_context = sndinfo.snd_context;
 			sndrcvinfo->sinfo_assoc_id = sndinfo.snd_assoc_id;
 			break;
 		case SCTP_PRINFO:
 			if (cmsg_data_len < (int)sizeof(struct sctp_prinfo)) {
 				return (found);
 			}
 			m_copydata(control, cmsg_data_off, sizeof(struct sctp_prinfo), (caddr_t)&prinfo);
 			sndrcvinfo->sinfo_timetolive =
 			    (prinfo.pr_policy != SCTP_PR_SCTP_NONE) ?
 			    prinfo.pr_value : 0;
 			sndrcvinfo->sinfo_flags |= prinfo.pr_policy;
 			break;
 		case SCTP_AUTHINFO:
 			if (cmsg_data_len < (int)sizeof(struct sctp_authinfo)) {
 				return (found);
 			}
 			m_copydata(control, cmsg_data_off, sizeof(struct sctp_authinfo), (caddr_t)&authinfo);
 			sndrcvinfo->sinfo_keynumber_valid = 1;
 			sndrcvinfo->sinfo_keynumber = authinfo.auth_keynumber;
 			break;
 		default:
 			return (found);
 		}
 		found = true;
 	}
 	return (found);
 }
 
 /*
  * Apply the SCTP-level control messages found in control to the association
  * stcb.
  *
  * SCTP_INIT: every non-zero field of the supplied struct sctp_initmsg
  * overrides the corresponding association setting (max_init_times,
  * pre_open_streams, max_inbound_streams, initial_init_rto_max).  If more
  * outgoing streams are requested than currently exist, a larger outgoing
  * stream array is allocated and all streams are (re)initialised.
  * SCTP_DSTADDRV4 / SCTP_DSTADDRV6: the address is added as a further remote
  * address via sctp_add_remote_addr(), using stcb->rport as port and
  * SCTP_ADDR_IS_CONFIRMED.
  * Control messages of any other level or type are ignored.
  *
  * Returns 0 on success.  On failure 1 is returned and *error is set to
  * EINVAL (truncated or undersized control message, unspecified, broadcast
  * or multicast address) or ENOBUFS (sctp_add_remote_addr() failed).
  */
 static int
 sctp_process_cmsgs_for_init(struct sctp_tcb *stcb, struct mbuf *control, int *error)
 {
 	struct cmsghdr cmh;
 	struct sctp_initmsg initmsg;
 #ifdef INET
 	struct sockaddr_in sin;
 #endif
 #ifdef INET6
 	struct sockaddr_in6 sin6;
 #endif
 	int tot_len, rem_len, cmsg_data_len, cmsg_data_off, off;
 
 	tot_len = SCTP_BUF_LEN(control);
 	/* Step from one aligned control message to the next. */
 	for (off = 0; off < tot_len; off += CMSG_ALIGN(cmh.cmsg_len)) {
 		rem_len = tot_len - off;
 		if (rem_len < (int)CMSG_ALIGN(sizeof(cmh))) {
 			/* There is not enough room for one more. */
 			*error = EINVAL;
 			return (1);
 		}
 		m_copydata(control, off, sizeof(cmh), (caddr_t)&cmh);
 		if (cmh.cmsg_len < CMSG_ALIGN(sizeof(cmh))) {
 			/* We don't have a complete CMSG header. */
 			*error = EINVAL;
 			return (1);
 		}
 		if ((cmh.cmsg_len > INT_MAX) || ((int)cmh.cmsg_len > rem_len)) {
 			/* We don't have the complete CMSG. */
 			*error = EINVAL;
 			return (1);
 		}
 		/* Payload length and offset of this control message. */
 		cmsg_data_len = (int)cmh.cmsg_len - CMSG_ALIGN(sizeof(cmh));
 		cmsg_data_off = off + CMSG_ALIGN(sizeof(cmh));
 		if (cmh.cmsg_level == IPPROTO_SCTP) {
 			switch (cmh.cmsg_type) {
 			case SCTP_INIT:
 				if (cmsg_data_len < (int)sizeof(struct sctp_initmsg)) {
 					*error = EINVAL;
 					return (1);
 				}
 				m_copydata(control, cmsg_data_off, sizeof(struct sctp_initmsg), (caddr_t)&initmsg);
 				/* A zero field leaves the current setting untouched. */
 				if (initmsg.sinit_max_attempts)
 					stcb->asoc.max_init_times = initmsg.sinit_max_attempts;
 				if (initmsg.sinit_num_ostreams)
 					stcb->asoc.pre_open_streams = initmsg.sinit_num_ostreams;
 				if (initmsg.sinit_max_instreams)
 					stcb->asoc.max_inbound_streams = initmsg.sinit_max_instreams;
 				if (initmsg.sinit_max_init_timeo)
 					stcb->asoc.initial_init_rto_max = initmsg.sinit_max_init_timeo;
 				if (stcb->asoc.streamoutcnt < stcb->asoc.pre_open_streams) {
 					struct sctp_stream_out *tmp_str;
 					unsigned int i;
 #if defined(SCTP_DETAILED_STR_STATS)
 					int j;
 #endif
 
 					/* Default is NOT correct */
 					SCTPDBG(SCTP_DEBUG_OUTPUT1, "Ok, default:%d pre_open:%d\n",
 					    stcb->asoc.streamoutcnt, stcb->asoc.pre_open_streams);
 					/*
 					 * The TCB lock is released around the
 					 * allocation and taken again afterwards.
 					 */
 					SCTP_TCB_UNLOCK(stcb);
 					SCTP_MALLOC(tmp_str,
 					    struct sctp_stream_out *,
 					    (stcb->asoc.pre_open_streams * sizeof(struct sctp_stream_out)),
 					    SCTP_M_STRMO);
 					SCTP_TCB_LOCK(stcb);
 					if (tmp_str != NULL) {
 						/* Swap in the larger array. */
 						SCTP_FREE(stcb->asoc.strmout, SCTP_M_STRMO);
 						stcb->asoc.strmout = tmp_str;
 						stcb->asoc.strm_realoutsize = stcb->asoc.streamoutcnt = stcb->asoc.pre_open_streams;
 					} else {
 						/*
 						 * Allocation failed: keep the
 						 * existing array and fall back
 						 * to its stream count.
 						 */
 						stcb->asoc.pre_open_streams = stcb->asoc.streamoutcnt;
 					}
 					/*
 					 * Initialise every stream of the array
 					 * that is now in use.
 					 */
 					for (i = 0; i < stcb->asoc.streamoutcnt; i++) {
 						TAILQ_INIT(&stcb->asoc.strmout[i].outqueue);
 						stcb->asoc.ss_functions.sctp_ss_init_stream(stcb, &stcb->asoc.strmout[i], NULL);
 						stcb->asoc.strmout[i].chunks_on_queues = 0;
 #if defined(SCTP_DETAILED_STR_STATS)
 						for (j = 0; j < SCTP_PR_SCTP_MAX + 1; j++) {
 							stcb->asoc.strmout[i].abandoned_sent[j] = 0;
 							stcb->asoc.strmout[i].abandoned_unsent[j] = 0;
 						}
 #else
 						stcb->asoc.strmout[i].abandoned_sent[0] = 0;
 						stcb->asoc.strmout[i].abandoned_unsent[0] = 0;
 #endif
 						stcb->asoc.strmout[i].next_mid_ordered = 0;
 						stcb->asoc.strmout[i].next_mid_unordered = 0;
 						stcb->asoc.strmout[i].sid = i;
 						stcb->asoc.strmout[i].last_msg_incomplete = 0;
 						stcb->asoc.strmout[i].state = SCTP_STREAM_OPENING;
 					}
 				}
 				break;
 #ifdef INET
 			case SCTP_DSTADDRV4:
 				if (cmsg_data_len < (int)sizeof(struct in_addr)) {
 					*error = EINVAL;
 					return (1);
 				}
 				/* Build a full sockaddr_in around the supplied address. */
 				memset(&sin, 0, sizeof(struct sockaddr_in));
 				sin.sin_family = AF_INET;
 				sin.sin_len = sizeof(struct sockaddr_in);
 				sin.sin_port = stcb->rport;
 				m_copydata(control, cmsg_data_off, sizeof(struct in_addr), (caddr_t)&sin.sin_addr);
 				/* Reject unspecified, broadcast and multicast addresses. */
 				if ((sin.sin_addr.s_addr == INADDR_ANY) ||
 				    (sin.sin_addr.s_addr == INADDR_BROADCAST) ||
 				    IN_MULTICAST(ntohl(sin.sin_addr.s_addr))) {
 					*error = EINVAL;
 					return (1);
 				}
 				if (sctp_add_remote_addr(stcb, (struct sockaddr *)&sin, NULL, stcb->asoc.port,
 				    SCTP_DONOT_SETSCOPE, SCTP_ADDR_IS_CONFIRMED)) {
 					*error = ENOBUFS;
 					return (1);
 				}
 				break;
 #endif
 #ifdef INET6
 			case SCTP_DSTADDRV6:
 				if (cmsg_data_len < (int)sizeof(struct in6_addr)) {
 					*error = EINVAL;
 					return (1);
 				}
 				/* Build a full sockaddr_in6 around the supplied address. */
 				memset(&sin6, 0, sizeof(struct sockaddr_in6));
 				sin6.sin6_family = AF_INET6;
 				sin6.sin6_len = sizeof(struct sockaddr_in6);
 				sin6.sin6_port = stcb->rport;
 				m_copydata(control, cmsg_data_off, sizeof(struct in6_addr), (caddr_t)&sin6.sin6_addr);
 				/* Reject unspecified and multicast addresses. */
 				if (IN6_IS_ADDR_UNSPECIFIED(&sin6.sin6_addr) ||
 				    IN6_IS_ADDR_MULTICAST(&sin6.sin6_addr)) {
 					*error = EINVAL;
 					return (1);
 				}
 #ifdef INET
 				/*
 				 * A V4-mapped address is converted to a
 				 * sockaddr_in and validated and added like an
 				 * SCTP_DSTADDRV4 one.
 				 */
 				if (IN6_IS_ADDR_V4MAPPED(&sin6.sin6_addr)) {
 					in6_sin6_2_sin(&sin, &sin6);
 					if ((sin.sin_addr.s_addr == INADDR_ANY) ||
 					    (sin.sin_addr.s_addr == INADDR_BROADCAST) ||
 					    IN_MULTICAST(ntohl(sin.sin_addr.s_addr))) {
 						*error = EINVAL;
 						return (1);
 					}
 					if (sctp_add_remote_addr(stcb, (struct sockaddr *)&sin, NULL, stcb->asoc.port,
 					    SCTP_DONOT_SETSCOPE, SCTP_ADDR_IS_CONFIRMED)) {
 						*error = ENOBUFS;
 						return (1);
 					}
 				} else
 #endif
 					/*
 					 * Note: with INET defined this "if" is
 					 * the else-branch of the V4-mapped test
 					 * above; without INET it stands alone.
 					 */
 					if (sctp_add_remote_addr(stcb, (struct sockaddr *)&sin6, NULL, stcb->asoc.port,
 				    SCTP_DONOT_SETSCOPE, SCTP_ADDR_IS_CONFIRMED)) {
 					*error = ENOBUFS;
 					return (1);
 				}
 				break;
 #endif
 			default:
 				/* Other SCTP control messages are not handled here. */
 				break;
 			}
 		}
 	}
 	return (0);
 }
 
 #if defined(INET) || defined(INET6)
 /*
  * Try to find an existing association by means of the destination addresses
  * carried in the SCTP_DSTADDRV4 / SCTP_DSTADDRV6 control messages of control.
  *
  * Each such address, combined with port, is handed to
  * sctp_findassociation_ep_addr() together with inp_p and net_p; the first
  * association that call yields is returned.  A V4-mapped IPv6 address is
  * looked up as an IPv4 address when INET is compiled in.
  *
  * Returns NULL if no association was found.  On a truncated or undersized
  * control message NULL is returned with *error set to EINVAL; *error is not
  * written otherwise.
  */
 static struct sctp_tcb *
 sctp_findassociation_cmsgs(struct sctp_inpcb **inp_p,
     uint16_t port,
     struct mbuf *control,
     struct sctp_nets **net_p,
     int *error)
 {
 	struct sockaddr *addr;
 	struct sctp_tcb *stcb;
 	struct cmsghdr cmh;
 #ifdef INET6
 	struct sockaddr_in6 sin6;
 #endif
 #ifdef INET
 	struct sockaddr_in sin;
 #endif
 	int tot_len, rem_len, cmsg_data_len, cmsg_data_off, off;
 
 	tot_len = SCTP_BUF_LEN(control);
 	for (off = 0; off < tot_len; off += CMSG_ALIGN(cmh.cmsg_len)) {
 		rem_len = tot_len - off;
 		if (rem_len < (int)CMSG_ALIGN(sizeof(cmh))) {
 			/* There is not enough room for one more. */
 			goto invalid;
 		}
 		m_copydata(control, off, sizeof(cmh), (caddr_t)&cmh);
 		if (cmh.cmsg_len < CMSG_ALIGN(sizeof(cmh))) {
 			/* We don't have a complete CMSG header. */
 			goto invalid;
 		}
 		if ((cmh.cmsg_len > INT_MAX) || ((int)cmh.cmsg_len > rem_len)) {
 			/* We don't have the complete CMSG. */
 			goto invalid;
 		}
 		cmsg_data_len = (int)cmh.cmsg_len - CMSG_ALIGN(sizeof(cmh));
 		cmsg_data_off = off + CMSG_ALIGN(sizeof(cmh));
 
 		if (cmh.cmsg_level != IPPROTO_SCTP) {
 			continue;
 		}
 
 		/* Turn the control message into a socket address, if it is one. */
 		addr = NULL;
 		switch (cmh.cmsg_type) {
 #ifdef INET
 		case SCTP_DSTADDRV4:
 			if (cmsg_data_len < (int)sizeof(struct in_addr)) {
 				goto invalid;
 			}
 			memset(&sin, 0, sizeof(struct sockaddr_in));
 			sin.sin_family = AF_INET;
 			sin.sin_len = sizeof(struct sockaddr_in);
 			sin.sin_port = port;
 			m_copydata(control, cmsg_data_off, sizeof(struct in_addr), (caddr_t)&sin.sin_addr);
 			addr = (struct sockaddr *)&sin;
 			break;
 #endif
 #ifdef INET6
 		case SCTP_DSTADDRV6:
 			if (cmsg_data_len < (int)sizeof(struct in6_addr)) {
 				goto invalid;
 			}
 			memset(&sin6, 0, sizeof(struct sockaddr_in6));
 			sin6.sin6_family = AF_INET6;
 			sin6.sin6_len = sizeof(struct sockaddr_in6);
 			sin6.sin6_port = port;
 			m_copydata(control, cmsg_data_off, sizeof(struct in6_addr), (caddr_t)&sin6.sin6_addr);
 #ifdef INET
 			if (IN6_IS_ADDR_V4MAPPED(&sin6.sin6_addr)) {
 				/* Look it up as the embedded IPv4 address. */
 				in6_sin6_2_sin(&sin, &sin6);
 				addr = (struct sockaddr *)&sin;
 				break;
 			}
 #endif
 			addr = (struct sockaddr *)&sin6;
 			break;
 #endif
 		default:
 			break;
 		}
 		if (addr == NULL) {
 			continue;
 		}
 		stcb = sctp_findassociation_ep_addr(inp_p, addr, net_p, NULL, NULL);
 		if (stcb != NULL) {
 			return (stcb);
 		}
 	}
 	return (NULL);
 
 invalid:
 	*error = EINVAL;
 	return (NULL);
 }
 #endif
 
 /*
  * Build a state cookie parameter (SCTP_STATE_COOKIE) as an mbuf chain.
  *
  * The chain consists of a parameter header followed by a copy of *stc_in,
  * then a copy of init starting at init_offset, a copy of initack starting
  * at initack_offset and finally SCTP_SIGNATURE_SIZE zeroed bytes.  The
  * parameter length is set to the summed length of the whole chain and
  * *signature is set to point at the trailing signature bytes.
  *
  * All allocations use M_NOWAIT.  If any of them fails, everything obtained
  * so far is freed and NULL is returned; *signature is then left untouched.
  */
 static struct mbuf *
 sctp_add_cookie(struct mbuf *init, int init_offset,
     struct mbuf *initack, int initack_offset, struct sctp_state_cookie *stc_in, uint8_t **signature)
 {
 	struct mbuf *mret, *copy_init, *copy_initack, *sig, *m_at;
 	struct sctp_paramhdr *ph;
 	struct sctp_state_cookie *stc;
 	uint16_t cookie_sz;
 
 	mret = sctp_get_mbuf_for_msg((sizeof(struct sctp_state_cookie) +
 	    sizeof(struct sctp_paramhdr)), 0,
 	    M_NOWAIT, 1, MT_DATA);
 	if (mret == NULL) {
 		return (NULL);
 	}
 	copy_init = SCTP_M_COPYM(init, init_offset, M_COPYALL, M_NOWAIT);
 	if (copy_init == NULL) {
 		sctp_m_freem(mret);
 		return (NULL);
 	}
 #ifdef SCTP_MBUF_LOGGING
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 		sctp_log_mbc(copy_init, SCTP_MBUF_ICOPY);
 	}
 #endif
 	copy_initack = SCTP_M_COPYM(initack, initack_offset, M_COPYALL,
 	    M_NOWAIT);
 	if (copy_initack == NULL) {
 		sctp_m_freem(mret);
 		sctp_m_freem(copy_init);
 		return (NULL);
 	}
 #ifdef SCTP_MBUF_LOGGING
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 		sctp_log_mbc(copy_initack, SCTP_MBUF_ICOPY);
 	}
 #endif
 
 	/* The head mbuf carries the parameter header and the cookie itself. */
 	SCTP_BUF_LEN(mret) = sizeof(struct sctp_state_cookie) +
 	    sizeof(struct sctp_paramhdr);
 	ph = mtod(mret, struct sctp_paramhdr *);
 	ph->param_type = htons(SCTP_STATE_COOKIE);
 	ph->param_length = 0;	/* fill in at the end */
 	stc = (struct sctp_state_cookie *)(ph + 1);
 	memcpy(stc, stc_in, sizeof(struct sctp_state_cookie));
 
 	/* Tack the INIT and then the INIT-ACK onto the end of the chain. */
 	m_at = mret;
 	while (SCTP_BUF_NEXT(m_at) != NULL) {
 		m_at = SCTP_BUF_NEXT(m_at);
 	}
 	SCTP_BUF_NEXT(m_at) = copy_init;
 	m_at = copy_init;
 	while (SCTP_BUF_NEXT(m_at) != NULL) {
 		m_at = SCTP_BUF_NEXT(m_at);
 	}
 	SCTP_BUF_NEXT(m_at) = copy_initack;
 
 	/*
 	 * Add up the length of everything chained so far; the walk ends with
 	 * m_at on the last mbuf, which is where the signature gets attached.
 	 */
 	cookie_sz = 0;
 	m_at = mret;
 	for (;;) {
 		cookie_sz += SCTP_BUF_LEN(m_at);
 		if (SCTP_BUF_NEXT(m_at) == NULL) {
 			break;
 		}
 		m_at = SCTP_BUF_NEXT(m_at);
 	}
 
 	sig = sctp_get_mbuf_for_msg(SCTP_SIGNATURE_SIZE, 0, M_NOWAIT, 1, MT_DATA);
 	if (sig == NULL) {
 		/* no space, so free the entire chain */
 		sctp_m_freem(mret);
 		return (NULL);
 	}
 	SCTP_BUF_LEN(sig) = SCTP_SIGNATURE_SIZE;
 	SCTP_BUF_NEXT(m_at) = sig;
 	cookie_sz += SCTP_SIGNATURE_SIZE;
 	ph->param_length = htons(cookie_sz);
 
 	/* Hand back the zeroed signature area. */
 	*signature = (uint8_t *)mtod(sig, caddr_t);
 	memset(*signature, 0, SCTP_SIGNATURE_SIZE);
 	return (mret);
 }
 
 /*
  * Return the ECT bits for an outgoing packet: SCTP_ECT0_BIT when an
  * association is given and its ecn_supported flag is 1, otherwise 0.
  * stcb may be NULL.
  */
 static uint8_t
 sctp_get_ect(struct sctp_tcb *stcb)
 {
 	if ((stcb == NULL) || (stcb->asoc.ecn_supported != 1)) {
 		return (0);
 	}
 	return (SCTP_ECT0_BIT);
 }
 
 #if defined(INET) || defined(INET6)
 /*
  * Bookkeeping for a packet that was dropped because no valid source address
  * was available for destination net.
  *
  * With an association present, a net that is both confirmed and reachable
  * is reported to the ULP with SCTP_NOTIFY_INTERFACE_DOWN and has its
  * SCTP_ADDR_REACHABLE and SCTP_ADDR_PF bits cleared.  If net is the primary
  * destination and sctp_find_alternate_net() returns a different net, that
  * net becomes the association's alternate (its reference count is raised
  * and a previous alternate is released) and the source address cached in
  * net is dropped.
  *
  * Both stcb and net may be NULL; without net only the debug message is
  * emitted.
  */
 static void
 sctp_handle_no_route(struct sctp_tcb *stcb,
     struct sctp_nets *net,
     int so_locked)
 {
 	struct sctp_nets *alt;
 
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "dropped packet - no valid source addr\n");
 
 	if (net == NULL) {
 		return;
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "Destination was ");
 	SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT1, &net->ro._l_addr.sa);
 
 	/* Everything below needs the association. */
 	if (stcb == NULL) {
 		return;
 	}
 	if ((net->dest_state & SCTP_ADDR_CONFIRMED) &&
 	    (net->dest_state & SCTP_ADDR_REACHABLE)) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT1, "no route takes interface %p down\n", (void *)net);
 		sctp_ulp_notify(SCTP_NOTIFY_INTERFACE_DOWN,
 		    stcb, 0,
 		    (void *)net,
 		    so_locked);
 		net->dest_state &= ~SCTP_ADDR_REACHABLE;
 		net->dest_state &= ~SCTP_ADDR_PF;
 	}
 	if (net != stcb->asoc.primary_destination) {
 		return;
 	}
 
 	/* need a new primary */
 	alt = sctp_find_alternate_net(stcb, net, 0);
 	if (alt == net) {
 		/* Nothing else to switch to. */
 		return;
 	}
 	if (stcb->asoc.alternate) {
 		sctp_free_remote_addr(stcb->asoc.alternate);
 	}
 	stcb->asoc.alternate = alt;
 	atomic_add_int(&stcb->asoc.alternate->ref_count, 1);
 	if (net->ro._s_addr) {
 		sctp_free_ifa(net->ro._s_addr);
 		net->ro._s_addr = NULL;
 	}
 	/* Force a fresh source address selection for this destination. */
 	net->src_addr_selected = 0;
 }
 #endif
 
 static int
 sctp_lowlevel_chunk_output(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,	/* may be NULL */
     struct sctp_nets *net,
     struct sockaddr *to,
     struct mbuf *m,
     uint32_t auth_offset,
     struct sctp_auth_chunk *auth,
     uint16_t auth_keyid,
     int nofragment_flag,
     int ecn_ok,
     int out_of_asoc_ok,
     uint16_t src_port,
     uint16_t dest_port,
     uint32_t v_tag,
     uint16_t port,
     union sctp_sockstore *over_addr,
     uint8_t mflowtype, uint32_t mflowid,
     bool use_zero_crc,
     int so_locked)
 {
 /* nofragment_flag to tell if IP_DF should be set (IPv4 only) */
 	/**
 	 * Given a mbuf chain (via SCTP_BUF_NEXT()) that holds a packet header
 	 * WITH an SCTPHDR but no IP header, endpoint inp and sa structure:
 	 * - fill in the HMAC digest of any AUTH chunk in the packet.
 	 * - calculate and fill in the SCTP checksum.
 	 * - prepend an IP address header.
 	 * - if boundall use INADDR_ANY.
 	 * - if boundspecific do source address selection.
 	 * - set fragmentation option for ipV4.
 	 * - On return from IP output, check/adjust mtu size of output
 	 *   interface and smallest_mtu size as well.
 	 */
 	/* Will need ifdefs around this */
 	struct mbuf *newm;
 	struct sctphdr *sctphdr;
 	int packet_length;
 	int ret;
 #if defined(INET) || defined(INET6)
 	uint32_t vrf_id;
 #endif
 #if defined(INET) || defined(INET6)
 	struct mbuf *o_pak;
 	sctp_route_t *ro = NULL;
 	struct udphdr *udp = NULL;
 #endif
 	uint8_t tos_value;
 
 	if ((net) && (net->dest_state & SCTP_ADDR_OUT_OF_SCOPE)) {
 		SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, net, SCTP_FROM_SCTP_OUTPUT, EFAULT);
 		sctp_m_freem(m);
 		return (EFAULT);
 	}
 #if defined(INET) || defined(INET6)
 	if (stcb) {
 		vrf_id = stcb->asoc.vrf_id;
 	} else {
 		vrf_id = inp->def_vrf_id;
 	}
 #endif
 	/* fill in the HMAC digest for any AUTH chunk in the packet */
 	if ((auth != NULL) && (stcb != NULL)) {
 		sctp_fill_hmac_digest_m(m, auth_offset, auth, stcb, auth_keyid);
 	}
 
 	if (net) {
 		tos_value = net->dscp;
 	} else if (stcb) {
 		tos_value = stcb->asoc.default_dscp;
 	} else {
 		tos_value = inp->sctp_ep.default_dscp;
 	}
 
 	switch (to->sa_family) {
 #ifdef INET
 	case AF_INET:
 		{
 			struct ip *ip = NULL;
 			sctp_route_t iproute;
 			int len;
 
 			len = SCTP_MIN_V4_OVERHEAD;
 			if (port) {
 				len += sizeof(struct udphdr);
 			}
 			newm = sctp_get_mbuf_for_msg(len, 1, M_NOWAIT, 1, MT_DATA);
 			if (newm == NULL) {
 				sctp_m_freem(m);
 				SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 				return (ENOMEM);
 			}
 			SCTP_ALIGN_TO_END(newm, len);
 			SCTP_BUF_LEN(newm) = len;
 			SCTP_BUF_NEXT(newm) = m;
 			m = newm;
 			if (net != NULL) {
 				m->m_pkthdr.flowid = net->flowid;
 				M_HASHTYPE_SET(m, net->flowtype);
 			} else {
 				m->m_pkthdr.flowid = mflowid;
 				M_HASHTYPE_SET(m, mflowtype);
 			}
 			packet_length = sctp_calculate_len(m);
 			ip = mtod(m, struct ip *);
 			ip->ip_v = IPVERSION;
 			ip->ip_hl = (sizeof(struct ip) >> 2);
 			if (tos_value == 0) {
 				/*
 				 * This means especially, that it is not set
 				 * at the SCTP layer. So use the value from
 				 * the IP layer.
 				 */
 				tos_value = inp->ip_inp.inp.inp_ip_tos;
 			}
 			tos_value &= 0xfc;
 			if (ecn_ok) {
 				tos_value |= sctp_get_ect(stcb);
 			}
 			if ((nofragment_flag) && (port == 0)) {
 				ip->ip_off = htons(IP_DF);
 			} else {
 				ip->ip_off = htons(0);
 			}
 			/* FreeBSD has a function for ip_id's */
 			ip_fillid(ip);
 
 			ip->ip_ttl = inp->ip_inp.inp.inp_ip_ttl;
 			ip->ip_len = htons(packet_length);
 			ip->ip_tos = tos_value;
 			if (port) {
 				ip->ip_p = IPPROTO_UDP;
 			} else {
 				ip->ip_p = IPPROTO_SCTP;
 			}
 			ip->ip_sum = 0;
 			if (net == NULL) {
 				ro = &iproute;
 				memset(&iproute, 0, sizeof(iproute));
 				memcpy(&ro->ro_dst, to, to->sa_len);
 			} else {
 				ro = (sctp_route_t *)&net->ro;
 			}
 			/* Now the address selection part */
 			ip->ip_dst.s_addr = ((struct sockaddr_in *)to)->sin_addr.s_addr;
 
 			/* call the routine to select the src address */
 			if (net && out_of_asoc_ok == 0) {
 				if (net->ro._s_addr && (net->ro._s_addr->localifa_flags & (SCTP_BEING_DELETED | SCTP_ADDR_IFA_UNUSEABLE))) {
 					sctp_free_ifa(net->ro._s_addr);
 					net->ro._s_addr = NULL;
 					net->src_addr_selected = 0;
 					RO_NHFREE(ro);
 				}
 				if (net->src_addr_selected == 0) {
 					/* Cache the source address */
 					net->ro._s_addr = sctp_source_address_selection(inp, stcb,
 					    ro, net, 0,
 					    vrf_id);
 					net->src_addr_selected = 1;
 				}
 				if (net->ro._s_addr == NULL) {
 					/* No route to host */
 					net->src_addr_selected = 0;
 					sctp_handle_no_route(stcb, net, so_locked);
 					SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 					sctp_m_freem(m);
 					return (EHOSTUNREACH);
 				}
 				ip->ip_src = net->ro._s_addr->address.sin.sin_addr;
 			} else {
 				if (over_addr == NULL) {
 					struct sctp_ifa *_lsrc;
 
 					_lsrc = sctp_source_address_selection(inp, stcb, ro,
 					    net,
 					    out_of_asoc_ok,
 					    vrf_id);
 					if (_lsrc == NULL) {
 						sctp_handle_no_route(stcb, net, so_locked);
 						SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 						sctp_m_freem(m);
 						return (EHOSTUNREACH);
 					}
 					ip->ip_src = _lsrc->address.sin.sin_addr;
 					sctp_free_ifa(_lsrc);
 				} else {
 					ip->ip_src = over_addr->sin.sin_addr;
 					SCTP_RTALLOC(ro, vrf_id, inp->fibnum);
 				}
 			}
 			if (port) {
 				if (htons(SCTP_BASE_SYSCTL(sctp_udp_tunneling_port)) == 0) {
 					sctp_handle_no_route(stcb, net, so_locked);
 					SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 					sctp_m_freem(m);
 					return (EHOSTUNREACH);
 				}
 				udp = (struct udphdr *)((caddr_t)ip + sizeof(struct ip));
 				udp->uh_sport = htons(SCTP_BASE_SYSCTL(sctp_udp_tunneling_port));
 				udp->uh_dport = port;
 				udp->uh_ulen = htons((uint16_t)(packet_length - sizeof(struct ip)));
 				if (V_udp_cksum) {
 					udp->uh_sum = in_pseudo(ip->ip_src.s_addr, ip->ip_dst.s_addr, udp->uh_ulen + htons(IPPROTO_UDP));
 				} else {
 					udp->uh_sum = 0;
 				}
 				sctphdr = (struct sctphdr *)((caddr_t)udp + sizeof(struct udphdr));
 			} else {
 				sctphdr = (struct sctphdr *)((caddr_t)ip + sizeof(struct ip));
 			}
 
 			sctphdr->src_port = src_port;
 			sctphdr->dest_port = dest_port;
 			sctphdr->v_tag = v_tag;
 			sctphdr->checksum = 0;
 
 			/*
 			 * If source address selection fails and we find no
 			 * route then the ip_output should fail as well with
 			 * a NO_ROUTE_TO_HOST type error. We probably should
 			 * catch that somewhere and abort the association
 			 * right away (assuming this is an INIT being sent).
 			 */
 			if (ro->ro_nh == NULL) {
 				/*
 				 * src addr selection failed to find a route
 				 * (or valid source addr), so we can't get
 				 * there from here (yet)!
 				 */
 				sctp_handle_no_route(stcb, net, so_locked);
 				SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 				sctp_m_freem(m);
 				return (EHOSTUNREACH);
 			}
 			if (ro != &iproute) {
 				memcpy(&iproute, ro, sizeof(*ro));
 			}
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "Calling ipv4 output routine from low level src addr:%x\n",
 			    (uint32_t)(ntohl(ip->ip_src.s_addr)));
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "Destination is %x\n",
 			    (uint32_t)(ntohl(ip->ip_dst.s_addr)));
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "RTP route is %p through\n",
 			    (void *)ro->ro_nh);
 
 			if (SCTP_GET_HEADER_FOR_OUTPUT(o_pak)) {
 				/* failed to prepend data, give up */
 				SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 				sctp_m_freem(m);
 				return (ENOMEM);
 			}
 			SCTP_ATTACH_CHAIN(o_pak, m, packet_length);
 			if (port) {
 				if (use_zero_crc) {
 					SCTP_STAT_INCR(sctps_sendzerocrc);
 				} else {
 					sctphdr->checksum = sctp_calculate_cksum(m, sizeof(struct ip) + sizeof(struct udphdr));
 					SCTP_STAT_INCR(sctps_sendswcrc);
 				}
 				if (V_udp_cksum) {
 					SCTP_ENABLE_UDP_CSUM(o_pak);
 				}
 			} else {
 				if (use_zero_crc) {
 					SCTP_STAT_INCR(sctps_sendzerocrc);
 				} else {
 					m->m_pkthdr.csum_flags = CSUM_SCTP;
 					m->m_pkthdr.csum_data = offsetof(struct sctphdr, checksum);
 					SCTP_STAT_INCR(sctps_sendhwcrc);
 				}
 			}
 #ifdef SCTP_PACKET_LOGGING
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LAST_PACKET_TRACING)
 				sctp_packet_log(o_pak);
 #endif
 			/* send it out.  table id is taken from stcb */
 			SCTP_PROBE5(send, NULL, stcb, ip, stcb, sctphdr);
 			SCTP_IP_OUTPUT(ret, o_pak, ro, inp, vrf_id);
 			if (port) {
 				UDPSTAT_INC(udps_opackets);
 			}
 			SCTP_STAT_INCR(sctps_sendpackets);
 			SCTP_STAT_INCR_COUNTER64(sctps_outpackets);
 			if (ret)
 				SCTP_STAT_INCR(sctps_senderrors);
 
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "IP output returns %d\n", ret);
 			if (net == NULL) {
 				/* free tempy routes */
 				RO_NHFREE(ro);
 			} else {
 				if ((ro->ro_nh != NULL) && (net->ro._s_addr) &&
 				    ((net->dest_state & SCTP_ADDR_NO_PMTUD) == 0)) {
 					uint32_t mtu;
 
 					mtu = SCTP_GATHER_MTU_FROM_ROUTE(net->ro._s_addr, &net->ro._l_addr.sa, ro->ro_nh);
 					if (mtu > 0) {
 						if (net->port) {
 							mtu -= sizeof(struct udphdr);
 						}
 						if (mtu < net->mtu) {
 							net->mtu = mtu;
 							if ((stcb != NULL) && (stcb->asoc.smallest_mtu > mtu)) {
 								sctp_pathmtu_adjustment(stcb, mtu, true);
 							}
 						}
 					}
 				} else if (ro->ro_nh == NULL) {
 					/* route was freed */
 					if (net->ro._s_addr &&
 					    net->src_addr_selected) {
 						sctp_free_ifa(net->ro._s_addr);
 						net->ro._s_addr = NULL;
 					}
 					net->src_addr_selected = 0;
 				}
 			}
 			return (ret);
 		}
 #endif
 #ifdef INET6
 	case AF_INET6:
 		{
 			uint32_t flowlabel, flowinfo;
 			struct ip6_hdr *ip6h;
 			struct route_in6 ip6route;
 			struct ifnet *ifp;
 			struct sockaddr_in6 *sin6, tmp, *lsa6, lsa6_tmp;
 			int prev_scope = 0;
 			struct sockaddr_in6 lsa6_storage;
 			int error;
 			u_short prev_port = 0;
 			int len;
 
 			if (net) {
 				flowlabel = net->flowlabel;
 			} else if (stcb) {
 				flowlabel = stcb->asoc.default_flowlabel;
 			} else {
 				flowlabel = inp->sctp_ep.default_flowlabel;
 			}
 			if (flowlabel == 0) {
 				/*
 				 * This means especially, that it is not set
 				 * at the SCTP layer. So use the value from
 				 * the IP layer.
 				 */
 				flowlabel = ntohl(((struct inpcb *)inp)->inp_flow);
 			}
 			flowlabel &= 0x000fffff;
 			len = SCTP_MIN_OVERHEAD;
 			if (port) {
 				len += sizeof(struct udphdr);
 			}
 			newm = sctp_get_mbuf_for_msg(len, 1, M_NOWAIT, 1, MT_DATA);
 			if (newm == NULL) {
 				sctp_m_freem(m);
 				SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 				return (ENOMEM);
 			}
 			SCTP_ALIGN_TO_END(newm, len);
 			SCTP_BUF_LEN(newm) = len;
 			SCTP_BUF_NEXT(newm) = m;
 			m = newm;
 			if (net != NULL) {
 				m->m_pkthdr.flowid = net->flowid;
 				M_HASHTYPE_SET(m, net->flowtype);
 			} else {
 				m->m_pkthdr.flowid = mflowid;
 				M_HASHTYPE_SET(m, mflowtype);
 			}
 			packet_length = sctp_calculate_len(m);
 
 			ip6h = mtod(m, struct ip6_hdr *);
 			/* protect *sin6 from overwrite */
 			sin6 = (struct sockaddr_in6 *)to;
 			tmp = *sin6;
 			sin6 = &tmp;
 
 			/* KAME hack: embed scopeid */
 			if (sa6_embedscope(sin6, MODULE_GLOBAL(ip6_use_defzone)) != 0) {
 				SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, net, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 				sctp_m_freem(m);
 				return (EINVAL);
 			}
 			if (net == NULL) {
 				memset(&ip6route, 0, sizeof(ip6route));
 				ro = (sctp_route_t *)&ip6route;
 				memcpy(&ro->ro_dst, sin6, sin6->sin6_len);
 			} else {
 				ro = (sctp_route_t *)&net->ro;
 			}
 			/*
 			 * We assume here that inp_flow is in host byte
 			 * order within the TCB!
 			 */
 			if (tos_value == 0) {
 				/*
 				 * This means especially, that it is not set
 				 * at the SCTP layer. So use the value from
 				 * the IP layer.
 				 */
 				tos_value = (ntohl(((struct inpcb *)inp)->inp_flow) >> 20) & 0xff;
 			}
 			tos_value &= 0xfc;
 			if (ecn_ok) {
 				tos_value |= sctp_get_ect(stcb);
 			}
 			flowinfo = 0x06;
 			flowinfo <<= 8;
 			flowinfo |= tos_value;
 			flowinfo <<= 20;
 			flowinfo |= flowlabel;
 			ip6h->ip6_flow = htonl(flowinfo);
 			if (port) {
 				ip6h->ip6_nxt = IPPROTO_UDP;
 			} else {
 				ip6h->ip6_nxt = IPPROTO_SCTP;
 			}
 			ip6h->ip6_plen = htons((uint16_t)(packet_length - sizeof(struct ip6_hdr)));
 			ip6h->ip6_dst = sin6->sin6_addr;
 
 			/*
 			 * Add SRC address selection here: we can only reuse
 			 * to a limited degree the kame src-addr-sel, since
 			 * we can try their selection but it may not be
 			 * bound.
 			 */
 			memset(&lsa6_tmp, 0, sizeof(lsa6_tmp));
 			lsa6_tmp.sin6_family = AF_INET6;
 			lsa6_tmp.sin6_len = sizeof(lsa6_tmp);
 			lsa6 = &lsa6_tmp;
 			if (net && out_of_asoc_ok == 0) {
 				if (net->ro._s_addr && (net->ro._s_addr->localifa_flags & (SCTP_BEING_DELETED | SCTP_ADDR_IFA_UNUSEABLE))) {
 					sctp_free_ifa(net->ro._s_addr);
 					net->ro._s_addr = NULL;
 					net->src_addr_selected = 0;
 					RO_NHFREE(ro);
 				}
 				if (net->src_addr_selected == 0) {
 					sin6 = (struct sockaddr_in6 *)&net->ro._l_addr;
 					/* KAME hack: embed scopeid */
 					if (sa6_embedscope(sin6, MODULE_GLOBAL(ip6_use_defzone)) != 0) {
 						SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, net, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 						sctp_m_freem(m);
 						return (EINVAL);
 					}
 					/* Cache the source address */
 					net->ro._s_addr = sctp_source_address_selection(inp,
 					    stcb,
 					    ro,
 					    net,
 					    0,
 					    vrf_id);
 					(void)sa6_recoverscope(sin6);
 					net->src_addr_selected = 1;
 				}
 				if (net->ro._s_addr == NULL) {
 					SCTPDBG(SCTP_DEBUG_OUTPUT3, "V6:No route to host\n");
 					net->src_addr_selected = 0;
 					sctp_handle_no_route(stcb, net, so_locked);
 					SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 					sctp_m_freem(m);
 					return (EHOSTUNREACH);
 				}
 				lsa6->sin6_addr = net->ro._s_addr->address.sin6.sin6_addr;
 			} else {
 				sin6 = (struct sockaddr_in6 *)&ro->ro_dst;
 				/* KAME hack: embed scopeid */
 				if (sa6_embedscope(sin6, MODULE_GLOBAL(ip6_use_defzone)) != 0) {
 					SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, net, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 					sctp_m_freem(m);
 					return (EINVAL);
 				}
 				if (over_addr == NULL) {
 					struct sctp_ifa *_lsrc;
 
 					_lsrc = sctp_source_address_selection(inp, stcb, ro,
 					    net,
 					    out_of_asoc_ok,
 					    vrf_id);
 					if (_lsrc == NULL) {
 						sctp_handle_no_route(stcb, net, so_locked);
 						SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 						sctp_m_freem(m);
 						return (EHOSTUNREACH);
 					}
 					lsa6->sin6_addr = _lsrc->address.sin6.sin6_addr;
 					sctp_free_ifa(_lsrc);
 				} else {
 					lsa6->sin6_addr = over_addr->sin6.sin6_addr;
 					SCTP_RTALLOC(ro, vrf_id, inp->fibnum);
 				}
 				(void)sa6_recoverscope(sin6);
 			}
 			lsa6->sin6_port = inp->sctp_lport;
 
 			if (ro->ro_nh == NULL) {
 				/*
 				 * src addr selection failed to find a route
 				 * (or valid source addr), so we can't get
 				 * there from here!
 				 */
 				sctp_handle_no_route(stcb, net, so_locked);
 				SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 				sctp_m_freem(m);
 				return (EHOSTUNREACH);
 			}
 			/*
 			 * XXX: sa6 may not have a valid sin6_scope_id in
 			 * the non-SCOPEDROUTING case.
 			 */
 			memset(&lsa6_storage, 0, sizeof(lsa6_storage));
 			lsa6_storage.sin6_family = AF_INET6;
 			lsa6_storage.sin6_len = sizeof(lsa6_storage);
 			lsa6_storage.sin6_addr = lsa6->sin6_addr;
 			if ((error = sa6_recoverscope(&lsa6_storage)) != 0) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT3, "recover scope fails error %d\n", error);
 				sctp_m_freem(m);
 				return (error);
 			}
 			/* XXX */
 			lsa6_storage.sin6_addr = lsa6->sin6_addr;
 			lsa6_storage.sin6_port = inp->sctp_lport;
 			lsa6 = &lsa6_storage;
 			ip6h->ip6_src = lsa6->sin6_addr;
 
 			if (port) {
 				if (htons(SCTP_BASE_SYSCTL(sctp_udp_tunneling_port)) == 0) {
 					sctp_handle_no_route(stcb, net, so_locked);
 					SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EHOSTUNREACH);
 					sctp_m_freem(m);
 					return (EHOSTUNREACH);
 				}
 				udp = (struct udphdr *)((caddr_t)ip6h + sizeof(struct ip6_hdr));
 				udp->uh_sport = htons(SCTP_BASE_SYSCTL(sctp_udp_tunneling_port));
 				udp->uh_dport = port;
 				udp->uh_ulen = htons((uint16_t)(packet_length - sizeof(struct ip6_hdr)));
 				udp->uh_sum = 0;
 				sctphdr = (struct sctphdr *)((caddr_t)udp + sizeof(struct udphdr));
 			} else {
 				sctphdr = (struct sctphdr *)((caddr_t)ip6h + sizeof(struct ip6_hdr));
 			}
 
 			sctphdr->src_port = src_port;
 			sctphdr->dest_port = dest_port;
 			sctphdr->v_tag = v_tag;
 			sctphdr->checksum = 0;
 
 			/*
 			 * We set the hop limit now since there is a good
 			 * chance that our ro pointer is now filled
 			 */
 			ip6h->ip6_hlim = SCTP_GET_HLIM(inp, ro);
 			ifp = SCTP_GET_IFN_VOID_FROM_ROUTE(ro);
 
 #ifdef SCTP_DEBUG
 			/* Copy to be sure something bad is not happening */
 			sin6->sin6_addr = ip6h->ip6_dst;
 			lsa6->sin6_addr = ip6h->ip6_src;
 #endif
 
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "Calling ipv6 output routine from low level\n");
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "src: ");
 			SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT3, (struct sockaddr *)lsa6);
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "dst: ");
 			SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT3, (struct sockaddr *)sin6);
 			if (net) {
 				sin6 = (struct sockaddr_in6 *)&net->ro._l_addr;
 				/*
 				 * preserve the port and scope for link
 				 * local send
 				 */
 				prev_scope = sin6->sin6_scope_id;
 				prev_port = sin6->sin6_port;
 			}
 
 			if (SCTP_GET_HEADER_FOR_OUTPUT(o_pak)) {
 				/* failed to prepend data, give up */
 				sctp_m_freem(m);
 				SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 				return (ENOMEM);
 			}
 			SCTP_ATTACH_CHAIN(o_pak, m, packet_length);
 			if (port) {
 				sctphdr->checksum = sctp_calculate_cksum(m, sizeof(struct ip6_hdr) + sizeof(struct udphdr));
 				SCTP_STAT_INCR(sctps_sendswcrc);
 				if ((udp->uh_sum = in6_cksum(o_pak, IPPROTO_UDP, sizeof(struct ip6_hdr), packet_length - sizeof(struct ip6_hdr))) == 0) {
 					udp->uh_sum = 0xffff;
 				}
 			} else {
 				m->m_pkthdr.csum_flags = CSUM_SCTP_IPV6;
 				m->m_pkthdr.csum_data = offsetof(struct sctphdr, checksum);
 				SCTP_STAT_INCR(sctps_sendhwcrc);
 			}
 			/* send it out. table id is taken from stcb */
 #ifdef SCTP_PACKET_LOGGING
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LAST_PACKET_TRACING)
 				sctp_packet_log(o_pak);
 #endif
 			SCTP_PROBE5(send, NULL, stcb, ip6h, stcb, sctphdr);
 			SCTP_IP6_OUTPUT(ret, o_pak, (struct route_in6 *)ro, &ifp, inp, vrf_id);
 			if (net) {
 				/* for link local this must be done */
 				sin6->sin6_scope_id = prev_scope;
 				sin6->sin6_port = prev_port;
 			}
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "return from send is %d\n", ret);
 			if (port) {
 				UDPSTAT_INC(udps_opackets);
 			}
 			SCTP_STAT_INCR(sctps_sendpackets);
 			SCTP_STAT_INCR_COUNTER64(sctps_outpackets);
 			if (ret) {
 				SCTP_STAT_INCR(sctps_senderrors);
 			}
 			if (net == NULL) {
 				/* Now if we had a temp route free it */
 				RO_NHFREE(ro);
 			} else {
 				/*
 				 * PMTU check versus smallest asoc MTU goes
 				 * here
 				 */
 				if (ro->ro_nh == NULL) {
 					/* Route was freed */
 					if (net->ro._s_addr &&
 					    net->src_addr_selected) {
 						sctp_free_ifa(net->ro._s_addr);
 						net->ro._s_addr = NULL;
 					}
 					net->src_addr_selected = 0;
 				}
 				if ((ro->ro_nh != NULL) && (net->ro._s_addr) &&
 				    ((net->dest_state & SCTP_ADDR_NO_PMTUD) == 0)) {
 					uint32_t mtu;
 
 					mtu = SCTP_GATHER_MTU_FROM_ROUTE(net->ro._s_addr, &net->ro._l_addr.sa, ro->ro_nh);
 					if (mtu > 0) {
 						if (net->port) {
 							mtu -= sizeof(struct udphdr);
 						}
 						if (mtu < net->mtu) {
 							net->mtu = mtu;
 							if ((stcb != NULL) && (stcb->asoc.smallest_mtu > mtu)) {
 								sctp_pathmtu_adjustment(stcb, mtu, false);
 							}
 						}
 					}
 				} else if (ifp != NULL) {
 					if ((ND_IFINFO(ifp)->linkmtu > 0) &&
 					    (stcb->asoc.smallest_mtu > ND_IFINFO(ifp)->linkmtu)) {
 						sctp_pathmtu_adjustment(stcb, ND_IFINFO(ifp)->linkmtu, false);
 					}
 				}
 			}
 			return (ret);
 		}
 #endif
 	default:
 		SCTPDBG(SCTP_DEBUG_OUTPUT1, "Unknown protocol (TSNH) type %d\n",
 		    ((struct sockaddr *)to)->sa_family);
 		sctp_m_freem(m);
 		SCTP_LTRACE_ERR_RET_PKT(m, inp, stcb, net, SCTP_FROM_SCTP_OUTPUT, EFAULT);
 		return (EFAULT);
 	}
 }
 
 void
 sctp_send_initiate(struct sctp_inpcb *inp, struct sctp_tcb *stcb, int so_locked)
 {
 	struct mbuf *m, *m_last;
 	struct sctp_nets *net;
 	struct sctp_init_chunk *init;
 	struct sctp_supported_addr_param *sup_addr;
 	struct sctp_adaptation_layer_indication *ali;
 	struct sctp_supported_chunk_types_param *pr_supported;
 	struct sctp_paramhdr *ph;
 	int cnt_inits_to = 0;
 	int error;
 	uint16_t num_ext, chunk_len, padding_len, parameter_len;
 
 	/* INIT's always go to the primary (and usually ONLY address) */
 	net = stcb->asoc.primary_destination;
 	if (net == NULL) {
 		net = TAILQ_FIRST(&stcb->asoc.nets);
 		if (net == NULL) {
 			/* TSNH */
 			return;
 		}
 		/* we confirm any address we send an INIT to */
 		net->dest_state &= ~SCTP_ADDR_UNCONFIRMED;
 		(void)sctp_set_primary_addr(stcb, NULL, net);
 	} else {
 		/* we confirm any address we send an INIT to */
 		net->dest_state &= ~SCTP_ADDR_UNCONFIRMED;
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT4, "Sending INIT\n");
 #ifdef INET6
 	if (net->ro._l_addr.sa.sa_family == AF_INET6) {
 		/*
 		 * special hook, if we are sending to link local it will not
 		 * show up in our private address count.
 		 */
 		if (IN6_IS_ADDR_LINKLOCAL(&net->ro._l_addr.sin6.sin6_addr))
 			cnt_inits_to = 1;
 	}
 #endif
 	if (SCTP_OS_TIMER_PENDING(&net->rxt_timer.timer)) {
 		/* This case should not happen */
 		SCTPDBG(SCTP_DEBUG_OUTPUT4, "Sending INIT - failed timer?\n");
 		return;
 	}
 	/* start the INIT timer */
 	sctp_timer_start(SCTP_TIMER_TYPE_INIT, inp, stcb, net);
 
 	m = sctp_get_mbuf_for_msg(MCLBYTES, 1, M_NOWAIT, 1, MT_DATA);
 	if (m == NULL) {
 		/* No memory, INIT timer will re-attempt. */
 		SCTPDBG(SCTP_DEBUG_OUTPUT4, "Sending INIT - mbuf?\n");
 		return;
 	}
 	chunk_len = (uint16_t)sizeof(struct sctp_init_chunk);
 	padding_len = 0;
 	/* Now lets put the chunk header in place */
 	init = mtod(m, struct sctp_init_chunk *);
 	/* now the chunk header */
 	init->ch.chunk_type = SCTP_INITIATION;
 	init->ch.chunk_flags = 0;
 	/* fill in later from mbuf we build */
 	init->ch.chunk_length = 0;
 	/* place in my tag */
 	init->init.initiate_tag = htonl(stcb->asoc.my_vtag);
 	/* set up some of the credits. */
 	init->init.a_rwnd = htonl(max(inp->sctp_socket ? SCTP_SB_LIMIT_RCV(inp->sctp_socket) : 0,
 	    SCTP_MINIMAL_RWND));
 	init->init.num_outbound_streams = htons(stcb->asoc.pre_open_streams);
 	init->init.num_inbound_streams = htons(stcb->asoc.max_inbound_streams);
 	init->init.initial_tsn = htonl(stcb->asoc.init_seq_number);
 
 	/* Adaptation layer indication parameter */
 	if (inp->sctp_ep.adaptation_layer_indicator_provided) {
 		parameter_len = (uint16_t)sizeof(struct sctp_adaptation_layer_indication);
 		ali = (struct sctp_adaptation_layer_indication *)(mtod(m, caddr_t)+chunk_len);
 		ali->ph.param_type = htons(SCTP_ULP_ADAPTATION);
 		ali->ph.param_length = htons(parameter_len);
 		ali->indication = htonl(inp->sctp_ep.adaptation_layer_indicator);
 		chunk_len += parameter_len;
 	}
 
 	/* ECN parameter */
 	if (stcb->asoc.ecn_supported == 1) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_ECN_CAPABLE);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* PR-SCTP supported parameter */
 	if (stcb->asoc.prsctp_supported == 1) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_PRSCTP_SUPPORTED);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* Zero checksum acceptable parameter */
 	if (stcb->asoc.zero_checksum > 0) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_ZERO_CHECKSUM_ACCEPTABLE);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* Add NAT friendly parameter. */
 	if (SCTP_BASE_SYSCTL(sctp_inits_include_nat_friendly)) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_HAS_NAT_SUPPORT);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* And now tell the peer which extensions we support */
 	num_ext = 0;
 	pr_supported = (struct sctp_supported_chunk_types_param *)(mtod(m, caddr_t)+chunk_len);
 	if (stcb->asoc.prsctp_supported == 1) {
 		pr_supported->chunk_types[num_ext++] = SCTP_FORWARD_CUM_TSN;
 		if (stcb->asoc.idata_supported) {
 			pr_supported->chunk_types[num_ext++] = SCTP_IFORWARD_CUM_TSN;
 		}
 	}
 	if (stcb->asoc.auth_supported == 1) {
 		pr_supported->chunk_types[num_ext++] = SCTP_AUTHENTICATION;
 	}
 	if (stcb->asoc.asconf_supported == 1) {
 		pr_supported->chunk_types[num_ext++] = SCTP_ASCONF;
 		pr_supported->chunk_types[num_ext++] = SCTP_ASCONF_ACK;
 	}
 	if (stcb->asoc.reconfig_supported == 1) {
 		pr_supported->chunk_types[num_ext++] = SCTP_STREAM_RESET;
 	}
 	if (stcb->asoc.idata_supported) {
 		pr_supported->chunk_types[num_ext++] = SCTP_IDATA;
 	}
 	if (stcb->asoc.nrsack_supported == 1) {
 		pr_supported->chunk_types[num_ext++] = SCTP_NR_SELECTIVE_ACK;
 	}
 	if (stcb->asoc.pktdrop_supported == 1) {
 		pr_supported->chunk_types[num_ext++] = SCTP_PACKET_DROPPED;
 	}
 	if (num_ext > 0) {
 		parameter_len = (uint16_t)sizeof(struct sctp_supported_chunk_types_param) + num_ext;
 		pr_supported->ph.param_type = htons(SCTP_SUPPORTED_CHUNK_EXT);
 		pr_supported->ph.param_length = htons(parameter_len);
 		padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 		chunk_len += parameter_len;
 	}
 	/* add authentication parameters */
 	if (stcb->asoc.auth_supported) {
 		/* attach RANDOM parameter, if available */
 		if (stcb->asoc.authinfo.random != NULL) {
 			struct sctp_auth_random *randp;
 
 			if (padding_len > 0) {
 				memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 				chunk_len += padding_len;
 				padding_len = 0;
 			}
 			randp = (struct sctp_auth_random *)(mtod(m, caddr_t)+chunk_len);
 			parameter_len = (uint16_t)sizeof(struct sctp_auth_random) + stcb->asoc.authinfo.random_len;
 			/* random key already contains the header */
 			memcpy(randp, stcb->asoc.authinfo.random->key, parameter_len);
 			padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 			chunk_len += parameter_len;
 		}
 		/* add HMAC_ALGO parameter */
 		if (stcb->asoc.local_hmacs != NULL) {
 			struct sctp_auth_hmac_algo *hmacs;
 
 			if (padding_len > 0) {
 				memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 				chunk_len += padding_len;
 				padding_len = 0;
 			}
 			hmacs = (struct sctp_auth_hmac_algo *)(mtod(m, caddr_t)+chunk_len);
 			parameter_len = (uint16_t)(sizeof(struct sctp_auth_hmac_algo) +
 			    stcb->asoc.local_hmacs->num_algo * sizeof(uint16_t));
 			hmacs->ph.param_type = htons(SCTP_HMAC_LIST);
 			hmacs->ph.param_length = htons(parameter_len);
 			sctp_serialize_hmaclist(stcb->asoc.local_hmacs, (uint8_t *)hmacs->hmac_ids);
 			padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 			chunk_len += parameter_len;
 		}
 		/* add CHUNKS parameter */
 		if (stcb->asoc.local_auth_chunks != NULL) {
 			struct sctp_auth_chunk_list *chunks;
 
 			if (padding_len > 0) {
 				memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 				chunk_len += padding_len;
 				padding_len = 0;
 			}
 			chunks = (struct sctp_auth_chunk_list *)(mtod(m, caddr_t)+chunk_len);
 			parameter_len = (uint16_t)(sizeof(struct sctp_auth_chunk_list) +
 			    sctp_auth_get_chklist_size(stcb->asoc.local_auth_chunks));
 			chunks->ph.param_type = htons(SCTP_CHUNK_LIST);
 			chunks->ph.param_length = htons(parameter_len);
 			sctp_serialize_auth_chunks(stcb->asoc.local_auth_chunks, chunks->chunk_types);
 			padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 			chunk_len += parameter_len;
 		}
 	}
 
 	/* now any cookie time extensions */
 	if (stcb->asoc.cookie_preserve_req > 0) {
 		struct sctp_cookie_perserve_param *cookie_preserve;
 
 		if (padding_len > 0) {
 			memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 			chunk_len += padding_len;
 			padding_len = 0;
 		}
 		parameter_len = (uint16_t)sizeof(struct sctp_cookie_perserve_param);
 		cookie_preserve = (struct sctp_cookie_perserve_param *)(mtod(m, caddr_t)+chunk_len);
 		cookie_preserve->ph.param_type = htons(SCTP_COOKIE_PRESERVE);
 		cookie_preserve->ph.param_length = htons(parameter_len);
 		cookie_preserve->time = htonl(stcb->asoc.cookie_preserve_req);
 		stcb->asoc.cookie_preserve_req = 0;
 		chunk_len += parameter_len;
 	}
 
 	if (stcb->asoc.scope.ipv4_addr_legal || stcb->asoc.scope.ipv6_addr_legal) {
 		uint8_t i;
 
 		if (padding_len > 0) {
 			memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 			chunk_len += padding_len;
 			padding_len = 0;
 		}
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		if (stcb->asoc.scope.ipv4_addr_legal) {
 			parameter_len += (uint16_t)sizeof(uint16_t);
 		}
 		if (stcb->asoc.scope.ipv6_addr_legal) {
 			parameter_len += (uint16_t)sizeof(uint16_t);
 		}
 		sup_addr = (struct sctp_supported_addr_param *)(mtod(m, caddr_t)+chunk_len);
 		sup_addr->ph.param_type = htons(SCTP_SUPPORTED_ADDRTYPE);
 		sup_addr->ph.param_length = htons(parameter_len);
 		i = 0;
 		if (stcb->asoc.scope.ipv4_addr_legal) {
 			sup_addr->addr_type[i++] = htons(SCTP_IPV4_ADDRESS);
 		}
 		if (stcb->asoc.scope.ipv6_addr_legal) {
 			sup_addr->addr_type[i++] = htons(SCTP_IPV6_ADDRESS);
 		}
 		padding_len = 4 - 2 * i;
 		chunk_len += parameter_len;
 	}
 
 	SCTP_BUF_LEN(m) = chunk_len;
 	/* now the addresses */
 	/*
 	 * To optimize this we could put the scoping stuff into a structure
 	 * and remove the individual uint8's from the assoc structure. Then
 	 * we could just sifa in the address within the stcb. But for now
 	 * this is a quick hack to get the address stuff teased apart.
 	 */
 	m_last = sctp_add_addresses_to_i_ia(inp, stcb, &stcb->asoc.scope,
 	    m, cnt_inits_to,
 	    &padding_len, &chunk_len);
 
 	init->ch.chunk_length = htons(chunk_len);
 	if (padding_len > 0) {
 		if (sctp_add_pad_tombuf(m_last, padding_len) == NULL) {
 			sctp_m_freem(m);
 			return;
 		}
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT4, "Sending INIT - calls lowlevel_output\n");
 	if ((error = sctp_lowlevel_chunk_output(inp, stcb, net,
 	    (struct sockaddr *)&net->ro._l_addr,
 	    m, 0, NULL, 0, 0, 0, 0,
 	    inp->sctp_lport, stcb->rport, htonl(0),
 	    net->port, NULL,
 	    0, 0,
 	    false, so_locked))) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT4, "Gak send error %d\n", error);
 		if (error == ENOBUFS) {
 			stcb->asoc.ifp_had_enobuf = 1;
 			SCTP_STAT_INCR(sctps_lowlevelerr);
 		}
 	} else {
 		stcb->asoc.ifp_had_enobuf = 0;
 	}
 	SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 	(void)SCTP_GETTIME_TIMEVAL(&net->last_sent_time);
 }
 
 struct mbuf *
 sctp_arethere_unrecognized_parameters(struct mbuf *in_initpkt,
     int param_offset, int *abort_processing,
     struct sctp_chunkhdr *cp,
     int *nat_friendly,
     int *cookie_found)
 {
 	/*
 	 * Given a mbuf containing an INIT or INIT-ACK with the param_offset
 	 * being equal to the beginning of the params i.e. (iphlen +
 	 * sizeof(struct sctp_init_msg) parse through the parameters to the
 	 * end of the mbuf verifying that all parameters are known.
 	 *
 	 * For unknown parameters build and return a mbuf with
 	 * UNRECOGNIZED_PARAMETER errors. If the flags indicate to stop
 	 * processing this chunk stop, and set *abort_processing to 1.
 	 *
 	 * By having param_offset be pre-set to where parameters begin it is
 	 * hoped that this routine may be reused in the future by new
 	 * features.
 	 */
 	struct sctp_paramhdr *phdr, params;
 
 	struct mbuf *mat, *m_tmp, *op_err, *op_err_last;
 	int at, limit, pad_needed;
 	uint16_t ptype, plen, padded_size;
 
 	*abort_processing = 0;
 	if (cookie_found != NULL) {
 		*cookie_found = 0;
 	}
 	mat = in_initpkt;
 	limit = ntohs(cp->chunk_length) - sizeof(struct sctp_init_chunk);
 	at = param_offset;
 	op_err = NULL;
 	op_err_last = NULL;
 	pad_needed = 0;
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "Check for unrecognized param's\n");
 	phdr = sctp_get_next_param(mat, at, &params, sizeof(params));
 	while ((phdr != NULL) && ((size_t)limit >= sizeof(struct sctp_paramhdr))) {
 		ptype = ntohs(phdr->param_type);
 		plen = ntohs(phdr->param_length);
 		if ((plen > limit) || (plen < sizeof(struct sctp_paramhdr))) {
 			/* wacked parameter */
 			SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error %d\n", plen);
 			goto invalid_size;
 		}
 		limit -= SCTP_SIZE32(plen);
 		/*-
 		 * All parameters for all chunks that we know/understand are
 		 * listed here. We process them other places and make
 		 * appropriate stop actions per the upper bits. However this
 		 * is the generic routine processor's can call to get back
 		 * an operr.. to either incorporate (init-ack) or send.
 		 */
 		padded_size = SCTP_SIZE32(plen);
 		switch (ptype) {
 			/* Param's with variable size */
 		case SCTP_HEARTBEAT_INFO:
 		case SCTP_UNRECOG_PARAM:
 		case SCTP_ERROR_CAUSE_IND:
 			/* ok skip fwd */
 			at += padded_size;
 			break;
 		case SCTP_STATE_COOKIE:
 			if (cookie_found != NULL) {
 				*cookie_found = 1;
 			}
 			at += padded_size;
 			break;
 			/* Param's with variable size within a range */
 		case SCTP_CHUNK_LIST:
 		case SCTP_SUPPORTED_CHUNK_EXT:
 			if (padded_size > (sizeof(struct sctp_supported_chunk_types_param) + (sizeof(uint8_t) * SCTP_MAX_SUPPORTED_EXT))) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error chklist %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_SUPPORTED_ADDRTYPE:
 			if (padded_size > SCTP_MAX_ADDR_PARAMS_SIZE) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error supaddrtype %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_RANDOM:
 			if (padded_size > (sizeof(struct sctp_auth_random) + SCTP_RANDOM_MAX_SIZE)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error random %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_SET_PRIM_ADDR:
 		case SCTP_DEL_IP_ADDRESS:
 		case SCTP_ADD_IP_ADDRESS:
 			if ((padded_size != sizeof(struct sctp_asconf_addrv4_param)) &&
 			    (padded_size != sizeof(struct sctp_asconf_addr_param))) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error setprim %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 			/* Param's with a fixed size */
 		case SCTP_IPV4_ADDRESS:
 			if (padded_size != sizeof(struct sctp_ipv4addr_param)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error ipv4 addr %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_IPV6_ADDRESS:
 			if (padded_size != sizeof(struct sctp_ipv6addr_param)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error ipv6 addr %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_COOKIE_PRESERVE:
 			if (padded_size != sizeof(struct sctp_cookie_perserve_param)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error cookie-preserve %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_HAS_NAT_SUPPORT:
 			*nat_friendly = 1;
-			/* fall through */
+			/* FALLTHROUGH */
 		case SCTP_PRSCTP_SUPPORTED:
 			if (padded_size != sizeof(struct sctp_paramhdr)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error prsctp/nat support %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_ECN_CAPABLE:
 			if (padded_size != sizeof(struct sctp_paramhdr)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error ecn %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_ULP_ADAPTATION:
 			if (padded_size != sizeof(struct sctp_adaptation_layer_indication)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error adapatation %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_SUCCESS_REPORT:
 			if (padded_size != sizeof(struct sctp_asconf_paramhdr)) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Invalid size - error success %d\n", plen);
 				goto invalid_size;
 			}
 			at += padded_size;
 			break;
 		case SCTP_HOSTNAME_ADDRESS:
 			{
 				/* Hostname parameters are deprecated. */
 				struct sctp_gen_error_cause *cause;
 				int l_len;
 
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "Can't handle hostname addresses.. abort processing\n");
 				*abort_processing = 1;
 				sctp_m_freem(op_err);
 				op_err = NULL;
 				op_err_last = NULL;
 #ifdef INET6
 				l_len = SCTP_MIN_OVERHEAD;
 #else
 				l_len = SCTP_MIN_V4_OVERHEAD;
 #endif
 				l_len += sizeof(struct sctp_chunkhdr);
 				l_len += sizeof(struct sctp_gen_error_cause);
 				op_err = sctp_get_mbuf_for_msg(l_len, 0, M_NOWAIT, 1, MT_DATA);
 				if (op_err != NULL) {
 					/*
 					 * Pre-reserve space for IP, SCTP,
 					 * and chunk header.
 					 */
 #ifdef INET6
 					SCTP_BUF_RESV_UF(op_err, sizeof(struct ip6_hdr));
 #else
 					SCTP_BUF_RESV_UF(op_err, sizeof(struct ip));
 #endif
 					SCTP_BUF_RESV_UF(op_err, sizeof(struct sctphdr));
 					SCTP_BUF_RESV_UF(op_err, sizeof(struct sctp_chunkhdr));
 					SCTP_BUF_LEN(op_err) = sizeof(struct sctp_gen_error_cause);
 					cause = mtod(op_err, struct sctp_gen_error_cause *);
 					cause->code = htons(SCTP_CAUSE_UNRESOLVABLE_ADDR);
 					cause->length = htons((uint16_t)(sizeof(struct sctp_gen_error_cause) + plen));
 					SCTP_BUF_NEXT(op_err) = SCTP_M_COPYM(mat, at, plen, M_NOWAIT);
 					if (SCTP_BUF_NEXT(op_err) == NULL) {
 						sctp_m_freem(op_err);
 						op_err = NULL;
 						op_err_last = NULL;
 					}
 				}
 				return (op_err);
 			}
 		default:
 			/*
 			 * we do not recognize the parameter figure out what
 			 * we do.
 			 */
 			SCTPDBG(SCTP_DEBUG_OUTPUT1, "Hit default param %x\n", ptype);
 			if ((ptype & 0x4000) == 0x4000) {
 				/* Report bit is set?? */
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "report op err\n");
 				if (op_err == NULL) {
 					int l_len;
 
 					/* Ok need to try to get an mbuf */
 #ifdef INET6
 					l_len = SCTP_MIN_OVERHEAD;
 #else
 					l_len = SCTP_MIN_V4_OVERHEAD;
 #endif
 					l_len += sizeof(struct sctp_chunkhdr);
 					l_len += sizeof(struct sctp_paramhdr);
 					op_err = sctp_get_mbuf_for_msg(l_len, 0, M_NOWAIT, 1, MT_DATA);
 					if (op_err) {
 						SCTP_BUF_LEN(op_err) = 0;
 #ifdef INET6
 						SCTP_BUF_RESV_UF(op_err, sizeof(struct ip6_hdr));
 #else
 						SCTP_BUF_RESV_UF(op_err, sizeof(struct ip));
 #endif
 						SCTP_BUF_RESV_UF(op_err, sizeof(struct sctphdr));
 						SCTP_BUF_RESV_UF(op_err, sizeof(struct sctp_chunkhdr));
 						op_err_last = op_err;
 					}
 				}
 				if (op_err != NULL) {
 					/* If we have space */
 					struct sctp_paramhdr *param;
 
 					if (pad_needed > 0) {
 						op_err_last = sctp_add_pad_tombuf(op_err_last, pad_needed);
 					}
 					if (op_err_last == NULL) {
 						sctp_m_freem(op_err);
 						op_err = NULL;
 						op_err_last = NULL;
 						goto more_processing;
 					}
 					if (M_TRAILINGSPACE(op_err_last) < (int)sizeof(struct sctp_paramhdr)) {
 						m_tmp = sctp_get_mbuf_for_msg(sizeof(struct sctp_paramhdr), 0, M_NOWAIT, 1, MT_DATA);
 						if (m_tmp == NULL) {
 							sctp_m_freem(op_err);
 							op_err = NULL;
 							op_err_last = NULL;
 							goto more_processing;
 						}
 						SCTP_BUF_LEN(m_tmp) = 0;
 						SCTP_BUF_NEXT(m_tmp) = NULL;
 						SCTP_BUF_NEXT(op_err_last) = m_tmp;
 						op_err_last = m_tmp;
 					}
 					param = (struct sctp_paramhdr *)(mtod(op_err_last, caddr_t)+SCTP_BUF_LEN(op_err_last));
 					param->param_type = htons(SCTP_UNRECOG_PARAM);
 					param->param_length = htons((uint16_t)sizeof(struct sctp_paramhdr) + plen);
 					SCTP_BUF_LEN(op_err_last) += sizeof(struct sctp_paramhdr);
 					SCTP_BUF_NEXT(op_err_last) = SCTP_M_COPYM(mat, at, plen, M_NOWAIT);
 					if (SCTP_BUF_NEXT(op_err_last) == NULL) {
 						sctp_m_freem(op_err);
 						op_err = NULL;
 						op_err_last = NULL;
 						goto more_processing;
 					} else {
 						while (SCTP_BUF_NEXT(op_err_last) != NULL) {
 							op_err_last = SCTP_BUF_NEXT(op_err_last);
 						}
 					}
 					if (plen % 4 != 0) {
 						pad_needed = 4 - (plen % 4);
 					} else {
 						pad_needed = 0;
 					}
 				}
 			}
 	more_processing:
 			if ((ptype & 0x8000) == 0x0000) {
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "stop proc\n");
 				return (op_err);
 			} else {
 				/* skip this chunk and continue processing */
 				SCTPDBG(SCTP_DEBUG_OUTPUT1, "move on\n");
 				at += SCTP_SIZE32(plen);
 			}
 			break;
 		}
 		phdr = sctp_get_next_param(mat, at, &params, sizeof(params));
 	}
 	return (op_err);
 invalid_size:
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "abort flag set\n");
 	*abort_processing = 1;
 	sctp_m_freem(op_err);
 	op_err = NULL;
 	op_err_last = NULL;
 	if (phdr != NULL) {
 		struct sctp_paramhdr *param;
 		int l_len;
 #ifdef INET6
 		l_len = SCTP_MIN_OVERHEAD;
 #else
 		l_len = SCTP_MIN_V4_OVERHEAD;
 #endif
 		l_len += sizeof(struct sctp_chunkhdr);
 		l_len += (2 * sizeof(struct sctp_paramhdr));
 		op_err = sctp_get_mbuf_for_msg(l_len, 0, M_NOWAIT, 1, MT_DATA);
 		if (op_err) {
 			SCTP_BUF_LEN(op_err) = 0;
 #ifdef INET6
 			SCTP_BUF_RESV_UF(op_err, sizeof(struct ip6_hdr));
 #else
 			SCTP_BUF_RESV_UF(op_err, sizeof(struct ip));
 #endif
 			SCTP_BUF_RESV_UF(op_err, sizeof(struct sctphdr));
 			SCTP_BUF_RESV_UF(op_err, sizeof(struct sctp_chunkhdr));
 			SCTP_BUF_LEN(op_err) = 2 * sizeof(struct sctp_paramhdr);
 			param = mtod(op_err, struct sctp_paramhdr *);
 			param->param_type = htons(SCTP_CAUSE_PROTOCOL_VIOLATION);
 			param->param_length = htons(2 * sizeof(struct sctp_paramhdr));
 			param++;
 			param->param_type = htons(ptype);
 			param->param_length = htons(plen);
 		}
 	}
 	return (op_err);
 }
 
 /*
  * Given an INIT chunk, look through the parameters to verify that there
  * are no new addresses.
  * Return true, if there is a new address or there is a problem parsing
  * the parameters. Provide an optional error cause used when sending an ABORT.
  * Return false, if there are no new addresses and there is no problem in
  * parameter processing.
  */
 static bool
 sctp_are_there_new_addresses(struct sctp_association *asoc,
     struct mbuf *in_initpkt, int offset, int limit, struct sockaddr *src,
     struct mbuf **op_err)
 {
 	struct sctp_paramhdr *phdr, params;
 	struct sctp_nets *net;
 	struct sockaddr *candidate;
 	struct sockaddr *known;
 #ifdef INET
 	struct sockaddr_in sin4, *known4;
 #endif
 #ifdef INET6
 	struct sockaddr_in6 sin6, *known6;
 #endif
 	uint16_t ptype, plen;
 	bool matched, check_src;
 
 	/* No error cause is handed back unless a check below fails. */
 	*op_err = NULL;
 
 	/*
 	 * Scratch socket addresses: each address parameter found in the
 	 * INIT is copied into one of these before it is compared against
 	 * the addresses stored in asoc->nets.
 	 */
 #ifdef INET
 	memset(&sin4, 0, sizeof(sin4));
 	sin4.sin_len = sizeof(sin4);
 	sin4.sin_family = AF_INET;
 #endif
 #ifdef INET6
 	memset(&sin6, 0, sizeof(sin6));
 	sin6.sin6_len = sizeof(sin6);
 	sin6.sin6_family = AF_INET6;
 #endif
 
 	/*
 	 * Step 1: the source address of the packet. It is only compared
 	 * when its address family is marked legal in the association
 	 * scope; any other family is ignored here.
 	 */
 	check_src = false;
 #ifdef INET
 	if ((src->sa_family == AF_INET) && asoc->scope.ipv4_addr_legal) {
 		check_src = true;
 	}
 #endif
 #ifdef INET6
 	if ((src->sa_family == AF_INET6) && asoc->scope.ipv6_addr_legal) {
 		check_src = true;
 	}
 #endif
 	if (check_src) {
 		matched = false;
 		TAILQ_FOREACH(net, &asoc->nets, sctp_next) {
 			known = (struct sockaddr *)&net->ro._l_addr;
 			if (known->sa_family != src->sa_family) {
 				continue;
 			}
 #ifdef INET
 			if (known->sa_family == AF_INET) {
 				struct sockaddr_in *src4;
 
 				src4 = (struct sockaddr_in *)src;
 				known4 = (struct sockaddr_in *)known;
 				if (known4->sin_addr.s_addr == src4->sin_addr.s_addr) {
 					matched = true;
 					break;
 				}
 			}
 #endif
 #ifdef INET6
 			if (known->sa_family == AF_INET6) {
 				struct sockaddr_in6 *src6;
 
 				src6 = (struct sockaddr_in6 *)src;
 				known6 = (struct sockaddr_in6 *)known;
 				if (SCTP6_ARE_ADDR_EQUAL(known6, src6)) {
 					matched = true;
 					break;
 				}
 			}
 #endif
 		}
 		if (!matched) {
 			/*
 			 * The source is not a known address. The cause
 			 * built here uses the diag info code rather than
 			 * a new-address cause, so an ABORT carrying it
 			 * looks the same as if no listener was present.
 			 */
 			*op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code), "Address added");
 			return (true);
 		}
 	}
 
 	/*
 	 * Step 2: walk the parameters that follow the fixed INIT chunk
 	 * header. The walk ends when no further parameter header can be
 	 * fetched or when the running offset reaches limit.
 	 */
 	offset += sizeof(struct sctp_init_chunk);
 	for (phdr = sctp_get_next_param(in_initpkt, offset, &params, sizeof(params));
 	    phdr != NULL;
 	    phdr = sctp_get_next_param(in_initpkt, offset, &params, sizeof(params))) {
 		candidate = NULL;
 		ptype = ntohs(phdr->param_type);
 		plen = ntohs(phdr->param_length);
 		/* The parameter must lie completely inside the chunk ... */
 		if (offset + plen > limit) {
 			*op_err = sctp_generate_cause(SCTP_CAUSE_PROTOCOL_VIOLATION, "Partial parameter");
 			return (true);
 		}
 		/* ... and must be at least as long as its own header. */
 		if (plen < sizeof(struct sctp_paramhdr)) {
 			*op_err = sctp_generate_cause(SCTP_CAUSE_PROTOCOL_VIOLATION, "Parameter length too small");
 			return (true);
 		}
 		switch (ptype) {
 #ifdef INET
 		case SCTP_IPV4_ADDRESS:
 			{
 				struct sctp_ipv4addr_param v4_store;
 
 				if (plen != sizeof(struct sctp_ipv4addr_param)) {
 					*op_err = sctp_generate_cause(SCTP_CAUSE_PROTOCOL_VIOLATION, "Parameter length illegal");
 					return (true);
 				}
 				/* Fetch the whole parameter, not just its header. */
 				phdr = sctp_get_next_param(in_initpkt, offset,
 				    (struct sctp_paramhdr *)&v4_store, sizeof(v4_store));
 				if (phdr == NULL) {
 					*op_err = sctp_generate_cause(SCTP_CAUSE_PROTOCOL_VIOLATION, "");
 					return (true);
 				}
 				/* Addresses of a family out of scope are skipped. */
 				if (asoc->scope.ipv4_addr_legal) {
 					sin4.sin_addr.s_addr =
 					    ((struct sctp_ipv4addr_param *)phdr)->addr;
 					candidate = (struct sockaddr *)&sin4;
 				}
 				break;
 			}
 #endif
 #ifdef INET6
 		case SCTP_IPV6_ADDRESS:
 			{
 				struct sctp_ipv6addr_param *v6_param, v6_store;
 
 				if (plen != sizeof(struct sctp_ipv6addr_param)) {
 					*op_err = sctp_generate_cause(SCTP_CAUSE_PROTOCOL_VIOLATION, "Parameter length illegal");
 					return (true);
 				}
 				/* Fetch the whole parameter, not just its header. */
 				phdr = sctp_get_next_param(in_initpkt, offset,
 				    (struct sctp_paramhdr *)&v6_store, sizeof(v6_store));
 				if (phdr == NULL) {
 					*op_err = sctp_generate_cause(SCTP_CAUSE_PROTOCOL_VIOLATION, "");
 					return (true);
 				}
 				/* Addresses of a family out of scope are skipped. */
 				if (asoc->scope.ipv6_addr_legal) {
 					v6_param = (struct sctp_ipv6addr_param *)phdr;
 					memcpy((caddr_t)&sin6.sin6_addr, v6_param->addr,
 					    sizeof(v6_param->addr));
 					candidate = (struct sockaddr *)&sin6;
 				}
 				break;
 			}
 #endif
 		default:
 			/* Not an address parameter: nothing to compare. */
 			break;
 		}
 		if (candidate != NULL) {
 			/* Look the listed address up in asoc->nets. */
 			matched = false;
 			TAILQ_FOREACH(net, &asoc->nets, sctp_next) {
 				known = (struct sockaddr *)&net->ro._l_addr;
 				if (known->sa_family != candidate->sa_family) {
 					continue;
 				}
 #ifdef INET
 				if (known->sa_family == AF_INET) {
 					known4 = (struct sockaddr_in *)known;
 					if (known4->sin_addr.s_addr ==
 					    sin4.sin_addr.s_addr) {
 						matched = true;
 						break;
 					}
 				}
 #endif
 #ifdef INET6
 				if (known->sa_family == AF_INET6) {
 					known6 = (struct sockaddr_in6 *)known;
 					if (SCTP6_ARE_ADDR_EQUAL(
 					    known6, &sin6)) {
 						matched = true;
 						break;
 					}
 				}
 #endif
 			}
 			if (!matched) {
 				/*
 				 * A listed address is not a known one.
 				 * As for the source address above, the
 				 * cause uses the diag info code and not
 				 * a new-address cause, so an ABORT looks
 				 * the same as if no listener was present.
 				 */
 				*op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code), "Address added");
 				return (true);
 			}
 		}
 		/* Step over the parameter, rounded up by SCTP_SIZE32(). */
 		offset += SCTP_SIZE32(plen);
 		if (offset >= limit) {
 			break;
 		}
 	}
 	return (false);
 }
 
 /*
  * Given an mbuf chain that was sent to us containing an INIT, build an
  * INIT-ACK with COOKIE and send it back. We assume that init_pkt has been
  * pulled up to include the IPv6/IPv4 header, the SCTP header and the initial
  * part of the INIT message (i.e. the struct sctp_init_msg).
  */
 void
 sctp_send_initiate_ack(struct sctp_inpcb *inp, struct sctp_tcb *stcb,
     struct sctp_nets *src_net, struct mbuf *init_pkt,
     int iphlen, int offset,
     struct sockaddr *src, struct sockaddr *dst,
     struct sctphdr *sh, struct sctp_init_chunk *init_chk,
     uint8_t mflowtype, uint32_t mflowid,
     uint32_t vrf_id, uint16_t port)
 {
 	struct sctp_association *asoc;
 	struct mbuf *m, *m_tmp, *m_last, *m_cookie, *op_err;
 	struct sctp_init_ack_chunk *initack;
 	struct sctp_adaptation_layer_indication *ali;
 	struct sctp_supported_chunk_types_param *pr_supported;
 	struct sctp_paramhdr *ph;
 	union sctp_sockstore *over_addr;
 	struct sctp_scoping scp;
 	struct timeval now;
 #ifdef INET
 	struct sockaddr_in *dst4 = (struct sockaddr_in *)dst;
 	struct sockaddr_in *src4 = (struct sockaddr_in *)src;
 	struct sockaddr_in *sin;
 #endif
 #ifdef INET6
 	struct sockaddr_in6 *dst6 = (struct sockaddr_in6 *)dst;
 	struct sockaddr_in6 *src6 = (struct sockaddr_in6 *)src;
 	struct sockaddr_in6 *sin6;
 #endif
 	struct sockaddr *to;
 	struct sctp_state_cookie stc;
 	struct sctp_nets *net = NULL;
 	uint8_t *signature = NULL;
 	int cnt_inits_to = 0;
 	uint16_t his_limit, i_want;
 	int abort_flag;
 	int nat_friendly = 0;
 	int error;
 	struct socket *so;
 	uint16_t num_ext, chunk_len, padding_len, parameter_len;
 
 	if (stcb) {
 		asoc = &stcb->asoc;
 	} else {
 		asoc = NULL;
 	}
 	if ((asoc != NULL) &&
 	    (SCTP_GET_STATE(stcb) != SCTP_STATE_COOKIE_WAIT)) {
 		if (sctp_are_there_new_addresses(asoc, init_pkt, offset, offset + ntohs(init_chk->ch.chunk_length), src, &op_err)) {
 			/*
 			 * new addresses, out of here in non-cookie-wait
 			 * states
 			 */
 			sctp_send_abort(init_pkt, iphlen, src, dst, sh, 0, op_err,
 			    mflowtype, mflowid, inp->fibnum,
 			    vrf_id, port);
 			return;
 		}
 		if (src_net != NULL && (src_net->port != port)) {
 			/*
 			 * change of remote encapsulation port, out of here
 			 * in non-cookie-wait states
 			 *
 			 * Send an ABORT, without an specific error cause.
 			 * This looks no different than if no listener was
 			 * present.
 			 */
 			op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code),
 			    "Remote encapsulation port changed");
 			sctp_send_abort(init_pkt, iphlen, src, dst, sh, 0, op_err,
 			    mflowtype, mflowid, inp->fibnum,
 			    vrf_id, port);
 			return;
 		}
 	}
 	abort_flag = 0;
 	op_err = sctp_arethere_unrecognized_parameters(init_pkt,
 	    (offset + sizeof(struct sctp_init_chunk)),
 	    &abort_flag,
 	    (struct sctp_chunkhdr *)init_chk,
 	    &nat_friendly, NULL);
 	if (abort_flag) {
 do_a_abort:
 		if (op_err == NULL) {
 			char msg[SCTP_DIAG_INFO_LEN];
 
 			SCTP_SNPRINTF(msg, sizeof(msg), "%s:%d at %s", __FILE__, __LINE__, __func__);
 			op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code),
 			    msg);
 		}
 		sctp_send_abort(init_pkt, iphlen, src, dst, sh,
 		    init_chk->init.initiate_tag, op_err,
 		    mflowtype, mflowid, inp->fibnum,
 		    vrf_id, port);
 		return;
 	}
 	m = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_DATA);
 	if (m == NULL) {
 		/* No memory, INIT timer will re-attempt. */
 		sctp_m_freem(op_err);
 		return;
 	}
 	chunk_len = (uint16_t)sizeof(struct sctp_init_ack_chunk);
 	padding_len = 0;
 
 	/*
 	 * We might not overwrite the identification[] completely and on
 	 * some platforms time_entered will contain some padding. Therefore
 	 * zero out the cookie to avoid putting uninitialized memory on the
 	 * wire.
 	 */
 	memset(&stc, 0, sizeof(struct sctp_state_cookie));
 
 	/* the time I built cookie */
 	(void)SCTP_GETTIME_TIMEVAL(&now);
 	stc.time_entered.tv_sec = now.tv_sec;
 	stc.time_entered.tv_usec = now.tv_usec;
 
 	/* populate any tie tags */
 	if (asoc != NULL) {
 		/* unlock before tag selections */
 		stc.tie_tag_my_vtag = asoc->my_vtag_nonce;
 		stc.tie_tag_peer_vtag = asoc->peer_vtag_nonce;
 		stc.cookie_life = asoc->cookie_life;
 		net = asoc->primary_destination;
 	} else {
 		stc.tie_tag_my_vtag = 0;
 		stc.tie_tag_peer_vtag = 0;
 		/* life I will award this cookie */
 		stc.cookie_life = inp->sctp_ep.def_cookie_life;
 	}
 
 	/* copy in the ports for later check */
 	stc.myport = sh->dest_port;
 	stc.peerport = sh->src_port;
 
 	/*
 	 * If we wanted to honor cookie life extensions, we would add to
 	 * stc.cookie_life. For now we should NOT honor any extension
 	 */
 	stc.site_scope = stc.local_scope = stc.loopback_scope = 0;
 	if (inp->sctp_flags & SCTP_PCB_FLAGS_BOUND_V6) {
 		stc.ipv6_addr_legal = 1;
 		if (SCTP_IPV6_V6ONLY(inp)) {
 			stc.ipv4_addr_legal = 0;
 		} else {
 			stc.ipv4_addr_legal = 1;
 		}
 	} else {
 		stc.ipv6_addr_legal = 0;
 		stc.ipv4_addr_legal = 1;
 	}
 	stc.ipv4_scope = 0;
 	if (net == NULL) {
 		to = src;
 		switch (dst->sa_family) {
 #ifdef INET
 		case AF_INET:
 			{
 				/* lookup address */
 				stc.address[0] = src4->sin_addr.s_addr;
 				stc.address[1] = 0;
 				stc.address[2] = 0;
 				stc.address[3] = 0;
 				stc.addr_type = SCTP_IPV4_ADDRESS;
 				/* local from address */
 				stc.laddress[0] = dst4->sin_addr.s_addr;
 				stc.laddress[1] = 0;
 				stc.laddress[2] = 0;
 				stc.laddress[3] = 0;
 				stc.laddr_type = SCTP_IPV4_ADDRESS;
 				/* scope_id is only for v6 */
 				stc.scope_id = 0;
 				if ((IN4_ISPRIVATE_ADDRESS(&src4->sin_addr)) ||
 				    (IN4_ISPRIVATE_ADDRESS(&dst4->sin_addr))) {
 					stc.ipv4_scope = 1;
 				}
 				/* Must use the address in this case */
 				if (sctp_is_address_on_local_host(src, vrf_id)) {
 					stc.loopback_scope = 1;
 					stc.ipv4_scope = 1;
 					stc.site_scope = 1;
 					stc.local_scope = 0;
 				}
 				break;
 			}
 #endif
 #ifdef INET6
 		case AF_INET6:
 			{
 				stc.addr_type = SCTP_IPV6_ADDRESS;
 				memcpy(&stc.address, &src6->sin6_addr, sizeof(struct in6_addr));
 				stc.scope_id = ntohs(in6_getscope(&src6->sin6_addr));
 				if (sctp_is_address_on_local_host(src, vrf_id)) {
 					stc.loopback_scope = 1;
 					stc.local_scope = 0;
 					stc.site_scope = 1;
 					stc.ipv4_scope = 1;
 				} else if (IN6_IS_ADDR_LINKLOCAL(&src6->sin6_addr) ||
 				    IN6_IS_ADDR_LINKLOCAL(&dst6->sin6_addr)) {
 					/*
 					 * If the new destination or source
 					 * is a LINK_LOCAL we must have
 					 * common both site and local scope.
 					 * Don't set local scope though
 					 * since we must depend on the
 					 * source to be added implicitly. We
 					 * cannot assure just because we
 					 * share one link that all links are
 					 * common.
 					 */
 					stc.local_scope = 0;
 					stc.site_scope = 1;
 					stc.ipv4_scope = 1;
 					/*
 					 * we start counting for the private
 					 * address stuff at 1. since the
 					 * link local we source from won't
 					 * show up in our scoped count.
 					 */
 					cnt_inits_to = 1;
 					/*
 					 * pull out the scope_id from
 					 * incoming pkt
 					 */
 				} else if (IN6_IS_ADDR_SITELOCAL(&src6->sin6_addr) ||
 				    IN6_IS_ADDR_SITELOCAL(&dst6->sin6_addr)) {
 					/*
 					 * If the new destination or source
 					 * is SITE_LOCAL then we must have
 					 * site scope in common.
 					 */
 					stc.site_scope = 1;
 				}
 				memcpy(&stc.laddress, &dst6->sin6_addr, sizeof(struct in6_addr));
 				stc.laddr_type = SCTP_IPV6_ADDRESS;
 				break;
 			}
 #endif
 		default:
 			/* TSNH */
 			goto do_a_abort;
 			break;
 		}
 	} else {
 		/* set the scope per the existing tcb */
 
 #ifdef INET6
 		struct sctp_nets *lnet;
 #endif
 
 		stc.loopback_scope = asoc->scope.loopback_scope;
 		stc.ipv4_scope = asoc->scope.ipv4_local_scope;
 		stc.site_scope = asoc->scope.site_scope;
 		stc.local_scope = asoc->scope.local_scope;
 #ifdef INET6
 		/* Why do we not consider IPv4 LL addresses? */
 		TAILQ_FOREACH(lnet, &asoc->nets, sctp_next) {
 			if (lnet->ro._l_addr.sin6.sin6_family == AF_INET6) {
 				if (IN6_IS_ADDR_LINKLOCAL(&lnet->ro._l_addr.sin6.sin6_addr)) {
 					/*
 					 * if we have a LL address, start
 					 * counting at 1.
 					 */
 					cnt_inits_to = 1;
 				}
 			}
 		}
 #endif
 		/* use the net pointer */
 		to = (struct sockaddr *)&net->ro._l_addr;
 		switch (to->sa_family) {
 #ifdef INET
 		case AF_INET:
 			sin = (struct sockaddr_in *)to;
 			stc.address[0] = sin->sin_addr.s_addr;
 			stc.address[1] = 0;
 			stc.address[2] = 0;
 			stc.address[3] = 0;
 			stc.addr_type = SCTP_IPV4_ADDRESS;
 			if (net->src_addr_selected == 0) {
 				/*
 				 * strange case here, the INIT should have
 				 * did the selection.
 				 */
 				net->ro._s_addr = sctp_source_address_selection(inp,
 				    stcb, (sctp_route_t *)&net->ro,
 				    net, 0, vrf_id);
 				if (net->ro._s_addr == NULL) {
 					sctp_m_freem(op_err);
 					sctp_m_freem(m);
 					return;
 				}
 
 				net->src_addr_selected = 1;
 			}
 			stc.laddress[0] = net->ro._s_addr->address.sin.sin_addr.s_addr;
 			stc.laddress[1] = 0;
 			stc.laddress[2] = 0;
 			stc.laddress[3] = 0;
 			stc.laddr_type = SCTP_IPV4_ADDRESS;
 			/* scope_id is only for v6 */
 			stc.scope_id = 0;
 			break;
 #endif
 #ifdef INET6
 		case AF_INET6:
 			sin6 = (struct sockaddr_in6 *)to;
 			memcpy(&stc.address, &sin6->sin6_addr,
 			    sizeof(struct in6_addr));
 			stc.addr_type = SCTP_IPV6_ADDRESS;
 			stc.scope_id = sin6->sin6_scope_id;
 			if (net->src_addr_selected == 0) {
 				/*
 				 * strange case here, the INIT should have
 				 * done the selection.
 				 */
 				net->ro._s_addr = sctp_source_address_selection(inp,
 				    stcb, (sctp_route_t *)&net->ro,
 				    net, 0, vrf_id);
 				if (net->ro._s_addr == NULL) {
 					sctp_m_freem(op_err);
 					sctp_m_freem(m);
 					return;
 				}
 
 				net->src_addr_selected = 1;
 			}
 			memcpy(&stc.laddress, &net->ro._s_addr->address.sin6.sin6_addr,
 			    sizeof(struct in6_addr));
 			stc.laddr_type = SCTP_IPV6_ADDRESS;
 			break;
 #endif
 		}
 	}
 	if (asoc != NULL) {
 		stc.zero_checksum = asoc->zero_checksum > 0 ? 1 : 0;
 	} else {
 		stc.zero_checksum = inp->zero_checksum;
 	}
 	/* Now lets put the SCTP header in place */
 	initack = mtod(m, struct sctp_init_ack_chunk *);
 	/* Save it off for quick ref */
 	stc.peers_vtag = ntohl(init_chk->init.initiate_tag);
 	/* who are we */
 	memcpy(stc.identification, SCTP_VERSION_STRING,
 	    min(strlen(SCTP_VERSION_STRING), sizeof(stc.identification)));
 	memset(stc.reserved, 0, SCTP_RESERVE_SPACE);
 	/* now the chunk header */
 	initack->ch.chunk_type = SCTP_INITIATION_ACK;
 	initack->ch.chunk_flags = 0;
 	/* fill in later from mbuf we build */
 	initack->ch.chunk_length = 0;
 	/* place in my tag */
 	if ((asoc != NULL) &&
 	    ((SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_WAIT) ||
 	    (SCTP_GET_STATE(stcb) == SCTP_STATE_INUSE) ||
 	    (SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_ECHOED))) {
 		/* re-use the v-tags and init-seq here */
 		initack->init.initiate_tag = htonl(asoc->my_vtag);
 		initack->init.initial_tsn = htonl(asoc->init_seq_number);
 	} else {
 		uint32_t vtag, itsn;
 
 		if (asoc) {
 			atomic_add_int(&asoc->refcnt, 1);
 			SCTP_TCB_UNLOCK(stcb);
 	new_tag:
 			SCTP_INP_INFO_RLOCK();
 			vtag = sctp_select_a_tag(inp, inp->sctp_lport, sh->src_port, 1);
 			SCTP_INP_INFO_RUNLOCK();
 			if ((asoc->peer_supports_nat) && (vtag == asoc->my_vtag)) {
 				/*
 				 * Got a duplicate vtag on some guy behind a
 				 * nat make sure we don't use it.
 				 */
 				goto new_tag;
 			}
 			initack->init.initiate_tag = htonl(vtag);
 			/* get a TSN to use too */
 			itsn = sctp_select_initial_TSN(&inp->sctp_ep);
 			initack->init.initial_tsn = htonl(itsn);
 			SCTP_TCB_LOCK(stcb);
 			atomic_subtract_int(&asoc->refcnt, 1);
 		} else {
 			SCTP_INP_INCR_REF(inp);
 			SCTP_INP_RUNLOCK(inp);
 			SCTP_INP_INFO_RLOCK();
 			vtag = sctp_select_a_tag(inp, inp->sctp_lport, sh->src_port, 1);
 			SCTP_INP_INFO_RUNLOCK();
 			initack->init.initiate_tag = htonl(vtag);
 			/* get a TSN to use too */
 			initack->init.initial_tsn = htonl(sctp_select_initial_TSN(&inp->sctp_ep));
 			SCTP_INP_RLOCK(inp);
 			SCTP_INP_DECR_REF(inp);
 		}
 	}
 	/* save away my tag to */
 	stc.my_vtag = initack->init.initiate_tag;
 
 	/* set up some of the credits. */
 	so = inp->sctp_socket;
 	if (so == NULL) {
 		/* memory problem */
 		sctp_m_freem(op_err);
 		sctp_m_freem(m);
 		return;
 	} else {
 		initack->init.a_rwnd = htonl(max(SCTP_SB_LIMIT_RCV(so), SCTP_MINIMAL_RWND));
 	}
 	/* set what I want */
 	his_limit = ntohs(init_chk->init.num_inbound_streams);
 	/* choose what I want */
 	if (asoc != NULL) {
 		if (asoc->streamoutcnt > asoc->pre_open_streams) {
 			i_want = asoc->streamoutcnt;
 		} else {
 			i_want = asoc->pre_open_streams;
 		}
 	} else {
 		i_want = inp->sctp_ep.pre_open_stream_count;
 	}
 	if (his_limit < i_want) {
 		/* I Want more :< */
 		initack->init.num_outbound_streams = init_chk->init.num_inbound_streams;
 	} else {
 		/* I can have what I want :> */
 		initack->init.num_outbound_streams = htons(i_want);
 	}
 	/* tell him his limit. */
 	initack->init.num_inbound_streams =
 	    htons(inp->sctp_ep.max_open_streams_intome);
 
 	/* adaptation layer indication parameter */
 	if (inp->sctp_ep.adaptation_layer_indicator_provided) {
 		parameter_len = (uint16_t)sizeof(struct sctp_adaptation_layer_indication);
 		ali = (struct sctp_adaptation_layer_indication *)(mtod(m, caddr_t)+chunk_len);
 		ali->ph.param_type = htons(SCTP_ULP_ADAPTATION);
 		ali->ph.param_length = htons(parameter_len);
 		ali->indication = htonl(inp->sctp_ep.adaptation_layer_indicator);
 		chunk_len += parameter_len;
 	}
 
 	/* ECN parameter */
 	if (((asoc != NULL) && (asoc->ecn_supported == 1)) ||
 	    ((asoc == NULL) && (inp->ecn_supported == 1))) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_ECN_CAPABLE);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* PR-SCTP supported parameter */
 	if (((asoc != NULL) && (asoc->prsctp_supported == 1)) ||
 	    ((asoc == NULL) && (inp->prsctp_supported == 1))) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_PRSCTP_SUPPORTED);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* Zero checksum acceptable parameter */
 	if (((asoc != NULL) && (asoc->zero_checksum > 0)) ||
 	    ((asoc == NULL) && (inp->zero_checksum == 1))) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_ZERO_CHECKSUM_ACCEPTABLE);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* Add NAT friendly parameter */
 	if (nat_friendly) {
 		parameter_len = (uint16_t)sizeof(struct sctp_paramhdr);
 		ph = (struct sctp_paramhdr *)(mtod(m, caddr_t)+chunk_len);
 		ph->param_type = htons(SCTP_HAS_NAT_SUPPORT);
 		ph->param_length = htons(parameter_len);
 		chunk_len += parameter_len;
 	}
 
 	/* And now tell the peer which extensions we support */
 	num_ext = 0;
 	pr_supported = (struct sctp_supported_chunk_types_param *)(mtod(m, caddr_t)+chunk_len);
 	if (((asoc != NULL) && (asoc->prsctp_supported == 1)) ||
 	    ((asoc == NULL) && (inp->prsctp_supported == 1))) {
 		pr_supported->chunk_types[num_ext++] = SCTP_FORWARD_CUM_TSN;
 		if (((asoc != NULL) && (asoc->idata_supported == 1)) ||
 		    ((asoc == NULL) && (inp->idata_supported == 1))) {
 			pr_supported->chunk_types[num_ext++] = SCTP_IFORWARD_CUM_TSN;
 		}
 	}
 	if (((asoc != NULL) && (asoc->auth_supported == 1)) ||
 	    ((asoc == NULL) && (inp->auth_supported == 1))) {
 		pr_supported->chunk_types[num_ext++] = SCTP_AUTHENTICATION;
 	}
 	if (((asoc != NULL) && (asoc->asconf_supported == 1)) ||
 	    ((asoc == NULL) && (inp->asconf_supported == 1))) {
 		pr_supported->chunk_types[num_ext++] = SCTP_ASCONF;
 		pr_supported->chunk_types[num_ext++] = SCTP_ASCONF_ACK;
 	}
 	if (((asoc != NULL) && (asoc->reconfig_supported == 1)) ||
 	    ((asoc == NULL) && (inp->reconfig_supported == 1))) {
 		pr_supported->chunk_types[num_ext++] = SCTP_STREAM_RESET;
 	}
 	if (((asoc != NULL) && (asoc->idata_supported == 1)) ||
 	    ((asoc == NULL) && (inp->idata_supported == 1))) {
 		pr_supported->chunk_types[num_ext++] = SCTP_IDATA;
 	}
 	if (((asoc != NULL) && (asoc->nrsack_supported == 1)) ||
 	    ((asoc == NULL) && (inp->nrsack_supported == 1))) {
 		pr_supported->chunk_types[num_ext++] = SCTP_NR_SELECTIVE_ACK;
 	}
 	if (((asoc != NULL) && (asoc->pktdrop_supported == 1)) ||
 	    ((asoc == NULL) && (inp->pktdrop_supported == 1))) {
 		pr_supported->chunk_types[num_ext++] = SCTP_PACKET_DROPPED;
 	}
 	if (num_ext > 0) {
 		parameter_len = (uint16_t)sizeof(struct sctp_supported_chunk_types_param) + num_ext;
 		pr_supported->ph.param_type = htons(SCTP_SUPPORTED_CHUNK_EXT);
 		pr_supported->ph.param_length = htons(parameter_len);
 		padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 		chunk_len += parameter_len;
 	}
 
 	/* add authentication parameters */
 	if (((asoc != NULL) && (asoc->auth_supported == 1)) ||
 	    ((asoc == NULL) && (inp->auth_supported == 1))) {
 		struct sctp_auth_random *randp;
 		struct sctp_auth_hmac_algo *hmacs;
 		struct sctp_auth_chunk_list *chunks;
 
 		if (padding_len > 0) {
 			memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 			chunk_len += padding_len;
 			padding_len = 0;
 		}
 		/* generate and add RANDOM parameter */
 		randp = (struct sctp_auth_random *)(mtod(m, caddr_t)+chunk_len);
 		parameter_len = (uint16_t)sizeof(struct sctp_auth_random) +
 		    SCTP_AUTH_RANDOM_SIZE_DEFAULT;
 		randp->ph.param_type = htons(SCTP_RANDOM);
 		randp->ph.param_length = htons(parameter_len);
 		SCTP_READ_RANDOM(randp->random_data, SCTP_AUTH_RANDOM_SIZE_DEFAULT);
 		padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 		chunk_len += parameter_len;
 
 		if (padding_len > 0) {
 			memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 			chunk_len += padding_len;
 			padding_len = 0;
 		}
 		/* add HMAC_ALGO parameter */
 		hmacs = (struct sctp_auth_hmac_algo *)(mtod(m, caddr_t)+chunk_len);
 		parameter_len = (uint16_t)sizeof(struct sctp_auth_hmac_algo) +
 		    sctp_serialize_hmaclist(inp->sctp_ep.local_hmacs,
 		    (uint8_t *)hmacs->hmac_ids);
 		hmacs->ph.param_type = htons(SCTP_HMAC_LIST);
 		hmacs->ph.param_length = htons(parameter_len);
 		padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 		chunk_len += parameter_len;
 
 		if (padding_len > 0) {
 			memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 			chunk_len += padding_len;
 			padding_len = 0;
 		}
 		/* add CHUNKS parameter */
 		chunks = (struct sctp_auth_chunk_list *)(mtod(m, caddr_t)+chunk_len);
 		parameter_len = (uint16_t)sizeof(struct sctp_auth_chunk_list) +
 		    sctp_serialize_auth_chunks(inp->sctp_ep.local_auth_chunks,
 		    chunks->chunk_types);
 		chunks->ph.param_type = htons(SCTP_CHUNK_LIST);
 		chunks->ph.param_length = htons(parameter_len);
 		padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 		chunk_len += parameter_len;
 	}
 	SCTP_BUF_LEN(m) = chunk_len;
 	m_last = m;
 	/* now the addresses */
 	/*
 	 * To optimize this we could put the scoping stuff into a structure
 	 * and remove the individual uint8's from the stc structure. Then we
 	 * could just pass in the address within the stc.. but for now this
 	 * is a quick hack to get the address stuff teased apart.
 	 */
 	scp.ipv4_addr_legal = stc.ipv4_addr_legal;
 	scp.ipv6_addr_legal = stc.ipv6_addr_legal;
 	scp.loopback_scope = stc.loopback_scope;
 	scp.ipv4_local_scope = stc.ipv4_scope;
 	scp.local_scope = stc.local_scope;
 	scp.site_scope = stc.site_scope;
 	m_last = sctp_add_addresses_to_i_ia(inp, stcb, &scp, m_last,
 	    cnt_inits_to,
 	    &padding_len, &chunk_len);
 	/* padding_len can only be positive, if no addresses have been added */
 	if (padding_len > 0) {
 		memset(mtod(m, caddr_t)+chunk_len, 0, padding_len);
 		chunk_len += padding_len;
 		SCTP_BUF_LEN(m) += padding_len;
 		padding_len = 0;
 	}
 
 	/* tack on the operational error if present */
 	if (op_err) {
 		parameter_len = 0;
 		for (m_tmp = op_err; m_tmp != NULL; m_tmp = SCTP_BUF_NEXT(m_tmp)) {
 			parameter_len += SCTP_BUF_LEN(m_tmp);
 		}
 		padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 		SCTP_BUF_NEXT(m_last) = op_err;
 		while (SCTP_BUF_NEXT(m_last) != NULL) {
 			m_last = SCTP_BUF_NEXT(m_last);
 		}
 		chunk_len += parameter_len;
 	}
 	if (padding_len > 0) {
 		m_last = sctp_add_pad_tombuf(m_last, padding_len);
 		if (m_last == NULL) {
 			/* Houston we have a problem, no space */
 			sctp_m_freem(m);
 			return;
 		}
 		chunk_len += padding_len;
 		padding_len = 0;
 	}
 	/* Now we must build a cookie */
 	m_cookie = sctp_add_cookie(init_pkt, offset, m, 0, &stc, &signature);
 	if (m_cookie == NULL) {
 		/* memory problem */
 		sctp_m_freem(m);
 		return;
 	}
 	/* Now append the cookie to the end and update the space/size */
 	SCTP_BUF_NEXT(m_last) = m_cookie;
 	parameter_len = 0;
 	for (m_tmp = m_cookie; m_tmp != NULL; m_tmp = SCTP_BUF_NEXT(m_tmp)) {
 		parameter_len += SCTP_BUF_LEN(m_tmp);
 		if (SCTP_BUF_NEXT(m_tmp) == NULL) {
 			m_last = m_tmp;
 		}
 	}
 	padding_len = SCTP_SIZE32(parameter_len) - parameter_len;
 	chunk_len += parameter_len;
 
 	/*
 	 * Place in the size, but we don't include the last pad (if any) in
 	 * the INIT-ACK.
 	 */
 	initack->ch.chunk_length = htons(chunk_len);
 
 	/*
 	 * Time to sign the cookie, we don't sign over the cookie signature
 	 * though thus we set trailer.
 	 */
 	(void)sctp_hmac_m(SCTP_HMAC,
 	    (uint8_t *)inp->sctp_ep.secret_key[(int)(inp->sctp_ep.current_secret_number)],
 	    SCTP_SECRET_SIZE, m_cookie, sizeof(struct sctp_paramhdr),
 	    (uint8_t *)signature, SCTP_SIGNATURE_SIZE);
 	/*
 	 * We pass 0 here to NOT set IP_DF if it's IPv4; we ignore the return
 	 * here since the timer will drive a retransmission.
 	 */
 	if (padding_len > 0) {
 		if (sctp_add_pad_tombuf(m_last, padding_len) == NULL) {
 			sctp_m_freem(m);
 			return;
 		}
 	}
 	if (stc.loopback_scope) {
 		over_addr = (union sctp_sockstore *)dst;
 	} else {
 		over_addr = NULL;
 	}
 
 	if ((error = sctp_lowlevel_chunk_output(inp, NULL, NULL, to, m, 0, NULL, 0, 0,
 	    0, 0,
 	    inp->sctp_lport, sh->src_port, init_chk->init.initiate_tag,
 	    port, over_addr,
 	    mflowtype, mflowid,
 	    false,		/* XXXMT: Improve this! */
 	    SCTP_SO_NOT_LOCKED))) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT4, "Gak send error %d\n", error);
 		if (error == ENOBUFS) {
 			if (asoc != NULL) {
 				asoc->ifp_had_enobuf = 1;
 			}
 			SCTP_STAT_INCR(sctps_lowlevelerr);
 		}
 	} else {
 		if (asoc != NULL) {
 			asoc->ifp_had_enobuf = 0;
 		}
 	}
 	SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 }
 
 /*
  * Try to reclaim buffer space by releasing queued chunks that carry the
  * PR-SCTP "buffer" policy flag.
  *
  * Nothing is done unless the association supports PR-SCTP and reports
  * removable chunks on its sent queue.  The sent queue is scanned first,
  * then the send queue.  A chunk is released when it still holds data and
  * the value stored in its timetodrop.tv_sec is greater than
  * srcv->sinfo_timetolive (lower numbers equate to higher priority, so a
  * larger value means the queued chunk matters less than the one being
  * sent).  Scanning stops as soon as at least 'dataout' bytes have been
  * released.
  *
  * The TCB lock must be held by the caller.
  */
 static void
 sctp_prune_prsctp(struct sctp_tcb *stcb,
     struct sctp_association *asoc,
     struct sctp_nonpad_sndrcvinfo *srcv,
     int dataout)
 {
 	struct sctp_tmit_chunk *chk, *nchk;
 	int reclaimed = 0;
 	int got;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	if (!(asoc->prsctp_supported) ||
 	    !(asoc->sent_queue_cnt_removeable > 0)) {
 		/* PR-SCTP is off or nothing is marked removable. */
 		return;
 	}
 
 	/* Pass 1: chunks sitting on the sent queue. */
 	TAILQ_FOREACH(chk, &asoc->sent_queue, sctp_next) {
 		uint8_t sent;
 
 		if (!PR_SCTP_BUF_ENABLED(chk->flags)) {
 			/* Not a buffer-limited PR-SCTP chunk. */
 			continue;
 		}
 		if (!(chk->rec.data.timetodrop.tv_sec > (long)srcv->sinfo_timetolive)) {
 			/* Not of lower priority than the new message. */
 			continue;
 		}
 		if (chk->data == NULL) {
 			/* No mbuf left, so no book_size to give back. */
 			continue;
 		}
 		sent = (chk->sent > SCTP_DATAGRAM_UNSENT) ? 1 : 0;
 		got = sctp_release_pr_sctp_chunk(stcb, chk, sent,
 		    SCTP_SO_LOCKED);
 		reclaimed += got;
 		if (reclaimed >= dataout) {
 			return;
 		}
 	}
 
 	/* Pass 2: chunks still waiting on the send queue (never sent). */
 	TAILQ_FOREACH_SAFE(chk, &asoc->send_queue, sctp_next, nchk) {
 		if (!PR_SCTP_BUF_ENABLED(chk->flags)) {
 			continue;
 		}
 		if (!(chk->rec.data.timetodrop.tv_sec > (long)srcv->sinfo_timetolive)) {
 			continue;
 		}
 		if (chk->data == NULL) {
 			continue;
 		}
 		got = sctp_release_pr_sctp_chunk(stcb, chk, 0,
 		    SCTP_SO_LOCKED);
 		reclaimed += got;
 		if (reclaimed >= dataout) {
 			return;
 		}
 	}
 }
 
 uint32_t
 sctp_get_frag_point(struct sctp_tcb *stcb)
 {
 	struct sctp_association *asoc;
 	uint32_t frag_point, overhead;
 
 	asoc = &stcb->asoc;
 	/* Consider IP header and SCTP common header. */
 	if (stcb->sctp_ep->sctp_flags & SCTP_PCB_FLAGS_BOUND_V6) {
 		overhead = SCTP_MIN_OVERHEAD;
 	} else {
 		overhead = SCTP_MIN_V4_OVERHEAD;
 	}
 	/* Consider DATA/IDATA chunk header and AUTH header, if needed. */
 	if (asoc->idata_supported) {
 		overhead += sizeof(struct sctp_idata_chunk);
 		if (sctp_auth_is_required_chunk(SCTP_IDATA, asoc->peer_auth_chunks)) {
 			overhead += sctp_get_auth_chunk_len(asoc->peer_hmac_id);
 		}
 	} else {
 		overhead += sizeof(struct sctp_data_chunk);
 		if (sctp_auth_is_required_chunk(SCTP_DATA, asoc->peer_auth_chunks)) {
 			overhead += sctp_get_auth_chunk_len(asoc->peer_hmac_id);
 		}
 	}
 	KASSERT(overhead % 4 == 0,
 	    ("overhead (%u) not a multiple of 4", overhead));
 	/* Consider padding. */
 	if (asoc->smallest_mtu % 4 > 0) {
 		overhead += (asoc->smallest_mtu % 4);
 	}
 	KASSERT(asoc->smallest_mtu > overhead,
 	    ("Association MTU (%u) too small for overhead (%u)",
 	    asoc->smallest_mtu, overhead));
 	frag_point = asoc->smallest_mtu - overhead;
 	KASSERT(frag_point % 4 == 0,
 	    ("frag_point (%u) not a multiple of 4", frag_point));
 	/* Honor MAXSEG socket option. */
 	if ((asoc->sctp_frag_point > 0) &&
 	    (asoc->sctp_frag_point < frag_point)) {
 		frag_point = asoc->sctp_frag_point;
 	}
 	return (frag_point);
 }
 
 /*
  * Derive the PR-SCTP policy for a pending message and store the
  * policy-specific value in sp->ts.
  *
  * If the caller's sinfo_flags already select a PR-SCTP policy, it is
  * copied into sp->act_flags.  If no policy is selected but a positive
  * timetolive is given, the TTL policy is assumed.  Otherwise the function
  * returns without touching sp.
  *
  * Meaning of sp->ts afterwards, per policy:
  *   BUF: tv_sec holds timetolive, interpreted as a priority.
  *   TTL: absolute expiry time, i.e. now + timetolive milliseconds.
  *   RTX: tv_sec holds timetolive, interpreted as a retransmission count.
  */
 static void
 sctp_set_prsctp_policy(struct sctp_stream_queue_pending *sp)
 {
 	/*
 	 * We assume that the user wants PR_SCTP_TTL if the user provides a
 	 * positive lifetime but does not specify any PR_SCTP policy.
 	 */
 	if (PR_SCTP_ENABLED(sp->sinfo_flags)) {
 		sp->act_flags |= PR_SCTP_POLICY(sp->sinfo_flags);
 	} else if (sp->timetolive > 0) {
 		sp->sinfo_flags |= SCTP_PR_SCTP_TTL;
 		sp->act_flags |= PR_SCTP_POLICY(sp->sinfo_flags);
 	} else {
 		return;
 	}
 	switch (PR_SCTP_POLICY(sp->sinfo_flags)) {
 	case CHUNK_FLAGS_PR_SCTP_BUF:
 		/*
 		 * Time to live is a priority stored in tv_sec when doing
 		 * the buffer drop thing.
 		 */
 		sp->ts.tv_sec = sp->timetolive;
 		sp->ts.tv_usec = 0;
 		break;
 	case CHUNK_FLAGS_PR_SCTP_TTL:
 		{
 			struct timeval tv;
 
 			(void)SCTP_GETTIME_TIMEVAL(&sp->ts);
 			tv.tv_sec = sp->timetolive / 1000;
 			/*
 			 * Convert the sub-second milliseconds to
 			 * microseconds.  Reduce modulo 1000 before
 			 * multiplying so that a large lifetime cannot
 			 * overflow the intermediate product.
 			 */
 			tv.tv_usec = (sp->timetolive % 1000) * 1000;
 			/*
 			 * TODO sctp_constants.h needs alternative time
 			 * macros when _KERNEL is undefined.
 			 */
 			timevaladd(&sp->ts, &tv);
 		}
 		break;
 	case CHUNK_FLAGS_PR_SCTP_RTX:
 		/*
 		 * Time to live is the number of retransmissions stored in
 		 * tv_sec.
 		 */
 		sp->ts.tv_sec = sp->timetolive;
 		sp->ts.tv_usec = 0;
 		break;
 	default:
 		SCTPDBG(SCTP_DEBUG_USRREQ1,
 		    "Unknown PR_SCTP policy %u.\n",
 		    PR_SCTP_POLICY(sp->sinfo_flags));
 		break;
 	}
 }
 
 static int
 sctp_msg_append(struct sctp_tcb *stcb,
     struct sctp_nets *net,
     struct mbuf *m,
     struct sctp_nonpad_sndrcvinfo *srcv)
 {
 	int error = 0;
 	struct mbuf *at;
 	struct sctp_stream_queue_pending *sp = NULL;
 	struct sctp_stream_out *strm;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 
 	/*
 	 * Given an mbuf chain, put it into the association send queue and
 	 * place it on the wheel
 	 */
 	if (srcv->sinfo_stream >= stcb->asoc.streamoutcnt) {
 		/* Invalid stream number */
 		SCTP_LTRACE_ERR_RET_PKT(m, NULL, stcb, net, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 		error = EINVAL;
 		goto out_now;
 	}
 	if ((stcb->asoc.stream_locked) &&
 	    (stcb->asoc.stream_locked_on != srcv->sinfo_stream)) {
 		SCTP_LTRACE_ERR_RET_PKT(m, NULL, stcb, net, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 		error = EINVAL;
 		goto out_now;
 	}
 	if ((stcb->asoc.strmout[srcv->sinfo_stream].state != SCTP_STREAM_OPEN) &&
 	    (stcb->asoc.strmout[srcv->sinfo_stream].state != SCTP_STREAM_OPENING)) {
 		/*
 		 * Can't queue any data while stream reset is underway.
 		 */
 		if (stcb->asoc.strmout[srcv->sinfo_stream].state > SCTP_STREAM_OPEN) {
 			error = EAGAIN;
 		} else {
 			error = EINVAL;
 		}
 		goto out_now;
 	}
 	/* Now can we send this? */
 	if ((SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_SENT) ||
 	    (SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_ACK_SENT) ||
 	    (SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_RECEIVED) ||
 	    (stcb->asoc.state & SCTP_STATE_SHUTDOWN_PENDING)) {
 		/* got data while shutting down */
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EPIPE);
 		error = EPIPE;
 		goto out_now;
 	}
 	sctp_alloc_a_strmoq(stcb, sp);
 	if (sp == NULL) {
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		error = ENOMEM;
 		goto out_now;
 	}
 	sp->sinfo_flags = srcv->sinfo_flags;
 	sp->timetolive = srcv->sinfo_timetolive;
 	sp->ppid = srcv->sinfo_ppid;
 	sp->context = srcv->sinfo_context;
 	sp->fsn = 0;
 	if (sp->sinfo_flags & SCTP_ADDR_OVER) {
 		sp->net = net;
 		atomic_add_int(&sp->net->ref_count, 1);
 	} else {
 		sp->net = NULL;
 	}
 	(void)SCTP_GETTIME_TIMEVAL(&sp->ts);
 	sp->sid = srcv->sinfo_stream;
 	sp->msg_is_complete = 1;
 	sp->sender_all_done = 1;
 	sp->some_taken = 0;
 	sp->data = m;
 	sp->tail_mbuf = NULL;
 	sctp_set_prsctp_policy(sp);
 	/*
 	 * We could in theory (for sendall) sifa the length in, but we would
 	 * still have to hunt through the chain since we need to setup the
 	 * tail_mbuf
 	 */
 	sp->length = 0;
 	for (at = m; at; at = SCTP_BUF_NEXT(at)) {
 		if (SCTP_BUF_NEXT(at) == NULL)
 			sp->tail_mbuf = at;
 		sp->length += SCTP_BUF_LEN(at);
 	}
 	if (srcv->sinfo_keynumber_valid) {
 		sp->auth_keyid = srcv->sinfo_keynumber;
 	} else {
 		sp->auth_keyid = stcb->asoc.authinfo.active_keyid;
 	}
 	if (sctp_auth_is_required_chunk(SCTP_DATA, stcb->asoc.peer_auth_chunks)) {
 		sctp_auth_key_acquire(stcb, sp->auth_keyid);
 		sp->holds_key_ref = 1;
 	}
 	strm = &stcb->asoc.strmout[srcv->sinfo_stream];
 	sctp_snd_sb_alloc(stcb, sp->length);
 	atomic_add_int(&stcb->asoc.stream_queue_cnt, 1);
 	TAILQ_INSERT_TAIL(&strm->outqueue, sp, next);
 	stcb->asoc.ss_functions.sctp_ss_add_to_stream(stcb, &stcb->asoc, strm, sp);
 	m = NULL;
 out_now:
 	if (m) {
 		sctp_m_freem(m);
 	}
 	return (error);
 }
 
 /*
  * Append the data of 'clonechain' to 'outchain' and return the head of
  * the resulting chain, or NULL on failure (in which case 'outchain', if
  * any, has been freed).
  *
  *   clonechain     source mbuf chain
  *   outchain       chain to append to; may be NULL
  *   endofchain     in/out: last mbuf of 'outchain'; updated to the new
  *                  last mbuf.  Must not be NULL itself.
  *   can_take_mbuf  non-zero: link 'clonechain' itself onto the output
  *                  instead of copying it
  *   sizeofcpy      number of bytes to copy on the byte-copy path
  *   copy_by_ref    non-zero: never use the byte-copy path
  *
  * Three strategies are used:
  *   1. can_take_mbuf: 'clonechain' is appended as is.
  *   2. !copy_by_ref and sizeofcpy within the sctp_mbuf_threshold_count
  *      limit: the bytes are copied with m_copydata() into the trailing
  *      space of *endofchain, adding one more mbuf if they do not fit.
  *   3. otherwise: the chain is duplicated with SCTP_M_COPYM() and the
  *      duplicate is appended.
  */
 static struct mbuf *
 sctp_copy_mbufchain(struct mbuf *clonechain,
     struct mbuf *outchain,
     struct mbuf **endofchain,
     int can_take_mbuf,
     int sizeofcpy,
     uint8_t copy_by_ref)
 {
 	struct mbuf *m;
 	struct mbuf *appendchain;
 	caddr_t cp;
 	int len;
 
 	if (endofchain == NULL) {
 		/* error */
 		/* Shared failure exit: also reached by goto from below. */
 error_out:
 		if (outchain)
 			sctp_m_freem(outchain);
 		return (NULL);
 	}
 	if (can_take_mbuf) {
 		/* Strategy 1: take ownership of the caller's chain. */
 		appendchain = clonechain;
 	} else {
 		if (!copy_by_ref &&
 		    (sizeofcpy <= (int)((((SCTP_BASE_SYSCTL(sctp_mbuf_threshold_count) - 1) * MLEN) + MHLEN)))) {
 			/* Strategy 2: small message, copy the bytes. */
 			/* Its not in a cluster */
 			if (*endofchain == NULL) {
 				/* lets get a mbuf cluster */
 				if (outchain == NULL) {
 					/* This is the general case */
 			new_mbuf:
 					outchain = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_HEADER);
 					if (outchain == NULL) {
 						goto error_out;
 					}
 					SCTP_BUF_LEN(outchain) = 0;
 					*endofchain = outchain;
 					/* get the prepend space */
 					SCTP_BUF_RESV_UF(outchain, (SCTP_FIRST_MBUF_RESV + 4));
 				} else {
 					/*
 					 * We really should not get a NULL
 					 * in endofchain
 					 */
 					/* find end */
 					m = outchain;
 					while (m) {
 						if (SCTP_BUF_NEXT(m) == NULL) {
 							*endofchain = m;
 							break;
 						}
 						m = SCTP_BUF_NEXT(m);
 					}
 					/* sanity */
 					if (*endofchain == NULL) {
 						/*
 						 * huh, TSNH XXX maybe we
 						 * should panic
 						 */
 						sctp_m_freem(outchain);
 						goto new_mbuf;
 					}
 				}
 				/* get the new end of length */
 				len = (int)M_TRAILINGSPACE(*endofchain);
 			} else {
 				/* how much is left at the end? */
 				len = (int)M_TRAILINGSPACE(*endofchain);
 			}
 			/* Find the end of the data, for appending */
 			cp = (mtod((*endofchain), caddr_t)+SCTP_BUF_LEN((*endofchain)));
 
 			/* Now lets copy it out */
 			if (len >= sizeofcpy) {
 				/* It all fits, copy it in */
 				m_copydata(clonechain, 0, sizeofcpy, cp);
 				SCTP_BUF_LEN((*endofchain)) += sizeofcpy;
 			} else {
 				/* fill up the end of the chain */
 				if (len > 0) {
 					m_copydata(clonechain, 0, len, cp);
 					SCTP_BUF_LEN((*endofchain)) += len;
 					/* now we need another one */
 					sizeofcpy -= len;
 				}
 				/*
 				 * NOTE(review): the remainder is copied into
 				 * a single new mbuf without checking its
 				 * trailing space; presumably the threshold
 				 * test above keeps it small enough - confirm.
 				 */
 				m = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_HEADER);
 				if (m == NULL) {
 					/* We failed */
 					goto error_out;
 				}
 				SCTP_BUF_NEXT((*endofchain)) = m;
 				*endofchain = m;
 				cp = mtod((*endofchain), caddr_t);
 				m_copydata(clonechain, len, sizeofcpy, cp);
 				SCTP_BUF_LEN((*endofchain)) += sizeofcpy;
 			}
 			return (outchain);
 		} else {
 			/* Strategy 3: duplicate the whole chain. */
 			/* copy the old fashion way */
 			appendchain = SCTP_M_COPYM(clonechain, 0, M_COPYALL, M_NOWAIT);
 #ifdef SCTP_MBUF_LOGGING
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 				sctp_log_mbc(appendchain, SCTP_MBUF_ICOPY);
 			}
 #endif
 		}
 	}
 	if (appendchain == NULL) {
 		/* error */
 		if (outchain)
 			sctp_m_freem(outchain);
 		return (NULL);
 	}
 	if (outchain) {
 		/* tack on to the end */
 		if (*endofchain != NULL) {
 			SCTP_BUF_NEXT(((*endofchain))) = appendchain;
 		} else {
 			/* No tail hint given: walk to the last mbuf. */
 			m = outchain;
 			while (m) {
 				if (SCTP_BUF_NEXT(m) == NULL) {
 					SCTP_BUF_NEXT(m) = appendchain;
 					break;
 				}
 				m = SCTP_BUF_NEXT(m);
 			}
 		}
 		/*
 		 * save off the end and update the end-chain position
 		 */
 		m = appendchain;
 		while (m) {
 			if (SCTP_BUF_NEXT(m) == NULL) {
 				*endofchain = m;
 				break;
 			}
 			m = SCTP_BUF_NEXT(m);
 		}
 		return (outchain);
 	} else {
 		/* No output chain yet: the appended chain becomes the head. */
 		/* save off the end and update the end-chain position */
 		m = appendchain;
 		while (m) {
 			if (SCTP_BUF_NEXT(m) == NULL) {
 				*endofchain = m;
 				break;
 			}
 			m = SCTP_BUF_NEXT(m);
 		}
 		return (appendchain);
 	}
 }
 
 /*
  * Forward declaration: sctp_sendall_iterator() below calls this function
  * before its definition appears.
  */
 static int
 sctp_med_chunk_output(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     struct sctp_association *asoc,
     int *num_out,
     int *reason_code,
     int control_only, int from_where,
     struct timeval *now, int *now_filled,
     uint32_t frag_point, int so_locked);
 
 /*
  * Per-association callback for SCTP_SENDALL; sctp_sendall() registers it
  * with sctp_initiate_iterator().
  *
  *   inp   endpoint being iterated; must match ca->inp
  *   stcb  association to act on (TCB lock held)
  *   ptr   the shared struct sctp_copy_all describing the send
  *   val   unused
  *
  * For each association a private copy of the message (ca->m) is made.
  * Then, depending on ca->sndrcv.sinfo_flags:
  *   SCTP_ABORT  the association is aborted, with the copy (prefixed by a
  *               user-initiated-abort cause header) as the reason
  *   otherwise   the copy is queued with sctp_msg_append(); if SCTP_EOF is
  *               also set, a shutdown is started or marked pending
  * Finally output is triggered unless it is suppressed, and
  * ca->cnt_sent or ca->cnt_failed is incremented.
  */
 static void
 sctp_sendall_iterator(struct sctp_inpcb *inp, struct sctp_tcb *stcb, void *ptr,
     uint32_t val SCTP_UNUSED)
 {
 	struct sctp_copy_all *ca;
 	struct mbuf *m;
 	int ret = 0;
 	int added_control = 0;
 	int un_sent, do_chunk_output = 1;
 	struct sctp_association *asoc;
 	struct sctp_nets *net;
 
 	ca = (struct sctp_copy_all *)ptr;
 	if (ca->m == NULL) {
 		return;
 	}
 	if (ca->inp != inp) {
 		/* TSNH */
 		return;
 	}
 	if (ca->sndlen > 0) {
 		/* Each association gets its own copy of the user data. */
 		m = SCTP_M_COPYM(ca->m, 0, M_COPYALL, M_NOWAIT);
 		if (m == NULL) {
 			/* can't copy so we are done */
 			ca->cnt_failed++;
 			return;
 		}
 #ifdef SCTP_MBUF_LOGGING
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 			sctp_log_mbc(m, SCTP_MBUF_ICOPY);
 		}
 #endif
 	} else {
 		m = NULL;
 	}
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	if (stcb->asoc.alternate) {
 		net = stcb->asoc.alternate;
 	} else {
 		net = stcb->asoc.primary_destination;
 	}
 	if (ca->sndrcv.sinfo_flags & SCTP_ABORT) {
 		/* Abort this assoc with m as the user defined reason */
 		if (m != NULL) {
 			SCTP_BUF_PREPEND(m, sizeof(struct sctp_paramhdr), M_NOWAIT);
 		} else {
 			m = sctp_get_mbuf_for_msg(sizeof(struct sctp_paramhdr),
 			    0, M_NOWAIT, 1, MT_DATA);
 			/*
 			 * The M_NOWAIT allocation may fail; only set the
 			 * length when an mbuf was actually obtained.
 			 */
 			if (m != NULL) {
 				SCTP_BUF_LEN(m) = sizeof(struct sctp_paramhdr);
 			}
 		}
 		/* m is NULL here if the prepend or the allocation failed. */
 		if (m != NULL) {
 			struct sctp_paramhdr *ph;
 
 			ph = mtod(m, struct sctp_paramhdr *);
 			ph->param_type = htons(SCTP_CAUSE_USER_INITIATED_ABT);
 			ph->param_length = htons((uint16_t)(sizeof(struct sctp_paramhdr) + ca->sndlen));
 		}
 		/*
 		 * We add one here to keep the assoc from dis-appearing on
 		 * us.
 		 */
 		atomic_add_int(&stcb->asoc.refcnt, 1);
 		sctp_abort_an_association(inp, stcb, m, false, SCTP_SO_NOT_LOCKED);
 		/*
 		 * sctp_abort_an_association calls sctp_free_asoc() free
 		 * association will NOT free it since we incremented the
 		 * refcnt .. we do this to prevent it being freed and things
 		 * getting tricky since we could end up (from free_asoc)
 		 * calling inpcb_free which would get a recursive lock call
 		 * to the iterator lock.. But as a consequence of that the
 		 * stcb will return to us un-locked.. since free_asoc
 		 * returns with either no TCB or the TCB unlocked, we must
 		 * relock.. to unlock in the iterator timer :-0
 		 */
 		SCTP_TCB_LOCK(stcb);
 		atomic_subtract_int(&stcb->asoc.refcnt, 1);
 		goto no_chunk_output;
 	} else {
 		if (m != NULL) {
 			ret = sctp_msg_append(stcb, net, m, &ca->sndrcv);
 		}
 		asoc = &stcb->asoc;
 		if (ca->sndrcv.sinfo_flags & SCTP_EOF) {
 			/* shutdown this assoc */
 			if (TAILQ_EMPTY(&asoc->send_queue) &&
 			    TAILQ_EMPTY(&asoc->sent_queue) &&
 			    sctp_is_there_unsent_data(stcb, SCTP_SO_NOT_LOCKED) == 0) {
 				if ((*asoc->ss_functions.sctp_ss_is_user_msgs_incomplete) (stcb, asoc)) {
 					goto abort_anyway;
 				}
 				/*
 				 * there is nothing queued to send, so I'm
 				 * done...
 				 */
 				if ((SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_SENT) &&
 				    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_RECEIVED) &&
 				    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_ACK_SENT)) {
 					/*
 					 * only send SHUTDOWN the first time
 					 * through
 					 */
 					if (SCTP_GET_STATE(stcb) == SCTP_STATE_OPEN) {
 						SCTP_STAT_DECR_GAUGE32(sctps_currestab);
 					}
 					SCTP_SET_STATE(stcb, SCTP_STATE_SHUTDOWN_SENT);
 					sctp_stop_timers_for_shutdown(stcb);
 					sctp_send_shutdown(stcb, net);
 					sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWN, stcb->sctp_ep, stcb,
 					    net);
 					sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWNGUARD, stcb->sctp_ep, stcb,
 					    NULL);
 					added_control = 1;
 					do_chunk_output = 0;
 				}
 			} else {
 				/*
 				 * we still got (or just got) data to send,
 				 * so set SHUTDOWN_PENDING
 				 */
 				/*
 				 * XXX sockets draft says that SCTP_EOF
 				 * should be sent with no data.  currently,
 				 * we will allow user data to be sent first
 				 * and move to SHUTDOWN-PENDING
 				 */
 				if ((SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_SENT) &&
 				    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_RECEIVED) &&
 				    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_ACK_SENT)) {
 					if ((*asoc->ss_functions.sctp_ss_is_user_msgs_incomplete) (stcb, asoc)) {
 						SCTP_ADD_SUBSTATE(stcb, SCTP_STATE_PARTIAL_MSG_LEFT);
 					}
 					SCTP_ADD_SUBSTATE(stcb, SCTP_STATE_SHUTDOWN_PENDING);
 					if (TAILQ_EMPTY(&asoc->send_queue) &&
 					    TAILQ_EMPTY(&asoc->sent_queue) &&
 					    (asoc->state & SCTP_STATE_PARTIAL_MSG_LEFT)) {
 						struct mbuf *op_err;
 						char msg[SCTP_DIAG_INFO_LEN];
 
 				abort_anyway:
 						SCTP_SNPRINTF(msg, sizeof(msg),
 						    "%s:%d at %s", __FILE__, __LINE__, __func__);
 						op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code),
 						    msg);
 						atomic_add_int(&stcb->asoc.refcnt, 1);
 						sctp_abort_an_association(stcb->sctp_ep, stcb,
 						    op_err, false, SCTP_SO_NOT_LOCKED);
 						atomic_subtract_int(&stcb->asoc.refcnt, 1);
 						goto no_chunk_output;
 					}
 				}
 			}
 		}
 	}
 	/* Estimate how much is queued but not yet in flight. */
 	un_sent = ((stcb->asoc.total_output_queue_size - stcb->asoc.total_flight) +
 	    (stcb->asoc.stream_queue_cnt * SCTP_DATA_CHUNK_OVERHEAD(stcb)));
 
 	/*
 	 * With NODELAY off, data in flight and less than a full packet
 	 * pending, hold the data back instead of sending a small packet.
 	 */
 	if ((sctp_is_feature_off(inp, SCTP_PCB_FLAGS_NODELAY)) &&
 	    (stcb->asoc.total_flight > 0) &&
 	    (un_sent < (int)(stcb->asoc.smallest_mtu - SCTP_MIN_OVERHEAD))) {
 		do_chunk_output = 0;
 	}
 	if (do_chunk_output)
 		sctp_chunk_output(inp, stcb, SCTP_OUTPUT_FROM_USR_SEND, SCTP_SO_NOT_LOCKED);
 	else if (added_control) {
 		/* Only control chunks (the SHUTDOWN) need to go out. */
 		struct timeval now;
 		int num_out, reason, now_filled = 0;
 
 		(void)sctp_med_chunk_output(inp, stcb, &stcb->asoc, &num_out,
 		    &reason, 1, 1, &now, &now_filled,
 		    sctp_get_frag_point(stcb),
 		    SCTP_SO_NOT_LOCKED);
 	}
 no_chunk_output:
 	if (ret) {
 		ca->cnt_failed++;
 	} else {
 		ca->cnt_sent++;
 	}
 }
 
 /*
  * Completion callback for the SCTP_SENDALL iterator.
  *
  * Clears SCTP_PCB_FLAGS_SND_ITERATOR_UP on the endpoint so that another
  * send-all may start, then frees the shared message and the
  * struct sctp_copy_all itself.
  *
  *   ptr  the struct sctp_copy_all created by sctp_sendall()
  *   val  unused
  *
  * No failure notification is raised here: the only failures are memory
  * related, and if no mbuf could be had for the data, none could be had
  * for a notification either.
  */
 static void
 sctp_sendall_completes(void *ptr, uint32_t val SCTP_UNUSED)
 {
 	struct sctp_copy_all *ca = (struct sctp_copy_all *)ptr;
 	struct sctp_inpcb *inp = ca->inp;
 
 	if (inp != NULL) {
 		/* Lets clear the flag to allow others to run. */
 		SCTP_INP_WLOCK(inp);
 		inp->sctp_flags &= ~SCTP_PCB_FLAGS_SND_ITERATOR_UP;
 		SCTP_INP_WUNLOCK(inp);
 	}
 
 	/* now free everything */
 	sctp_m_freem(ca->m);
 	SCTP_FREE(ca, SCTP_M_COPYAL);
 }
 
 /*
  * Copy 'len' bytes from 'uio' into a newly allocated mbuf chain.
  *
  * Returns the head of the chain, or NULL if an mbuf could not be
  * allocated or uiomove() reported an error.  On failure every mbuf
  * allocated so far is freed.
  */
 static struct mbuf *
 sctp_copy_out_all(struct uio *uio, ssize_t len)
 {
 	struct mbuf *ret, *at;
 	ssize_t left, willcpy, cancpy, error;
 
 	ret = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_WAITOK, 1, MT_DATA);
 	if (ret == NULL) {
 		/* TSNH */
 		return (NULL);
 	}
 	left = len;
 	SCTP_BUF_LEN(ret) = 0;
 	/* Fill each mbuf up to its trailing space, or to what is left. */
 	cancpy = (int)M_TRAILINGSPACE(ret);
 	willcpy = min(cancpy, left);
 	at = ret;
 	while (left > 0) {
 		error = uiomove(mtod(at, caddr_t), (int)willcpy, uio);
 		if (error) {
 			goto err_out_now;
 		}
 		SCTP_BUF_LEN(at) = (int)willcpy;
 		SCTP_BUF_NEXT_PKT(at) = SCTP_BUF_NEXT(at) = 0;
 		left -= willcpy;
 		if (left > 0) {
 			/* More to copy: chain another mbuf and continue. */
 			SCTP_BUF_NEXT(at) = sctp_get_mbuf_for_msg((unsigned int)left, 0, M_WAITOK, 1, MT_DATA);
 			if (SCTP_BUF_NEXT(at) == NULL) {
 				goto err_out_now;
 			}
 			at = SCTP_BUF_NEXT(at);
 			SCTP_BUF_LEN(at) = 0;
 			cancpy = (int)M_TRAILINGSPACE(at);
 			willcpy = min(cancpy, left);
 		}
 	}
 	return (ret);
 
 err_out_now:
 	/*
 	 * Free from the head of the chain.  Freeing only the current mbuf
 	 * would leak every mbuf before it and leave the previous one
 	 * pointing at freed memory.
 	 */
 	sctp_m_freem(ret);
 	return (NULL);
 }
 
 /*
  * Start an SCTP_SENDALL operation: send one message to every association
  * of the endpoint by running sctp_sendall_iterator() over them.
  *
  *   inp   endpoint whose associations receive the message
  *   uio   user data to send; may be NULL
  *   m     mbuf chain supplied by the caller; may be NULL
  *   srcv  send parameters; copied if not NULL (SCTP_SENDALL is cleared
  *         in the copy)
  *
  * Returns 0 once the iterator has been started, or:
  *   EMSGSIZE  the uio holds more than the sctp_sendall_limit sysctl
  *   ENOMEM    the bookkeeping structure or the data copy failed
  *   EBUSY     another send-all is already running on this endpoint
  *   EFAULT    the iterator could not be started
  *
  * Only one send-all may run per endpoint at a time; this is enforced
  * with SCTP_PCB_FLAGS_SND_ITERATOR_UP, which sctp_sendall_completes()
  * clears again.
  */
 static int
 sctp_sendall(struct sctp_inpcb *inp, struct uio *uio, struct mbuf *m,
     struct sctp_nonpad_sndrcvinfo *srcv)
 {
 	int ret;
 	struct sctp_copy_all *ca;
 
 	/*
 	 * The uio may be NULL (it is tested again further down), so only
 	 * look at its residual count when it exists.
 	 */
 	if ((uio != NULL) &&
 	    (uio->uio_resid > (ssize_t)SCTP_BASE_SYSCTL(sctp_sendall_limit))) {
 		/* You must not be larger than the limit! */
 		return (EMSGSIZE);
 	}
 	SCTP_MALLOC(ca, struct sctp_copy_all *, sizeof(struct sctp_copy_all),
 	    SCTP_M_COPYAL);
 	if (ca == NULL) {
 		sctp_m_freem(m);
 		SCTP_LTRACE_ERR_RET(inp, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return (ENOMEM);
 	}
 	memset(ca, 0, sizeof(struct sctp_copy_all));
 
 	ca->inp = inp;
 	if (srcv != NULL) {
 		memcpy(&ca->sndrcv, srcv, sizeof(struct sctp_nonpad_sndrcvinfo));
 	}
 
 	/* Serialize. */
 	SCTP_INP_WLOCK(inp);
 	if ((inp->sctp_flags & SCTP_PCB_FLAGS_SND_ITERATOR_UP) != 0) {
 		SCTP_INP_WUNLOCK(inp);
 		sctp_m_freem(m);
 		SCTP_FREE(ca, SCTP_M_COPYAL);
 		return (EBUSY);
 	}
 	inp->sctp_flags |= SCTP_PCB_FLAGS_SND_ITERATOR_UP;
 	SCTP_INP_WUNLOCK(inp);
 
 	/*
 	 * take off the sendall flag, it would be bad if we failed to do
 	 * this :-0
 	 */
 	ca->sndrcv.sinfo_flags &= ~SCTP_SENDALL;
 	/* get length and mbuf chain */
 	if (uio) {
 		ca->sndlen = uio->uio_resid;
 		ca->m = sctp_copy_out_all(uio, ca->sndlen);
 		if (ca->m == NULL) {
 			SCTP_FREE(ca, SCTP_M_COPYAL);
 			sctp_m_freem(m);
 			SCTP_INP_WLOCK(inp);
 			inp->sctp_flags &= ~SCTP_PCB_FLAGS_SND_ITERATOR_UP;
 			SCTP_INP_WUNLOCK(inp);
 			SCTP_LTRACE_ERR_RET(inp, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 			return (ENOMEM);
 		}
 	} else {
 		/* Gather the length of the send */
 		struct mbuf *mat;
 
 		/*
 		 * NOTE(review): only the length is taken from 'm' here;
 		 * ca->m stays NULL, so sctp_sendall_iterator() returns
 		 * without sending anything.  Confirm whether 'm' should be
 		 * attached to ca->m on this path.
 		 */
 		ca->sndlen = 0;
 		for (mat = m; mat; mat = SCTP_BUF_NEXT(mat)) {
 			ca->sndlen += SCTP_BUF_LEN(mat);
 		}
 	}
 	ret = sctp_initiate_iterator(NULL, sctp_sendall_iterator, NULL,
 	    SCTP_PCB_ANY_FLAGS, SCTP_PCB_ANY_FEATURES,
 	    SCTP_ASOC_ANY_STATE,
 	    (void *)ca, 0,
 	    sctp_sendall_completes, inp, 1);
 	if (ret) {
 		SCTP_INP_WLOCK(inp);
 		inp->sctp_flags &= ~SCTP_PCB_FLAGS_SND_ITERATOR_UP;
 		SCTP_INP_WUNLOCK(inp);
 		/*
 		 * The iterator never started, so the completion callback
 		 * will not run; release the copied data here or it leaks.
 		 */
 		sctp_m_freem(ca->m);
 		SCTP_FREE(ca, SCTP_M_COPYAL);
 		SCTP_LTRACE_ERR_RET_PKT(m, inp, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, EFAULT);
 		return (EFAULT);
 	}
 	return (0);
 }
 
 /*
  * Remove every COOKIE-ECHO chunk from the association's control send
  * queue, freeing the chunk and any data attached to it.
  */
 void
 sctp_toss_old_cookies(struct sctp_tcb *stcb, struct sctp_association *asoc)
 {
 	struct sctp_tmit_chunk *cur, *next;
 
 	TAILQ_FOREACH_SAFE(cur, &asoc->control_send_queue, sctp_next, next) {
 		if (cur->rec.chunk_id.id != SCTP_COOKIE_ECHO) {
 			/* Leave all other control chunks queued. */
 			continue;
 		}
 		TAILQ_REMOVE(&asoc->control_send_queue, cur, sctp_next);
 		asoc->ctrl_queue_cnt--;
 		if (cur->data != NULL) {
 			sctp_m_freem(cur->data);
 			cur->data = NULL;
 		}
 		sctp_free_a_chunk(stcb, cur, SCTP_SO_NOT_LOCKED);
 	}
 }
 
 /*
  * Drop ASCONF chunks from the association's ASCONF send queue, starting
  * at the head and stopping at the first chunk whose serial number is
  * greater than asoc->asconf_seq_out_acked (i.e. not acknowledged yet).
  * An ASCONF chunk without data is removed without a serial check.
  */
 void
 sctp_toss_old_asconf(struct sctp_tcb *stcb)
 {
 	struct sctp_association *asoc = &stcb->asoc;
 	struct sctp_tmit_chunk *cur, *next;
 	struct sctp_asconf_chunk *hdr;
 
 	TAILQ_FOREACH_SAFE(cur, &asoc->asconf_send_queue, sctp_next, next) {
 		if (cur->rec.chunk_id.id != SCTP_ASCONF) {
 			/* Only SCTP_ASCONF chunks are of interest. */
 			continue;
 		}
 		if (cur->data != NULL) {
 			hdr = mtod(cur->data, struct sctp_asconf_chunk *);
 			if (SCTP_TSN_GT(ntohl(hdr->serial_number), asoc->asconf_seq_out_acked)) {
 				/* Not Acked yet */
 				break;
 			}
 		}
 		TAILQ_REMOVE(&asoc->asconf_send_queue, cur, sctp_next);
 		asoc->ctrl_queue_cnt--;
 		if (cur->data != NULL) {
 			sctp_m_freem(cur->data);
 			cur->data = NULL;
 		}
 		sctp_free_a_chunk(stcb, cur, SCTP_SO_NOT_LOCKED);
 	}
 }
 
 /*
  * Move the first 'bundle_at' chunks of 'data_list' from the send queue to
  * the sent queue after they have been transmitted to 'net'.
  *
  * For each chunk this records the send time and congestion window, binds
  * the chunk to 'net' if it has no destination yet, inserts it into the
  * sent queue in TSN order, marks it SCTP_DATAGRAM_SENT, and updates the
  * flight-size and peer receive-window accounting.  Afterwards the
  * congestion control module's "packet transmitted" hook is called, if
  * one is set.
  */
 static void
 sctp_clean_up_datalist(struct sctp_tcb *stcb,
     struct sctp_association *asoc,
     struct sctp_tmit_chunk **data_list,
     int bundle_at,
     struct sctp_nets *net)
 {
 	struct sctp_tmit_chunk *chk, *pos, *prev;
 	int idx;
 
 	for (idx = 0; idx < bundle_at; idx++) {
 		chk = data_list[idx];
 
 		/* off of the send queue */
 		TAILQ_REMOVE(&asoc->send_queue, chk, sctp_next);
 		asoc->send_queue_cnt--;
 		if (idx > 0) {
 			/*
 			 * Only chunk 0 may keep its RTT measurement
 			 * request; it is cleared on all the others.
 			 */
 			chk->do_rtt = 0;
 		}
 		/* record time */
 		chk->sent_rcv_time = net->last_sent_time;
 		chk->rec.data.cwnd_at_send = net->cwnd;
 		chk->rec.data.fast_retran_tsn = chk->rec.data.tsn;
 		if (chk->whoTo == NULL) {
 			chk->whoTo = net;
 			atomic_add_int(&net->ref_count, 1);
 		}
 
 		/* on to the sent queue, keeping it ordered by TSN */
 		pos = TAILQ_LAST(&asoc->sent_queue, sctpchunk_listhead);
 		if ((pos == NULL) ||
 		    !SCTP_TSN_GT(pos->rec.data.tsn, chk->rec.data.tsn)) {
 			/* Common case: the new chunk belongs at the tail. */
 			TAILQ_INSERT_TAIL(&asoc->sent_queue, chk, sctp_next);
 		} else {
 			/* Walk backwards to find the insertion point. */
 			for (;;) {
 				prev = TAILQ_PREV(pos, sctpchunk_listhead, sctp_next);
 				if (prev == NULL) {
 					/* Reached the head: goes first. */
 					TAILQ_INSERT_BEFORE(pos, chk, sctp_next);
 					break;
 				}
 				pos = prev;
 				if (!SCTP_TSN_GT(pos->rec.data.tsn, chk->rec.data.tsn)) {
 					TAILQ_INSERT_AFTER(&asoc->sent_queue, pos, chk, sctp_next);
 					break;
 				}
 			}
 		}
 
 		/* This does not lower until the cum-ack passes it */
 		asoc->sent_queue_cnt++;
 		if ((asoc->peers_rwnd <= 0) &&
 		    (asoc->total_flight == 0) &&
 		    (bundle_at == 1)) {
 			/* Mark the chunk as being a window probe */
 			SCTP_STAT_INCR(sctps_windowprobed);
 		}
 #ifdef SCTP_AUDITING_ENABLED
 		sctp_audit_log(0xC2, 3);
 #endif
 		chk->sent = SCTP_DATAGRAM_SENT;
 		chk->snd_count = 1;
 		chk->rec.data.chunk_was_revoked = 0;
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FLIGHT_LOGGING_ENABLE) {
 			sctp_misc_ints(SCTP_FLIGHT_LOG_UP,
 			    chk->whoTo->flight_size,
 			    chk->book_size,
 			    (uint32_t)(uintptr_t)chk->whoTo,
 			    chk->rec.data.tsn);
 		}
 		sctp_flight_size_increase(chk);
 		sctp_total_flight_increase(stcb, chk);
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_RWND_ENABLE) {
 			sctp_log_rwnd(SCTP_DECREASE_PEER_RWND,
 			    asoc->peers_rwnd, chk->send_size, SCTP_BASE_SYSCTL(sctp_peer_chunk_oh));
 		}
 		/* Charge the chunk plus per-chunk overhead to the peer. */
 		asoc->peers_rwnd = sctp_sbspace_sub(asoc->peers_rwnd,
 		    (uint32_t)(chk->send_size + SCTP_BASE_SYSCTL(sctp_peer_chunk_oh)));
 		if (asoc->peers_rwnd < stcb->sctp_ep->sctp_ep.sctp_sws_sender) {
 			/* SWS sender side engages */
 			asoc->peers_rwnd = 0;
 		}
 	}
 	if (asoc->cc_functions.sctp_cwnd_update_packet_transmitted) {
 		(*asoc->cc_functions.sctp_cwnd_update_packet_transmitted) (stcb, net);
 	}
 }
 
 /*
  * Remove stray chunks from the association's control send queue.
  *
  * Chunks of the types listed below are always removed.  A STREAM-RESET
  * chunk is removed unless it is the one referenced by asoc->str_reset.
  * Chunks of any other type are left on the queue.  'so_locked' is passed
  * through to sctp_free_a_chunk().
  */
 static void
 sctp_clean_up_ctl(struct sctp_tcb *stcb, struct sctp_association *asoc, int so_locked)
 {
 	struct sctp_tmit_chunk *cur, *next;
 
 	TAILQ_FOREACH_SAFE(cur, &asoc->control_send_queue, sctp_next, next) {
 		switch (cur->rec.chunk_id.id) {
 		case SCTP_SELECTIVE_ACK:
 		case SCTP_NR_SELECTIVE_ACK:
 		case SCTP_HEARTBEAT_REQUEST:
 		case SCTP_HEARTBEAT_ACK:
 		case SCTP_FORWARD_CUM_TSN:
 		case SCTP_SHUTDOWN:
 		case SCTP_SHUTDOWN_ACK:
 		case SCTP_OPERATION_ERROR:
 		case SCTP_PACKET_DROPPED:
 		case SCTP_COOKIE_ACK:
 		case SCTP_ECN_CWR:
 		case SCTP_ASCONF_ACK:
 			/* Stray chunks must be cleaned up */
 			break;
 		case SCTP_STREAM_RESET:
 			/* special handling, keep the pending request */
 			if (cur == asoc->str_reset) {
 				continue;
 			}
 			break;
 		default:
 			continue;
 		}
 
 		TAILQ_REMOVE(&asoc->control_send_queue, cur, sctp_next);
 		asoc->ctrl_queue_cnt--;
 		if (cur->data != NULL) {
 			sctp_m_freem(cur->data);
 			cur->data = NULL;
 		}
 		if (cur->rec.chunk_id.id == SCTP_FORWARD_CUM_TSN) {
 			asoc->fwd_tsn_cnt--;
 		}
 		sctp_free_a_chunk(stcb, cur, so_locked);
 	}
 }
 
 /*
  * Decide how many bytes of an incomplete message may be taken now.
  *
  * length is the amount currently queued for the message, space_left the
  * room remaining in the packet being filled and frag_point the largest
  * fragment payload.  Returns the number of bytes the caller may move, or 0
  * when the message should be left alone for the time being.
  */
 static uint32_t
 sctp_can_we_split_this(struct sctp_tcb *stcb, uint32_t length,
     uint32_t space_left, uint32_t frag_point, int eeor_on)
 {
 	if (eeor_on) {
 		if (space_left < length) {
 			/* More queued than fits: fill the rest of the packet. */
 			return (space_left);
 		}
 		/*
 		 * Everything queued fits.  Send it only when nothing is in
 		 * flight, since this may be all the application provides;
 		 * otherwise the next SACK gives another chance to transmit,
 		 * so wait for more data.
 		 */
 		return ((stcb->asoc.total_flight == 0) ? length : 0);
 	}
 	/*
 	 * A send buffer smaller than the fragmentation point can never hold
 	 * a full fragment, so splitting has to be allowed.
 	 */
 	if (SCTP_SB_LIMIT_SND(stcb->sctp_socket) < frag_point) {
 		return (length);
 	}
 	/* The message fits entirely: no split in non-EEOR mode. */
 	if (length <= space_left) {
 		return (0);
 	}
 	/* Splitting would leave a sub-optimal residual behind. */
 	if ((length - space_left) < SCTP_BASE_SYSCTL(sctp_min_residual)) {
 		return (0);
 	}
 	/*
 	 * length exceeds space_left here.  Split only when the piece taken
 	 * reaches the minimum split point (capped by frag_point).
 	 */
 	if (space_left < min(SCTP_BASE_SYSCTL(sctp_min_split_point), frag_point)) {
 		/* Nope, can't split */
 		return (0);
 	}
 	return (min(space_left, frag_point));
 }
 
 /*
  * Build one DATA chunk (or I-DATA chunk when asoc.idata_supported is set)
  * from the message at the head of strq->outqueue and append it to
  * asoc->send_queue, assigning it the next TSN.
  *
  * At most one chunk is produced per call.  A complete message is cut at
  * frag_point; for an incomplete message sctp_can_we_split_this() decides
  * how much, if anything, may be taken given space_left.  A fully consumed
  * message whose sender is done is unlinked from the stream and freed.
  *
  * Returns the number of payload bytes moved into the new chunk, or 0 when
  * nothing was moved.  *giveup is set to 1 when the head message cannot
  * supply data right now or no chunk could be allocated; *bail is set to 1
  * when an mbuf copy, a header mbuf allocation or the header prepend failed.
  * Neither flag is written when the stream queue is simply empty, and this
  * function never clears them.
  */
 static uint32_t
 sctp_move_to_outqueue(struct sctp_tcb *stcb,
     struct sctp_nets *net,
     struct sctp_stream_out *strq,
     uint32_t space_left,
     uint32_t frag_point,
     int *giveup,
     int eeor_mode,
     int *bail,
     int so_locked)
 {
 	/* Move from the stream to the send_queue keeping track of the total */
 	struct sctp_association *asoc;
 	struct sctp_stream_queue_pending *sp;
 	struct sctp_tmit_chunk *chk;
 	struct sctp_data_chunk *dchkh = NULL;
 	struct sctp_idata_chunk *ndchkh = NULL;
 	uint32_t to_move, length;
 	int leading;
 	uint8_t rcv_flags = 0;
 	uint8_t some_taken;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	asoc = &stcb->asoc;
 one_more_time:
 	/* sa_ignore FREED_MEMORY */
 	sp = TAILQ_FIRST(&strq->outqueue);
 	if (sp == NULL) {
 		/*
 		 * NOTE(review): the head is re-read right after it was seen
 		 * to be NULL; this looks like a leftover from code that did
 		 * something in between the two reads - confirm.
 		 */
 		sp = TAILQ_FIRST(&strq->outqueue);
 		if (sp) {
 			goto one_more_time;
 		}
 		/*
 		 * Empty queue but the stream still claims an unfinished
 		 * message (without EEOR and without I-DATA): report it and
 		 * clear the flag.
 		 */
 		if ((sctp_is_feature_on(stcb->sctp_ep, SCTP_PCB_FLAGS_EXPLICIT_EOR) == 0) &&
 		    (stcb->asoc.idata_supported == 0) &&
 		    (strq->last_msg_incomplete)) {
 			SCTP_PRINTF("Huh? Stream:%d lm_in_c=%d but queue is NULL\n",
 			    strq->sid,
 			    strq->last_msg_incomplete);
 			strq->last_msg_incomplete = 0;
 		}
 		to_move = 0;
 		goto out_of;
 	}
 	if ((sp->msg_is_complete) && (sp->length == 0)) {
 		if (sp->sender_all_done) {
 			/*
 			 * We are doing deferred cleanup. Last time through
 			 * when we took all the data the sender_all_done was
 			 * not set.
 			 */
 			if ((sp->put_last_out == 0) && (sp->discard_rest == 0)) {
 				SCTP_PRINTF("Gak, put out entire msg with NO end!-1\n");
 				SCTP_PRINTF("sender_done:%d len:%d msg_comp:%d put_last_out:%d\n",
 				    sp->sender_all_done,
 				    sp->length,
 				    sp->msg_is_complete,
 				    sp->put_last_out);
 			}
 			atomic_subtract_int(&asoc->stream_queue_cnt, 1);
 			TAILQ_REMOVE(&strq->outqueue, sp, next);
 			stcb->asoc.ss_functions.sctp_ss_remove_from_stream(stcb, asoc, strq, sp);
 			/*
 			 * The stream is fully drained while a reset is
 			 * pending on it: flag the association.
 			 */
 			if ((strq->state == SCTP_STREAM_RESET_PENDING) &&
 			    (strq->chunks_on_queues == 0) &&
 			    TAILQ_EMPTY(&strq->outqueue)) {
 				stcb->asoc.trigger_reset = 1;
 			}
 			if (sp->net) {
 				sctp_free_remote_addr(sp->net);
 				sp->net = NULL;
 			}
 			if (sp->data) {
 				sctp_m_freem(sp->data);
 				sp->data = NULL;
 			}
 			sctp_free_a_strmoq(stcb, sp, so_locked);
 			/* back to get the next msg */
 			goto one_more_time;
 		} else {
 			/*
 			 * sender just finished this but still holds a
 			 * reference
 			 */
 			*giveup = 1;
 			to_move = 0;
 			goto out_of;
 		}
 	} else {
 		/* is there some to get */
 		if (sp->length == 0) {
 			/* no */
 			*giveup = 1;
 			to_move = 0;
 			goto out_of;
 		} else if (sp->discard_rest) {
 			/*
 			 * Whack down the size: the queued remainder is
 			 * dropped, so take it out of the output queue total
 			 * and, for TCP-style endpoints, out of the socket
 			 * send buffer count.
 			 */
 			atomic_subtract_int(&stcb->asoc.total_output_queue_size, sp->length);
 			if ((stcb->sctp_socket != NULL) &&
 			    ((stcb->sctp_ep->sctp_flags & SCTP_PCB_FLAGS_TCPTYPE) ||
 			    (stcb->sctp_ep->sctp_flags & SCTP_PCB_FLAGS_IN_TCPPOOL))) {
 				atomic_subtract_int(&stcb->sctp_socket->so_snd.sb_cc, sp->length);
 			}
 			if (sp->data) {
 				sctp_m_freem(sp->data);
 				sp->data = NULL;
 				sp->tail_mbuf = NULL;
 			}
 			sp->length = 0;
 			sp->some_taken = 1;
 			*giveup = 1;
 			to_move = 0;
 			goto out_of;
 		}
 	}
 	/*
 	 * Snapshot some_taken and length: the failure paths below restore
 	 * some_taken, and length is compared against sp->length later to
 	 * detect a change.
 	 */
 	some_taken = sp->some_taken;
 	length = sp->length;
 	if (sp->msg_is_complete) {
 		/* The message is complete */
 		to_move = min(length, frag_point);
 		if (to_move == length) {
 			/* All of it fits in the MTU */
 			if (sp->some_taken) {
 				rcv_flags |= SCTP_DATA_LAST_FRAG;
 			} else {
 				rcv_flags |= SCTP_DATA_NOT_FRAG;
 			}
 			sp->put_last_out = 1;
 			if (sp->sinfo_flags & SCTP_SACK_IMMEDIATELY) {
 				rcv_flags |= SCTP_DATA_SACK_IMMEDIATELY;
 			}
 		} else {
 			/* Not all of it fits, we fragment */
 			if (sp->some_taken == 0) {
 				rcv_flags |= SCTP_DATA_FIRST_FRAG;
 			}
 			sp->some_taken = 1;
 		}
 	} else {
 		/* Incomplete message: ask how much, if any, may be taken. */
 		to_move = sctp_can_we_split_this(stcb, length, space_left, frag_point, eeor_mode);
 		if (to_move > 0) {
 			if (to_move >= length) {
 				to_move = length;
 			}
 			if (sp->some_taken == 0) {
 				rcv_flags |= SCTP_DATA_FIRST_FRAG;
 				sp->some_taken = 1;
 			}
 		} else {
 			/* Nothing to take. */
 			*giveup = 1;
 			to_move = 0;
 			goto out_of;
 		}
 	}
 
 	/* If we reach here, we can copy out a chunk */
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		/* No chunk memory */
 		*giveup = 1;
 		to_move = 0;
 		goto out_of;
 	}
 	/*
 	 * Setup for unordered if needed by looking at the user sent info
 	 * flags.
 	 */
 	if (sp->sinfo_flags & SCTP_UNORDERED) {
 		rcv_flags |= SCTP_DATA_UNORDERED;
 	}
 	/* With the sysctl enabled, an EOF send also requests an immediate SACK. */
 	if (SCTP_BASE_SYSCTL(sctp_enable_sack_immediately) &&
 	    (sp->sinfo_flags & SCTP_EOF) == SCTP_EOF) {
 		rcv_flags |= SCTP_DATA_SACK_IMMEDIATELY;
 	}
 	/* clear out the chunk before setting up */
 	memset(chk, 0, sizeof(*chk));
 	chk->rec.data.rcv_flags = rcv_flags;
 
 	if (to_move >= length) {
 		/* we think we can steal the whole thing */
 		if (to_move < sp->length) {
 			/* bail, it changed */
 			goto dont_do_it;
 		}
 		chk->data = sp->data;
 		chk->last_mbuf = sp->tail_mbuf;
 		/* register the stealing */
 		sp->data = sp->tail_mbuf = NULL;
 	} else {
 		struct mbuf *m;
 
 dont_do_it:
 		/* Partial take: copy the first to_move bytes into the chunk. */
 		chk->data = SCTP_M_COPYM(sp->data, 0, to_move, M_NOWAIT);
 		chk->last_mbuf = NULL;
 		if (chk->data == NULL) {
 			/* Copy failed: undo the some_taken change and bail. */
 			sp->some_taken = some_taken;
 			sctp_free_a_chunk(stcb, chk, so_locked);
 			*bail = 1;
 			to_move = 0;
 			goto out_of;
 		}
 #ifdef SCTP_MBUF_LOGGING
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 			sctp_log_mbc(chk->data, SCTP_MBUF_ICOPY);
 		}
 #endif
 		/* Pull off the data */
 		m_adj(sp->data, to_move);
 		/* Now lets work our way down and compact it */
 		m = sp->data;
 		while (m && (SCTP_BUF_LEN(m) == 0)) {
 			sp->data = SCTP_BUF_NEXT(m);
 			SCTP_BUF_NEXT(m) = NULL;
 			if (sp->tail_mbuf == m) {
 				/*-
 				 * Freeing tail? TSNH since
 				 * we supposedly were taking less
 				 * than the sp->length.
 				 */
 #ifdef INVARIANTS
 				panic("Huh, freeing tail? - TSNH");
 #else
 				SCTP_PRINTF("Huh, freeing tail? - TSNH\n");
 				sp->tail_mbuf = sp->data = NULL;
 				sp->length = 0;
 #endif
 			}
 			sctp_m_free(m);
 			m = sp->data;
 		}
 	}
 	if (SCTP_BUF_IS_EXTENDED(chk->data)) {
 		chk->copy_by_ref = 1;
 	} else {
 		chk->copy_by_ref = 0;
 	}
 	/*
 	 * get last_mbuf and counts of mb usage This is ugly but hopefully
 	 * its only one mbuf.
 	 */
 	if (chk->last_mbuf == NULL) {
 		chk->last_mbuf = chk->data;
 		while (SCTP_BUF_NEXT(chk->last_mbuf) != NULL) {
 			chk->last_mbuf = SCTP_BUF_NEXT(chk->last_mbuf);
 		}
 	}
 
 	if (to_move > length) {
 		/*- This should not happen either
 		 * since we always lower to_move to the size
 		 * of sp->length if its larger.
 		 */
 #ifdef INVARIANTS
 		panic("Huh, how can to_move be larger?");
 #else
 		SCTP_PRINTF("Huh, how can to_move be larger?\n");
 		sp->length = 0;
 #endif
 	} else {
 		atomic_subtract_int(&sp->length, to_move);
 	}
 	leading = SCTP_DATA_CHUNK_OVERHEAD(stcb);
 	if (M_LEADINGSPACE(chk->data) < leading) {
 		/* Not enough room for a chunk header, get some */
 		struct mbuf *m;
 
 		m = sctp_get_mbuf_for_msg(1, 0, M_NOWAIT, 1, MT_DATA);
 		if (m == NULL) {
 			/*
 			 * we're in trouble here. _PREPEND below will free
 			 * all the data if there is no leading space, so we
 			 * must put the data back and restore.
 			 */
 			if (sp->data == NULL) {
 				/* unsteal the data */
 				sp->data = chk->data;
 				sp->tail_mbuf = chk->last_mbuf;
 			} else {
 				struct mbuf *m_tmp;
 
 				/* reassemble the data */
 				m_tmp = sp->data;
 				sp->data = chk->data;
 				SCTP_BUF_NEXT(chk->last_mbuf) = m_tmp;
 			}
 			/* Roll back the bookkeeping done above. */
 			sp->some_taken = some_taken;
 			atomic_add_int(&sp->length, to_move);
 			/* The data went back to sp; the chunk must not free it. */
 			chk->data = NULL;
 			*bail = 1;
 			sctp_free_a_chunk(stcb, chk, so_locked);
 			to_move = 0;
 			goto out_of;
 		} else {
 			/* Put an empty mbuf in front to hold the chunk header. */
 			SCTP_BUF_LEN(m) = 0;
 			SCTP_BUF_NEXT(m) = chk->data;
 			chk->data = m;
 			M_ALIGN(chk->data, 4);
 		}
 	}
 	SCTP_BUF_PREPEND(chk->data, SCTP_DATA_CHUNK_OVERHEAD(stcb), M_NOWAIT);
 	if (chk->data == NULL) {
 		/* HELP, TSNH since we assured it would not above? */
 #ifdef INVARIANTS
 		panic("prepend fails HELP?");
 #else
 		SCTP_PRINTF("prepend fails HELP?\n");
 		sctp_free_a_chunk(stcb, chk, so_locked);
 #endif
 		*bail = 1;
 		to_move = 0;
 		goto out_of;
 	}
 	/*
 	 * NOTE(review): presumably charges the chunk header bytes to the
 	 * send buffer accounting - confirm against sctp_snd_sb_alloc().
 	 */
 	sctp_snd_sb_alloc(stcb, SCTP_DATA_CHUNK_OVERHEAD(stcb));
 	/* Payload plus chunk header; padding is added to send_size further down. */
 	chk->book_size = chk->send_size = (uint16_t)(to_move + SCTP_DATA_CHUNK_OVERHEAD(stcb));
 	chk->book_size_scale = 0;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 
 	chk->flags = 0;
 	chk->asoc = &stcb->asoc;
 	chk->pad_inplace = 0;
 	chk->no_fr_allowed = 0;
 	/*
 	 * Pick the message id.  The per-stream counter advances only when
 	 * rcv_flags has SCTP_DATA_LAST_FRAG set.
 	 */
 	if (stcb->asoc.idata_supported == 0) {
 		if (rcv_flags & SCTP_DATA_UNORDERED) {
 			/* Just use 0. The receiver ignores the values. */
 			chk->rec.data.mid = 0;
 		} else {
 			chk->rec.data.mid = strq->next_mid_ordered;
 			if (rcv_flags & SCTP_DATA_LAST_FRAG) {
 				strq->next_mid_ordered++;
 			}
 		}
 	} else {
 		/* With I-DATA, unordered messages have their own counter. */
 		if (rcv_flags & SCTP_DATA_UNORDERED) {
 			chk->rec.data.mid = strq->next_mid_unordered;
 			if (rcv_flags & SCTP_DATA_LAST_FRAG) {
 				strq->next_mid_unordered++;
 			}
 		} else {
 			chk->rec.data.mid = strq->next_mid_ordered;
 			if (rcv_flags & SCTP_DATA_LAST_FRAG) {
 				strq->next_mid_ordered++;
 			}
 		}
 	}
 	chk->rec.data.sid = sp->sid;
 	chk->rec.data.ppid = sp->ppid;
 	chk->rec.data.context = sp->context;
 	chk->rec.data.doing_fast_retransmit = 0;
 
 	chk->rec.data.timetodrop = sp->ts;
 	chk->flags = sp->act_flags;
 
 	/* Inherit the message's destination, taking a reference on it. */
 	if (sp->net) {
 		chk->whoTo = sp->net;
 		atomic_add_int(&chk->whoTo->ref_count, 1);
 	} else
 		chk->whoTo = NULL;
 
 	if (sp->holds_key_ref) {
 		chk->auth_keyid = sp->auth_keyid;
 		sctp_auth_key_acquire(stcb, chk->auth_keyid);
 		chk->holds_key_ref = 1;
 	}
 	/* Tell the stream scheduler how much was taken from this stream. */
 	stcb->asoc.ss_functions.sctp_ss_scheduled(stcb, net, asoc, strq, to_move);
 	/* Assign the next TSN and advance asoc->sending_seq. */
 	chk->rec.data.tsn = atomic_fetchadd_int(&asoc->sending_seq, 1);
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_AT_SEND_2_OUTQ) {
 		sctp_misc_ints(SCTP_STRMOUT_LOG_SEND,
 		    (uint32_t)(uintptr_t)stcb, sp->length,
 		    (uint32_t)((chk->rec.data.sid << 16) | (0x0000ffff & chk->rec.data.mid)),
 		    chk->rec.data.tsn);
 	}
 	/* Point the matching header view at the space prepended above. */
 	if (stcb->asoc.idata_supported == 0) {
 		dchkh = mtod(chk->data, struct sctp_data_chunk *);
 	} else {
 		ndchkh = mtod(chk->data, struct sctp_idata_chunk *);
 	}
 	/*
 	 * Put the rest of the things in place now. Size was done earlier in
 	 * previous loop prior to padding.
 	 */
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 #ifdef SCTP_ASOCLOG_OF_TSNS
 	/* Record the chunk in the circular outbound TSN log. */
 	if (asoc->tsn_out_at >= SCTP_TSN_LOG_SIZE) {
 		asoc->tsn_out_at = 0;
 		asoc->tsn_out_wrapped = 1;
 	}
 	asoc->out_tsnlog[asoc->tsn_out_at].tsn = chk->rec.data.tsn;
 	asoc->out_tsnlog[asoc->tsn_out_at].strm = chk->rec.data.sid;
 	asoc->out_tsnlog[asoc->tsn_out_at].seq = chk->rec.data.mid;
 	asoc->out_tsnlog[asoc->tsn_out_at].sz = chk->send_size;
 	asoc->out_tsnlog[asoc->tsn_out_at].flgs = chk->rec.data.rcv_flags;
 	asoc->out_tsnlog[asoc->tsn_out_at].stcb = (void *)stcb;
 	asoc->out_tsnlog[asoc->tsn_out_at].in_pos = asoc->tsn_out_at;
 	asoc->out_tsnlog[asoc->tsn_out_at].in_out = 2;
 	asoc->tsn_out_at++;
 #endif
 	/* Fill in the on-the-wire chunk header (network byte order). */
 	if (stcb->asoc.idata_supported == 0) {
 		dchkh->ch.chunk_type = SCTP_DATA;
 		dchkh->ch.chunk_flags = chk->rec.data.rcv_flags;
 		dchkh->dp.tsn = htonl(chk->rec.data.tsn);
 		dchkh->dp.sid = htons(strq->sid);
 		dchkh->dp.ssn = htons((uint16_t)chk->rec.data.mid);
 		dchkh->dp.ppid = chk->rec.data.ppid;
 		dchkh->ch.chunk_length = htons(chk->send_size);
 	} else {
 		ndchkh->ch.chunk_type = SCTP_IDATA;
 		ndchkh->ch.chunk_flags = chk->rec.data.rcv_flags;
 		ndchkh->dp.tsn = htonl(chk->rec.data.tsn);
 		ndchkh->dp.sid = htons(strq->sid);
 		ndchkh->dp.reserved = htons(0);
 		ndchkh->dp.mid = htonl(chk->rec.data.mid);
 		/*
 		 * The chunk built while sp->fsn is 0 carries the PPID in the
 		 * ppid_fsn field; later ones carry the fragment number there.
 		 */
 		if (sp->fsn == 0)
 			ndchkh->dp.ppid_fsn.ppid = chk->rec.data.ppid;
 		else
 			ndchkh->dp.ppid_fsn.fsn = htonl(sp->fsn);
 		sp->fsn++;
 		ndchkh->ch.chunk_length = htons(chk->send_size);
 	}
 	/* Now advance the chk->send_size by the actual pad needed. */
 	if (chk->send_size < SCTP_SIZE32(chk->book_size)) {
 		/* need a pad */
 		struct mbuf *lm;
 		int pads;
 
 		pads = SCTP_SIZE32(chk->book_size) - chk->send_size;
 		lm = sctp_pad_lastmbuf(chk->data, pads, chk->last_mbuf);
 		if (lm != NULL) {
 			chk->last_mbuf = lm;
 			chk->pad_inplace = 1;
 		}
 		/* send_size grows even when the in-place pad was not added. */
 		chk->send_size += pads;
 	}
 	if (PR_SCTP_ENABLED(chk->flags)) {
 		asoc->pr_sctp_cnt++;
 	}
 	if (sp->msg_is_complete && (sp->length == 0) && (sp->sender_all_done)) {
 		/* All done pull and kill the message */
 		if (sp->put_last_out == 0) {
 			SCTP_PRINTF("Gak, put out entire msg with NO end!-2\n");
 			SCTP_PRINTF("sender_done:%d len:%d msg_comp:%d put_last_out:%d\n",
 			    sp->sender_all_done,
 			    sp->length,
 			    sp->msg_is_complete,
 			    sp->put_last_out);
 		}
 		atomic_subtract_int(&asoc->stream_queue_cnt, 1);
 		TAILQ_REMOVE(&strq->outqueue, sp, next);
 		stcb->asoc.ss_functions.sctp_ss_remove_from_stream(stcb, asoc, strq, sp);
 		if ((strq->state == SCTP_STREAM_RESET_PENDING) &&
 		    (strq->chunks_on_queues == 0) &&
 		    TAILQ_EMPTY(&strq->outqueue)) {
 			stcb->asoc.trigger_reset = 1;
 		}
 		if (sp->net) {
 			sctp_free_remote_addr(sp->net);
 			sp->net = NULL;
 		}
 		if (sp->data) {
 			sctp_m_freem(sp->data);
 			sp->data = NULL;
 		}
 		/* sp is handed back here and is not referenced below. */
 		sctp_free_a_strmoq(stcb, sp, so_locked);
 	}
 	/* Queue the finished chunk and update the per-asoc/per-stream counts. */
 	asoc->chunks_on_out_queue++;
 	strq->chunks_on_queues++;
 	TAILQ_INSERT_TAIL(&asoc->send_queue, chk, sctp_next);
 	asoc->send_queue_cnt++;
 out_of:
 	return (to_move);
 }
 
 /*
  * Move up to roughly one packet's worth of data for destination net from
  * the stream queues onto the association's send queue.
  *
  * The budget starts at net->mtu less the minimum per-family overhead and
  * one data chunk header, rounded down to a multiple of four.  Streams are
  * picked by the configured stream scheduler and drained one chunk at a
  * time through sctp_move_to_outqueue() until the budget is used up, no
  * stream is selected, or the mover reports giveup/bail.  *quit_now is set
  * to 1 when the mover bailed out.
  */
 static void
 sctp_fill_outqueue(struct sctp_tcb *stcb, struct sctp_nets *net,
     uint32_t frag_point, int eeor_mode, int *quit_now,
     int so_locked)
 {
 	struct sctp_association *asoc;
 	struct sctp_stream_out *strq;
 	uint32_t space_left, moved;
 	uint32_t total_moved = 0;
 	int giveup = 0;
 	int bail = 0;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	asoc = &stcb->asoc;
 	switch (net->ro._l_addr.sa.sa_family) {
 #ifdef INET
 	case AF_INET:
 		space_left = net->mtu - SCTP_MIN_V4_OVERHEAD;
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		space_left = net->mtu - SCTP_MIN_OVERHEAD;
 		break;
 #endif
 	default:
 		/* TSNH */
 		space_left = net->mtu;
 		break;
 	}
 	/* Reserve room for the data chunk header, then word-align. */
 	space_left -= SCTP_DATA_CHUNK_OVERHEAD(stcb);
 	space_left &= 0xfffffffc;
 
 	for (strq = stcb->asoc.ss_functions.sctp_ss_select_stream(stcb, net, asoc);
 	    (strq != NULL) && (space_left > 0);
 	    strq = stcb->asoc.ss_functions.sctp_ss_select_stream(stcb, net, asoc)) {
 		moved = sctp_move_to_outqueue(stcb, net, strq, space_left,
 		    frag_point, &giveup, eeor_mode,
 		    &bail, so_locked);
 		if (giveup || bail) {
 			break;
 		}
 		total_moved += moved;
 		/* Charge the payload, clamping at zero. */
 		space_left = (space_left >= moved) ? (space_left - moved) : 0;
 		/* The next chunk needs a header of its own. */
 		if (space_left < SCTP_DATA_CHUNK_OVERHEAD(stcb)) {
 			space_left = 0;
 		} else {
 			space_left -= SCTP_DATA_CHUNK_OVERHEAD(stcb);
 		}
 		space_left &= 0xfffffffc;
 	}
 	if (bail) {
 		*quit_now = 1;
 	}
 
 	stcb->asoc.ss_functions.sctp_ss_packet_done(stcb, net, asoc);
 
 	if (total_moved != 0) {
 		return;
 	}
 	/* Nothing was moved: account for the dry run. */
 	if ((stcb->asoc.sctp_cmt_on_off == 0) &&
 	    (net == stcb->asoc.primary_destination)) {
 		/* ran dry for primary network net */
 		SCTP_STAT_INCR(sctps_primary_randry);
 	} else if (stcb->asoc.sctp_cmt_on_off > 0) {
 		/* ran dry with CMT on */
 		SCTP_STAT_INCR(sctps_cmt_randry);
 	}
 }
 
 /*
  * Mark every ECN-ECHO chunk on the association's control send queue as
  * unsent again.  Chunks of any other type are left untouched.
  */
 void
 sctp_fix_ecn_echo(struct sctp_association *asoc)
 {
 	struct sctp_tmit_chunk *ctl;
 
 	TAILQ_FOREACH(ctl, &asoc->control_send_queue, sctp_next) {
 		if (ctl->rec.chunk_id.id != SCTP_ECN_ECHO) {
 			continue;
 		}
 		ctl->sent = SCTP_DATAGRAM_UNSENT;
 	}
 }
 
 /*
  * Detach all not-yet-sent data from destination net.
  *
  * Every pending message on any outgoing stream queue and every chunk on
  * the send queue that is bound to net drops its reference on it and has
  * its destination cleared to NULL.  A NULL net is a no-op.
  */
 void
 sctp_move_chunks_from_net(struct sctp_tcb *stcb, struct sctp_nets *net)
 {
 	struct sctp_association *asoc;
 	struct sctp_stream_queue_pending *pending;
 	struct sctp_tmit_chunk *queued;
 	unsigned int sid;
 
 	if (net == NULL) {
 		return;
 	}
 	asoc = &stcb->asoc;
 	/* First the messages still sitting on the stream queues ... */
 	for (sid = 0; sid < asoc->streamoutcnt; sid++) {
 		TAILQ_FOREACH(pending, &asoc->strmout[sid].outqueue, next) {
 			if (pending->net != net) {
 				continue;
 			}
 			sctp_free_remote_addr(pending->net);
 			pending->net = NULL;
 		}
 	}
 	/* ... then the chunks already moved to the send queue. */
 	TAILQ_FOREACH(queued, &asoc->send_queue, sctp_next) {
 		if (queued->whoTo != net) {
 			continue;
 		}
 		sctp_free_remote_addr(queued->whoTo);
 		queued->whoTo = NULL;
 	}
 }
 
 int
 sctp_med_chunk_output(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     struct sctp_association *asoc,
     int *num_out,
     int *reason_code,
     int control_only, int from_where,
     struct timeval *now, int *now_filled,
     uint32_t frag_point, int so_locked)
 {
 	/**
 	 * Ok this is the generic chunk service queue. we must do the
 	 * following:
 	 * - Service the stream queue that is next, moving any
 	 *   message (note I must get a complete message i.e. FIRST/MIDDLE and
 	 *   LAST to the out queue in one pass) and assigning TSN's. This
 	 *   only applies though if the peer does not support NDATA. For NDATA
 	 *   chunks its ok to not send the entire message ;-)
 	 * - Check to see if the cwnd/rwnd allows any output, if so we go ahead and
 	 *   formulate and send the low level chunks. Making sure to combine
 	 *   any control in the control chunk queue also.
 	 */
 	struct sctp_nets *net, *start_at, *sack_goes_to = NULL, *old_start_at = NULL;
 	struct mbuf *outchain, *endoutchain;
 	struct sctp_tmit_chunk *chk, *nchk;
 
 	/* temp arrays for unlinking */
 	struct sctp_tmit_chunk *data_list[SCTP_MAX_DATA_BUNDLING];
 	int no_fragmentflg, error;
 	unsigned int max_rwnd_per_dest, max_send_per_dest;
 	int one_chunk, hbflag, skip_data_for_this_net;
 	int asconf, cookie, no_out_cnt;
 	int bundle_at, ctl_cnt, no_data_chunks, eeor_mode;
 	unsigned int mtu, r_mtu, omtu, mx_mtu, to_out;
 	int tsns_sent = 0;
 	uint32_t auth_offset;
 	struct sctp_auth_chunk *auth;
 	uint16_t auth_keyid;
 	int override_ok = 1;
 	int skip_fill_up = 0;
 	int data_auth_reqd = 0;
 
 	/*
 	 * JRS 5/14/07 - Add flag for whether a heartbeat is sent to the
 	 * destination.
 	 */
 	int quit_now = 0;
 	bool use_zero_crc;
 
 	*num_out = 0;
 	*reason_code = 0;
 	auth_keyid = stcb->asoc.authinfo.active_keyid;
 	if ((asoc->state & SCTP_STATE_SHUTDOWN_PENDING) ||
 	    (SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_RECEIVED) ||
 	    (sctp_is_feature_on(inp, SCTP_PCB_FLAGS_EXPLICIT_EOR))) {
 		eeor_mode = 1;
 	} else {
 		eeor_mode = 0;
 	}
 	ctl_cnt = no_out_cnt = asconf = cookie = 0;
 	/*
 	 * First lets prime the pump. For each destination, if there is room
 	 * in the flight size, attempt to pull an MTU's worth out of the
 	 * stream queues into the general send_queue
 	 */
 #ifdef SCTP_AUDITING_ENABLED
 	sctp_audit_log(0xC2, 2);
 #endif
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	hbflag = 0;
 	if (control_only)
 		no_data_chunks = 1;
 	else
 		no_data_chunks = 0;
 
 	/* Nothing to possible to send? */
 	if ((TAILQ_EMPTY(&asoc->control_send_queue) ||
 	    (asoc->ctrl_queue_cnt == stcb->asoc.ecn_echo_cnt_onq)) &&
 	    TAILQ_EMPTY(&asoc->asconf_send_queue) &&
 	    TAILQ_EMPTY(&asoc->send_queue) &&
 	    sctp_is_there_unsent_data(stcb, so_locked) == 0) {
 nothing_to_send:
 		*reason_code = 9;
 		return (0);
 	}
 	if (asoc->peers_rwnd == 0) {
 		/* No room in peers rwnd */
 		*reason_code = 1;
 		if (asoc->total_flight > 0) {
 			/* we are allowed one chunk in flight */
 			no_data_chunks = 1;
 		}
 	}
 	if (stcb->asoc.ecn_echo_cnt_onq) {
 		/* Record where a sack goes, if any */
 		if (no_data_chunks &&
 		    (asoc->ctrl_queue_cnt == stcb->asoc.ecn_echo_cnt_onq)) {
 			/* Nothing but ECNe to send - we don't do that */
 			goto nothing_to_send;
 		}
 		TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
 			if ((chk->rec.chunk_id.id == SCTP_SELECTIVE_ACK) ||
 			    (chk->rec.chunk_id.id == SCTP_NR_SELECTIVE_ACK)) {
 				sack_goes_to = chk->whoTo;
 				break;
 			}
 		}
 	}
 	max_rwnd_per_dest = ((asoc->peers_rwnd + asoc->total_flight) / asoc->numnets);
 	if (stcb->sctp_socket)
 		max_send_per_dest = SCTP_SB_LIMIT_SND(stcb->sctp_socket) / asoc->numnets;
 	else
 		max_send_per_dest = 0;
 	if (no_data_chunks == 0) {
 		/* How many non-directed chunks are there? */
 		TAILQ_FOREACH(chk, &asoc->send_queue, sctp_next) {
 			if (chk->whoTo == NULL) {
 				/*
 				 * We already have non-directed chunks on
 				 * the queue, no need to do a fill-up.
 				 */
 				skip_fill_up = 1;
 				break;
 			}
 		}
 	}
 	if ((no_data_chunks == 0) &&
 	    (skip_fill_up == 0) &&
 	    (!stcb->asoc.ss_functions.sctp_ss_is_empty(stcb, asoc))) {
 		TAILQ_FOREACH(net, &asoc->nets, sctp_next) {
 			/*
 			 * This for loop we are in takes in each net, if
 			 * its's got space in cwnd and has data sent to it
 			 * (when CMT is off) then it calls
 			 * sctp_fill_outqueue for the net. This gets data on
 			 * the send queue for that network.
 			 *
 			 * In sctp_fill_outqueue TSN's are assigned and data
 			 * is copied out of the stream buffers. Note mostly
 			 * copy by reference (we hope).
 			 */
 			net->window_probe = 0;
 			if ((net != stcb->asoc.alternate) &&
 			    ((net->dest_state & SCTP_ADDR_PF) ||
 			    ((net->dest_state & SCTP_ADDR_REACHABLE) == 0) ||
 			    (net->dest_state & SCTP_ADDR_UNCONFIRMED))) {
 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 					sctp_log_cwnd(stcb, net, 1,
 					    SCTP_CWND_LOG_FILL_OUTQ_CALLED);
 				}
 				continue;
 			}
 			if ((stcb->asoc.cc_functions.sctp_cwnd_new_transmission_begins) &&
 			    (net->flight_size == 0)) {
 				(*stcb->asoc.cc_functions.sctp_cwnd_new_transmission_begins) (stcb, net);
 			}
 			if (net->flight_size >= net->cwnd) {
 				/* skip this network, no room - can't fill */
 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 					sctp_log_cwnd(stcb, net, 3,
 					    SCTP_CWND_LOG_FILL_OUTQ_CALLED);
 				}
 				continue;
 			}
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 				sctp_log_cwnd(stcb, net, 4, SCTP_CWND_LOG_FILL_OUTQ_CALLED);
 			}
 			sctp_fill_outqueue(stcb, net, frag_point, eeor_mode, &quit_now, so_locked);
 			if (quit_now) {
 				/* memory alloc failure */
 				no_data_chunks = 1;
 				break;
 			}
 		}
 	}
 	/* now service each destination and send out what we can for it */
 	/* Nothing to send? */
 	if (TAILQ_EMPTY(&asoc->control_send_queue) &&
 	    TAILQ_EMPTY(&asoc->asconf_send_queue) &&
 	    TAILQ_EMPTY(&asoc->send_queue)) {
 		*reason_code = 8;
 		return (0);
 	}
 
 	if (asoc->sctp_cmt_on_off > 0) {
 		/* get the last start point */
 		start_at = asoc->last_net_cmt_send_started;
 		if (start_at == NULL) {
 			/* null so to beginning */
 			start_at = TAILQ_FIRST(&asoc->nets);
 		} else {
 			start_at = TAILQ_NEXT(asoc->last_net_cmt_send_started, sctp_next);
 			if (start_at == NULL) {
 				start_at = TAILQ_FIRST(&asoc->nets);
 			}
 		}
 		asoc->last_net_cmt_send_started = start_at;
 	} else {
 		start_at = TAILQ_FIRST(&asoc->nets);
 	}
 	TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
 		if (chk->whoTo == NULL) {
 			if (asoc->alternate) {
 				chk->whoTo = asoc->alternate;
 			} else {
 				chk->whoTo = asoc->primary_destination;
 			}
 			atomic_add_int(&chk->whoTo->ref_count, 1);
 		}
 	}
 	old_start_at = NULL;
 again_one_more_time:
 	for (net = start_at; net != NULL; net = TAILQ_NEXT(net, sctp_next)) {
 		/* how much can we send? */
 		/* SCTPDBG("Examine for sending net:%x\n", (uint32_t)net); */
 		if (old_start_at && (old_start_at == net)) {
 			/* through list completely. */
 			break;
 		}
 		tsns_sent = 0xa;
 		if (TAILQ_EMPTY(&asoc->control_send_queue) &&
 		    TAILQ_EMPTY(&asoc->asconf_send_queue) &&
 		    (net->flight_size >= net->cwnd)) {
 			/*
 			 * Nothing on control or asconf and flight is full,
 			 * we can skip even in the CMT case.
 			 */
 			continue;
 		}
 		bundle_at = 0;
 		endoutchain = outchain = NULL;
 		auth = NULL;
 		auth_offset = 0;
 		no_fragmentflg = 1;
 		one_chunk = 0;
 		if (net->dest_state & SCTP_ADDR_UNCONFIRMED) {
 			skip_data_for_this_net = 1;
 		} else {
 			skip_data_for_this_net = 0;
 		}
 		switch (((struct sockaddr *)&net->ro._l_addr)->sa_family) {
 #ifdef INET
 		case AF_INET:
 			mtu = net->mtu - SCTP_MIN_V4_OVERHEAD;
 			break;
 #endif
 #ifdef INET6
 		case AF_INET6:
 			mtu = net->mtu - SCTP_MIN_OVERHEAD;
 			break;
 #endif
 		default:
 			/* TSNH */
 			mtu = net->mtu;
 			break;
 		}
 		mx_mtu = mtu;
 		to_out = 0;
 		if (mtu > asoc->peers_rwnd) {
 			if (asoc->total_flight > 0) {
 				/* We have a packet in flight somewhere */
 				r_mtu = asoc->peers_rwnd;
 			} else {
 				/* We are always allowed to send one MTU out */
 				one_chunk = 1;
 				r_mtu = mtu;
 			}
 		} else {
 			r_mtu = mtu;
 		}
 		error = 0;
 		/************************/
 		/* ASCONF transmission */
 		/************************/
 		/* Now first lets go through the asconf queue */
 		TAILQ_FOREACH_SAFE(chk, &asoc->asconf_send_queue, sctp_next, nchk) {
 			if (chk->rec.chunk_id.id != SCTP_ASCONF) {
 				continue;
 			}
 			if (chk->whoTo == NULL) {
 				if (asoc->alternate == NULL) {
 					if (asoc->primary_destination != net) {
 						break;
 					}
 				} else {
 					if (asoc->alternate != net) {
 						break;
 					}
 				}
 			} else {
 				if (chk->whoTo != net) {
 					break;
 				}
 			}
 			if (chk->data == NULL) {
 				break;
 			}
 			if (chk->sent != SCTP_DATAGRAM_UNSENT &&
 			    chk->sent != SCTP_DATAGRAM_RESEND) {
 				break;
 			}
 			/*
 			 * if no AUTH is yet included and this chunk
 			 * requires it, make sure to account for it.  We
 			 * don't apply the size until the AUTH chunk is
 			 * actually added below in case there is no room for
 			 * this chunk. NOTE: we overload the use of "omtu"
 			 * here
 			 */
 			if ((auth == NULL) &&
 			    sctp_auth_is_required_chunk(chk->rec.chunk_id.id,
 			    stcb->asoc.peer_auth_chunks)) {
 				omtu = sctp_get_auth_chunk_len(stcb->asoc.peer_hmac_id);
 			} else
 				omtu = 0;
 			/* Here we do NOT factor the r_mtu */
 			if ((chk->send_size < (int)(mtu - omtu)) ||
 			    (chk->flags & CHUNK_FLAGS_FRAGMENT_OK)) {
 				/*
 				 * We probably should glom the mbuf chain
 				 * from the chk->data for control but the
 				 * problem is it becomes yet one more level
 				 * of tracking to do if for some reason
 				 * output fails. Then I have got to
 				 * reconstruct the merged control chain.. el
 				 * yucko.. for now we take the easy way and
 				 * do the copy
 				 */
 				/*
 				 * Add an AUTH chunk, if chunk requires it
 				 * save the offset into the chain for AUTH
 				 */
 				if ((auth == NULL) &&
 				    (sctp_auth_is_required_chunk(chk->rec.chunk_id.id,
 				    stcb->asoc.peer_auth_chunks))) {
 					outchain = sctp_add_auth_chunk(outchain,
 					    &endoutchain,
 					    &auth,
 					    &auth_offset,
 					    stcb,
 					    chk->rec.chunk_id.id);
 					SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 				}
 				outchain = sctp_copy_mbufchain(chk->data, outchain, &endoutchain,
 				    (int)chk->rec.chunk_id.can_take_data,
 				    chk->send_size, chk->copy_by_ref);
 				if (outchain == NULL) {
 					*reason_code = 8;
 					SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 					return (ENOMEM);
 				}
 				SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 				/* update our MTU size */
 				if (mtu > (chk->send_size + omtu))
 					mtu -= (chk->send_size + omtu);
 				else
 					mtu = 0;
 				to_out += (chk->send_size + omtu);
 				/* Do clear IP_DF ? */
 				if (chk->flags & CHUNK_FLAGS_FRAGMENT_OK) {
 					no_fragmentflg = 0;
 				}
 				if (chk->rec.chunk_id.can_take_data)
 					chk->data = NULL;
 				/*
 				 * set hb flag since we can use these for
 				 * RTO
 				 */
 				hbflag = 1;
 				asconf = 1;
 				/*
 				 * should sysctl this: don't bundle data
 				 * with ASCONF since it requires AUTH
 				 */
 				no_data_chunks = 1;
 				chk->sent = SCTP_DATAGRAM_SENT;
 				if (chk->whoTo == NULL) {
 					chk->whoTo = net;
 					atomic_add_int(&net->ref_count, 1);
 				}
 				chk->snd_count++;
 				if (mtu == 0) {
 					/*
 					 * Ok we are out of room but we can
 					 * output without effecting the
 					 * flight size since this little guy
 					 * is a control only packet.
 					 */
 					sctp_timer_start(SCTP_TIMER_TYPE_ASCONF, inp, stcb, net);
 					/*
 					 * do NOT clear the asconf flag as
 					 * it is used to do appropriate
 					 * source address selection.
 					 */
 					if (*now_filled == 0) {
 						(void)SCTP_GETTIME_TIMEVAL(now);
 						*now_filled = 1;
 					}
 					net->last_sent_time = *now;
 					hbflag = 0;
 					if ((error = sctp_lowlevel_chunk_output(inp, stcb, net,
 					    (struct sockaddr *)&net->ro._l_addr,
 					    outchain, auth_offset, auth,
 					    stcb->asoc.authinfo.active_keyid,
 					    no_fragmentflg, 0, asconf,
 					    inp->sctp_lport, stcb->rport,
 					    htonl(stcb->asoc.peer_vtag),
 					    net->port, NULL,
 					    0, 0,
 					    false, so_locked))) {
 						/*
 						 * error, we could not
 						 * output
 						 */
 						SCTPDBG(SCTP_DEBUG_OUTPUT3, "Gak send error %d\n", error);
 						if (from_where == 0) {
 							SCTP_STAT_INCR(sctps_lowlevelerrusr);
 						}
 						if (error == ENOBUFS) {
 							asoc->ifp_had_enobuf = 1;
 							SCTP_STAT_INCR(sctps_lowlevelerr);
 						}
 						/* error, could not output */
 						if (error == EHOSTUNREACH) {
 							/*
 							 * Destination went
 							 * unreachable
 							 * during this send
 							 */
 							sctp_move_chunks_from_net(stcb, net);
 						}
 						asconf = 0;
 						*reason_code = 7;
 						break;
 					} else {
 						asoc->ifp_had_enobuf = 0;
 					}
 					/*
 					 * increase the number we sent, if a
 					 * cookie is sent we don't tell them
 					 * any was sent out.
 					 */
 					outchain = endoutchain = NULL;
 					auth = NULL;
 					auth_offset = 0;
 					asconf = 0;
 					if (!no_out_cnt)
 						*num_out += ctl_cnt;
 					/* recalc a clean slate and setup */
 					switch (net->ro._l_addr.sa.sa_family) {
 #ifdef INET
 					case AF_INET:
 						mtu = net->mtu - SCTP_MIN_V4_OVERHEAD;
 						break;
 #endif
 #ifdef INET6
 					case AF_INET6:
 						mtu = net->mtu - SCTP_MIN_OVERHEAD;
 						break;
 #endif
 					default:
 						/* TSNH */
 						mtu = net->mtu;
 						break;
 					}
 					to_out = 0;
 					no_fragmentflg = 1;
 				}
 			}
 		}
 		if (error != 0) {
 			/* try next net */
 			continue;
 		}
 		/************************/
 		/* Control transmission */
 		/************************/
 		/* Now first lets go through the control queue */
 		TAILQ_FOREACH_SAFE(chk, &asoc->control_send_queue, sctp_next, nchk) {
 			if ((sack_goes_to) &&
 			    (chk->rec.chunk_id.id == SCTP_ECN_ECHO) &&
 			    (chk->whoTo != sack_goes_to)) {
 				/*
 				 * if we have a sack in queue, and we are
 				 * looking at an ecn echo that is NOT queued
 				 * to where the sack is going..
 				 */
 				if (chk->whoTo == net) {
 					/*
 					 * Don't transmit it to where its
 					 * going (current net)
 					 */
 					continue;
 				} else if (sack_goes_to == net) {
 					/*
 					 * But do transmit it to this
 					 * address
 					 */
 					goto skip_net_check;
 				}
 			}
 			if (chk->whoTo == NULL) {
 				if (asoc->alternate == NULL) {
 					if (asoc->primary_destination != net) {
 						continue;
 					}
 				} else {
 					if (asoc->alternate != net) {
 						continue;
 					}
 				}
 			} else {
 				if (chk->whoTo != net) {
 					continue;
 				}
 			}
 	skip_net_check:
 			if (chk->data == NULL) {
 				continue;
 			}
 			if (chk->sent != SCTP_DATAGRAM_UNSENT) {
 				/*
 				 * It must be unsent. Cookies and ASCONF's
 				 * hang around but there timers will force
 				 * when marked for resend.
 				 */
 				continue;
 			}
 			/*
 			 * if no AUTH is yet included and this chunk
 			 * requires it, make sure to account for it.  We
 			 * don't apply the size until the AUTH chunk is
 			 * actually added below in case there is no room for
 			 * this chunk. NOTE: we overload the use of "omtu"
 			 * here
 			 */
 			if ((auth == NULL) &&
 			    sctp_auth_is_required_chunk(chk->rec.chunk_id.id,
 			    stcb->asoc.peer_auth_chunks)) {
 				omtu = sctp_get_auth_chunk_len(stcb->asoc.peer_hmac_id);
 			} else
 				omtu = 0;
 			/* Here we do NOT factor the r_mtu */
 			if ((chk->send_size <= (int)(mtu - omtu)) ||
 			    (chk->flags & CHUNK_FLAGS_FRAGMENT_OK)) {
 				/*
 				 * We probably should glom the mbuf chain
 				 * from the chk->data for control but the
 				 * problem is it becomes yet one more level
 				 * of tracking to do if for some reason
 				 * output fails. Then I have got to
 				 * reconstruct the merged control chain.. el
 				 * yucko.. for now we take the easy way and
 				 * do the copy
 				 */
 				/*
 				 * Add an AUTH chunk, if chunk requires it
 				 * save the offset into the chain for AUTH
 				 */
 				if ((auth == NULL) &&
 				    (sctp_auth_is_required_chunk(chk->rec.chunk_id.id,
 				    stcb->asoc.peer_auth_chunks))) {
 					outchain = sctp_add_auth_chunk(outchain,
 					    &endoutchain,
 					    &auth,
 					    &auth_offset,
 					    stcb,
 					    chk->rec.chunk_id.id);
 					SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 				}
 				outchain = sctp_copy_mbufchain(chk->data, outchain, &endoutchain,
 				    (int)chk->rec.chunk_id.can_take_data,
 				    chk->send_size, chk->copy_by_ref);
 				if (outchain == NULL) {
 					*reason_code = 8;
 					SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 					return (ENOMEM);
 				}
 				SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 				/* update our MTU size */
 				if (mtu > (chk->send_size + omtu))
 					mtu -= (chk->send_size + omtu);
 				else
 					mtu = 0;
 				to_out += (chk->send_size + omtu);
 				/* Do clear IP_DF ? */
 				if (chk->flags & CHUNK_FLAGS_FRAGMENT_OK) {
 					no_fragmentflg = 0;
 				}
 				if (chk->rec.chunk_id.can_take_data)
 					chk->data = NULL;
 				/* Mark things to be removed, if needed */
 				if ((chk->rec.chunk_id.id == SCTP_SELECTIVE_ACK) ||
 				    (chk->rec.chunk_id.id == SCTP_NR_SELECTIVE_ACK) ||	/* EY */
 				    (chk->rec.chunk_id.id == SCTP_HEARTBEAT_REQUEST) ||
 				    (chk->rec.chunk_id.id == SCTP_HEARTBEAT_ACK) ||
 				    (chk->rec.chunk_id.id == SCTP_SHUTDOWN) ||
 				    (chk->rec.chunk_id.id == SCTP_SHUTDOWN_ACK) ||
 				    (chk->rec.chunk_id.id == SCTP_OPERATION_ERROR) ||
 				    (chk->rec.chunk_id.id == SCTP_COOKIE_ACK) ||
 				    (chk->rec.chunk_id.id == SCTP_ECN_CWR) ||
 				    (chk->rec.chunk_id.id == SCTP_PACKET_DROPPED) ||
 				    (chk->rec.chunk_id.id == SCTP_ASCONF_ACK)) {
 					if (chk->rec.chunk_id.id == SCTP_HEARTBEAT_REQUEST) {
 						hbflag = 1;
 					}
 					/* remove these chunks at the end */
 					if ((chk->rec.chunk_id.id == SCTP_SELECTIVE_ACK) ||
 					    (chk->rec.chunk_id.id == SCTP_NR_SELECTIVE_ACK)) {
 						/* turn off the timer */
 						if (SCTP_OS_TIMER_PENDING(&stcb->asoc.dack_timer.timer)) {
 							sctp_timer_stop(SCTP_TIMER_TYPE_RECV,
 							    inp, stcb, NULL,
 							    SCTP_FROM_SCTP_OUTPUT + SCTP_LOC_1);
 						}
 					}
 					ctl_cnt++;
 				} else {
 					/*
 					 * Other chunks, since they have
 					 * timers running (i.e. COOKIE) we
 					 * just "trust" that it gets sent or
 					 * retransmitted.
 					 */
 					ctl_cnt++;
 					if (chk->rec.chunk_id.id == SCTP_COOKIE_ECHO) {
 						cookie = 1;
 						no_out_cnt = 1;
 					} else if (chk->rec.chunk_id.id == SCTP_ECN_ECHO) {
 						/*
 						 * Increment ecne send count
 						 * here this means we may be
 						 * over-zealous in our
 						 * counting if the send
 						 * fails, but its the best
 						 * place to do it (we used
 						 * to do it in the queue of
 						 * the chunk, but that did
 						 * not tell how many times
 						 * it was sent.
 						 */
 						SCTP_STAT_INCR(sctps_sendecne);
 					}
 					chk->sent = SCTP_DATAGRAM_SENT;
 					if (chk->whoTo == NULL) {
 						chk->whoTo = net;
 						atomic_add_int(&net->ref_count, 1);
 					}
 					chk->snd_count++;
 				}
 				if (mtu == 0) {
 					/*
 					 * Ok we are out of room but we can
 					 * output without effecting the
 					 * flight size since this little guy
 					 * is a control only packet.
 					 */
 					use_zero_crc = asoc->zero_checksum == 2;
 					if (asconf) {
 						sctp_timer_start(SCTP_TIMER_TYPE_ASCONF, inp, stcb, net);
 						use_zero_crc = false;
 						/*
 						 * do NOT clear the asconf
 						 * flag as it is used to do
 						 * appropriate source
 						 * address selection.
 						 */
 					}
 					if (cookie) {
 						sctp_timer_start(SCTP_TIMER_TYPE_COOKIE, inp, stcb, net);
 						use_zero_crc = false;
 						cookie = 0;
 					}
 					/* Only HB or ASCONF advances time */
 					if (hbflag) {
 						if (*now_filled == 0) {
 							(void)SCTP_GETTIME_TIMEVAL(now);
 							*now_filled = 1;
 						}
 						net->last_sent_time = *now;
 						hbflag = 0;
 					}
 					if ((error = sctp_lowlevel_chunk_output(inp, stcb, net,
 					    (struct sockaddr *)&net->ro._l_addr,
 					    outchain,
 					    auth_offset, auth,
 					    stcb->asoc.authinfo.active_keyid,
 					    no_fragmentflg, 0, asconf,
 					    inp->sctp_lport, stcb->rport,
 					    htonl(stcb->asoc.peer_vtag),
 					    net->port, NULL,
 					    0, 0,
 					    use_zero_crc, so_locked))) {
 						/*
 						 * error, we could not
 						 * output
 						 */
 						SCTPDBG(SCTP_DEBUG_OUTPUT3, "Gak send error %d\n", error);
 						if (from_where == 0) {
 							SCTP_STAT_INCR(sctps_lowlevelerrusr);
 						}
 						if (error == ENOBUFS) {
 							asoc->ifp_had_enobuf = 1;
 							SCTP_STAT_INCR(sctps_lowlevelerr);
 						}
 						if (error == EHOSTUNREACH) {
 							/*
 							 * Destination went
 							 * unreachable
 							 * during this send
 							 */
 							sctp_move_chunks_from_net(stcb, net);
 						}
 						asconf = 0;
 						*reason_code = 7;
 						break;
 					} else {
 						asoc->ifp_had_enobuf = 0;
 					}
 					/*
 					 * increase the number we sent, if a
 					 * cookie is sent we don't tell them
 					 * any was sent out.
 					 */
 					outchain = endoutchain = NULL;
 					auth = NULL;
 					auth_offset = 0;
 					asconf = 0;
 					if (!no_out_cnt)
 						*num_out += ctl_cnt;
 					/* recalc a clean slate and setup */
 					switch (net->ro._l_addr.sa.sa_family) {
 #ifdef INET
 					case AF_INET:
 						mtu = net->mtu - SCTP_MIN_V4_OVERHEAD;
 						break;
 #endif
 #ifdef INET6
 					case AF_INET6:
 						mtu = net->mtu - SCTP_MIN_OVERHEAD;
 						break;
 #endif
 					default:
 						/* TSNH */
 						mtu = net->mtu;
 						break;
 					}
 					to_out = 0;
 					no_fragmentflg = 1;
 				}
 			}
 		}
 		if (error != 0) {
 			/* try next net */
 			continue;
 		}
 		/* JRI: if dest is in PF state, do not send data to it */
 		if ((asoc->sctp_cmt_on_off > 0) &&
 		    (net != stcb->asoc.alternate) &&
 		    (net->dest_state & SCTP_ADDR_PF)) {
 			goto no_data_fill;
 		}
 		if (net->flight_size >= net->cwnd) {
 			goto no_data_fill;
 		}
 		if ((asoc->sctp_cmt_on_off > 0) &&
 		    (SCTP_BASE_SYSCTL(sctp_buffer_splitting) & SCTP_RECV_BUFFER_SPLITTING) &&
 		    (net->flight_size > max_rwnd_per_dest)) {
 			goto no_data_fill;
 		}
 		/*
 		 * We need a specific accounting for the usage of the send
 		 * buffer. We also need to check the number of messages per
 		 * net. For now, this is better than nothing and it disabled
 		 * by default...
 		 */
 		if ((asoc->sctp_cmt_on_off > 0) &&
 		    (SCTP_BASE_SYSCTL(sctp_buffer_splitting) & SCTP_SEND_BUFFER_SPLITTING) &&
 		    (max_send_per_dest > 0) &&
 		    (net->flight_size > max_send_per_dest)) {
 			goto no_data_fill;
 		}
 		/*********************/
 		/* Data transmission */
 		/*********************/
 		/*
 		 * if AUTH for DATA is required and no AUTH has been added
 		 * yet, account for this in the mtu now... if no data can be
 		 * bundled, this adjustment won't matter anyways since the
 		 * packet will be going out...
 		 */
 		data_auth_reqd = sctp_auth_is_required_chunk(SCTP_DATA,
 		    stcb->asoc.peer_auth_chunks);
 		if (data_auth_reqd && (auth == NULL)) {
 			mtu -= sctp_get_auth_chunk_len(stcb->asoc.peer_hmac_id);
 		}
 		/* now lets add any data within the MTU constraints */
 		switch (((struct sockaddr *)&net->ro._l_addr)->sa_family) {
 #ifdef INET
 		case AF_INET:
 			if (net->mtu > SCTP_MIN_V4_OVERHEAD)
 				omtu = net->mtu - SCTP_MIN_V4_OVERHEAD;
 			else
 				omtu = 0;
 			break;
 #endif
 #ifdef INET6
 		case AF_INET6:
 			if (net->mtu > SCTP_MIN_OVERHEAD)
 				omtu = net->mtu - SCTP_MIN_OVERHEAD;
 			else
 				omtu = 0;
 			break;
 #endif
 		default:
 			/* TSNH */
 			omtu = 0;
 			break;
 		}
 		if ((((SCTP_GET_STATE(stcb) == SCTP_STATE_OPEN) ||
 		    (SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_RECEIVED)) &&
 		    (skip_data_for_this_net == 0)) ||
 		    (cookie)) {
 			TAILQ_FOREACH_SAFE(chk, &asoc->send_queue, sctp_next, nchk) {
 				if (no_data_chunks) {
 					/* let only control go out */
 					*reason_code = 1;
 					break;
 				}
 				if (net->flight_size >= net->cwnd) {
 					/* skip this net, no room for data */
 					*reason_code = 2;
 					break;
 				}
 				if ((chk->whoTo != NULL) &&
 				    (chk->whoTo != net)) {
 					/* Don't send the chunk on this net */
 					continue;
 				}
 
 				if (asoc->sctp_cmt_on_off == 0) {
 					if ((asoc->alternate) &&
 					    (asoc->alternate != net) &&
 					    (chk->whoTo == NULL)) {
 						continue;
 					} else if ((net != asoc->primary_destination) &&
 						    (asoc->alternate == NULL) &&
 					    (chk->whoTo == NULL)) {
 						continue;
 					}
 				}
 				if ((chk->send_size > omtu) && ((chk->flags & CHUNK_FLAGS_FRAGMENT_OK) == 0)) {
 					/*-
 					 * strange, we have a chunk that is
 					 * to big for its destination and
 					 * yet no fragment ok flag.
 					 * Something went wrong when the
 					 * PMTU changed...we did not mark
 					 * this chunk for some reason?? I
 					 * will fix it here by letting IP
 					 * fragment it for now and printing
 					 * a warning. This really should not
 					 * happen ...
 					 */
 					SCTP_PRINTF("Warning chunk of %d bytes > mtu:%d and yet PMTU disc missed\n",
 					    chk->send_size, mtu);
 					chk->flags |= CHUNK_FLAGS_FRAGMENT_OK;
 				}
 				if (SCTP_BASE_SYSCTL(sctp_enable_sack_immediately) &&
 				    (asoc->state & SCTP_STATE_SHUTDOWN_PENDING)) {
 					struct sctp_data_chunk *dchkh;
 
 					dchkh = mtod(chk->data, struct sctp_data_chunk *);
 					dchkh->ch.chunk_flags |= SCTP_DATA_SACK_IMMEDIATELY;
 				}
 				if (((chk->send_size <= mtu) && (chk->send_size <= r_mtu)) ||
 				    ((chk->flags & CHUNK_FLAGS_FRAGMENT_OK) && (chk->send_size <= asoc->peers_rwnd))) {
 					/* ok we will add this one */
 
 					/*
 					 * Add an AUTH chunk, if chunk
 					 * requires it, save the offset into
 					 * the chain for AUTH
 					 */
 					if (data_auth_reqd) {
 						if (auth == NULL) {
 							outchain = sctp_add_auth_chunk(outchain,
 							    &endoutchain,
 							    &auth,
 							    &auth_offset,
 							    stcb,
 							    SCTP_DATA);
 							auth_keyid = chk->auth_keyid;
 							override_ok = 0;
 							SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 						} else if (override_ok) {
 							/*
 							 * use this data's
 							 * keyid
 							 */
 							auth_keyid = chk->auth_keyid;
 							override_ok = 0;
 						} else if (auth_keyid != chk->auth_keyid) {
 							/*
 							 * different keyid,
 							 * so done bundling
 							 */
 							break;
 						}
 					}
 					outchain = sctp_copy_mbufchain(chk->data, outchain, &endoutchain, 0,
 					    chk->send_size, chk->copy_by_ref);
 					if (outchain == NULL) {
 						SCTPDBG(SCTP_DEBUG_OUTPUT3, "No memory?\n");
 						if (!SCTP_OS_TIMER_PENDING(&net->rxt_timer.timer)) {
 							sctp_timer_start(SCTP_TIMER_TYPE_SEND, inp, stcb, net);
 						}
 						*reason_code = 3;
 						SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 						return (ENOMEM);
 					}
 					/* update our MTU size */
 					/* Do clear IP_DF ? */
 					if (chk->flags & CHUNK_FLAGS_FRAGMENT_OK) {
 						no_fragmentflg = 0;
 					}
 					/* unsigned subtraction of mtu */
 					if (mtu > chk->send_size)
 						mtu -= chk->send_size;
 					else
 						mtu = 0;
 					/* unsigned subtraction of r_mtu */
 					if (r_mtu > chk->send_size)
 						r_mtu -= chk->send_size;
 					else
 						r_mtu = 0;
 
 					to_out += chk->send_size;
 					if ((to_out > mx_mtu) && no_fragmentflg) {
 #ifdef INVARIANTS
 						panic("Exceeding mtu of %d out size is %d", mx_mtu, to_out);
 #else
 						SCTP_PRINTF("Exceeding mtu of %d out size is %d\n",
 						    mx_mtu, to_out);
 #endif
 					}
 					chk->window_probe = 0;
 					data_list[bundle_at++] = chk;
 					if (bundle_at >= SCTP_MAX_DATA_BUNDLING) {
 						break;
 					}
 					if (chk->sent == SCTP_DATAGRAM_UNSENT) {
 						if ((chk->rec.data.rcv_flags & SCTP_DATA_UNORDERED) == 0) {
 							SCTP_STAT_INCR_COUNTER64(sctps_outorderchunks);
 						} else {
 							SCTP_STAT_INCR_COUNTER64(sctps_outunorderchunks);
 						}
 						if (((chk->rec.data.rcv_flags & SCTP_DATA_LAST_FRAG) == SCTP_DATA_LAST_FRAG) &&
 						    ((chk->rec.data.rcv_flags & SCTP_DATA_FIRST_FRAG) == 0))
 							/*
 							 * Count number of
 							 * user msg's that
 							 * were fragmented
 							 * we do this by
 							 * counting when we
 							 * see a LAST
 							 * fragment only.
 							 */
 							SCTP_STAT_INCR_COUNTER64(sctps_fragusrmsgs);
 					}
 					if ((mtu == 0) || (r_mtu == 0) || (one_chunk)) {
 						if ((one_chunk) && (stcb->asoc.total_flight == 0)) {
 							data_list[0]->window_probe = 1;
 							net->window_probe = 1;
 						}
 						break;
 					}
 				} else {
 					/*
 					 * Must be sent in order of the
 					 * TSN's (on a network)
 					 */
 					break;
 				}
 			}	/* for (chunk gather loop for this net) */
 		}		/* if asoc.state OPEN */
 no_data_fill:
 		/* Is there something to send for this destination? */
 		if (outchain) {
 			/* We may need to start a control timer or two */
 			use_zero_crc = asoc->zero_checksum == 2;
 			if (asconf) {
 				sctp_timer_start(SCTP_TIMER_TYPE_ASCONF, inp,
 				    stcb, net);
 				use_zero_crc = false;
 				/*
 				 * do NOT clear the asconf flag as it is
 				 * used to do appropriate source address
 				 * selection.
 				 */
 			}
 			if (cookie) {
 				sctp_timer_start(SCTP_TIMER_TYPE_COOKIE, inp, stcb, net);
 				use_zero_crc = false;
 				cookie = 0;
 			}
 			/* must start a send timer if data is being sent */
 			if (bundle_at && (!SCTP_OS_TIMER_PENDING(&net->rxt_timer.timer))) {
 				/*
 				 * no timer running on this destination
 				 * restart it.
 				 */
 				sctp_timer_start(SCTP_TIMER_TYPE_SEND, inp, stcb, net);
 			}
 			if (bundle_at || hbflag) {
 				/* For data/asconf and hb set time */
 				if (*now_filled == 0) {
 					(void)SCTP_GETTIME_TIMEVAL(now);
 					*now_filled = 1;
 				}
 				net->last_sent_time = *now;
 			}
 			/* Now send it, if there is anything to send :> */
 			if ((error = sctp_lowlevel_chunk_output(inp,
 			    stcb,
 			    net,
 			    (struct sockaddr *)&net->ro._l_addr,
 			    outchain,
 			    auth_offset,
 			    auth,
 			    auth_keyid,
 			    no_fragmentflg,
 			    bundle_at,
 			    asconf,
 			    inp->sctp_lport, stcb->rport,
 			    htonl(stcb->asoc.peer_vtag),
 			    net->port, NULL,
 			    0, 0,
 			    use_zero_crc,
 			    so_locked))) {
 				/* error, we could not output */
 				SCTPDBG(SCTP_DEBUG_OUTPUT3, "Gak send error %d\n", error);
 				if (from_where == 0) {
 					SCTP_STAT_INCR(sctps_lowlevelerrusr);
 				}
 				if (error == ENOBUFS) {
 					asoc->ifp_had_enobuf = 1;
 					SCTP_STAT_INCR(sctps_lowlevelerr);
 				}
 				if (error == EHOSTUNREACH) {
 					/*
 					 * Destination went unreachable
 					 * during this send
 					 */
 					sctp_move_chunks_from_net(stcb, net);
 				}
 				asconf = 0;
 				*reason_code = 6;
 				/*-
 				 * I add this line to be paranoid. As far as
 				 * I can tell the continue, takes us back to
 				 * the top of the for, but just to make sure
 				 * I will reset these again here.
 				 */
 				ctl_cnt = 0;
 				continue;	/* This takes us back to the
 						 * for() for the nets. */
 			} else {
 				asoc->ifp_had_enobuf = 0;
 			}
 			endoutchain = NULL;
 			auth = NULL;
 			auth_offset = 0;
 			asconf = 0;
 			if (!no_out_cnt) {
 				*num_out += (ctl_cnt + bundle_at);
 			}
 			if (bundle_at) {
 				/* setup for a RTO measurement */
 				tsns_sent = data_list[0]->rec.data.tsn;
 				/* fill time if not already filled */
 				if (*now_filled == 0) {
 					(void)SCTP_GETTIME_TIMEVAL(&asoc->time_last_sent);
 					*now_filled = 1;
 					*now = asoc->time_last_sent;
 				} else {
 					asoc->time_last_sent = *now;
 				}
 				if (net->rto_needed) {
 					data_list[0]->do_rtt = 1;
 					net->rto_needed = 0;
 				}
 				SCTP_STAT_INCR_BY(sctps_senddata, bundle_at);
 				sctp_clean_up_datalist(stcb, asoc, data_list, bundle_at, net);
 			}
 			if (one_chunk) {
 				break;
 			}
 		}
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 			sctp_log_cwnd(stcb, net, tsns_sent, SCTP_CWND_LOG_FROM_SEND);
 		}
 	}
 	if (old_start_at == NULL) {
 		old_start_at = start_at;
 		start_at = TAILQ_FIRST(&asoc->nets);
 		if (old_start_at)
 			goto again_one_more_time;
 	}
 
 	/*
 	 * At the end there should be no NON timed chunks hanging on this
 	 * queue.
 	 */
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 		sctp_log_cwnd(stcb, net, *num_out, SCTP_CWND_LOG_FROM_SEND);
 	}
 	if ((*num_out == 0) && (*reason_code == 0)) {
 		*reason_code = 4;
 	} else {
 		*reason_code = 5;
 	}
 	sctp_clean_up_ctl(stcb, asoc, so_locked);
 	return (0);
 }
 
 void
 sctp_queue_op_err(struct sctp_tcb *stcb, struct mbuf *op_err)
 {
 	/*-
 	 * Prepend a OPERATIONAL_ERROR chunk header and put on the end of
 	 * the control chunk queue.
 	 */
 	struct sctp_chunkhdr *hdr;
 	struct sctp_tmit_chunk *chk;
 	struct mbuf *mat, *last_mbuf;
 	uint32_t chunk_length;
 	uint16_t padding_length;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	SCTP_BUF_PREPEND(op_err, sizeof(struct sctp_chunkhdr), M_NOWAIT);
 	if (op_err == NULL) {
 		return;
 	}
 	last_mbuf = NULL;
 	chunk_length = 0;
 	for (mat = op_err; mat != NULL; mat = SCTP_BUF_NEXT(mat)) {
 		chunk_length += SCTP_BUF_LEN(mat);
 		if (SCTP_BUF_NEXT(mat) == NULL) {
 			last_mbuf = mat;
 		}
 	}
 	if (chunk_length > SCTP_MAX_CHUNK_LENGTH) {
 		sctp_m_freem(op_err);
 		return;
 	}
 	padding_length = chunk_length % 4;
 	if (padding_length != 0) {
 		padding_length = 4 - padding_length;
 	}
 	if (padding_length != 0) {
 		if (sctp_add_pad_tombuf(last_mbuf, padding_length) == NULL) {
 			sctp_m_freem(op_err);
 			return;
 		}
 	}
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		/* no memory */
 		sctp_m_freem(op_err);
 		return;
 	}
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_OPERATION_ERROR;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->flags = 0;
 	chk->send_size = (uint16_t)chunk_length;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	chk->asoc = &stcb->asoc;
 	chk->data = op_err;
 	chk->whoTo = NULL;
 	hdr = mtod(op_err, struct sctp_chunkhdr *);
 	hdr->chunk_type = SCTP_OPERATION_ERROR;
 	hdr->chunk_flags = 0;
 	hdr->chunk_length = htons(chk->send_size);
 	TAILQ_INSERT_TAIL(&chk->asoc->control_send_queue, chk, sctp_next);
 	chk->asoc->ctrl_queue_cnt++;
 }
 
 int
 sctp_send_cookie_echo(struct mbuf *m,
     int offset, int limit,
     struct sctp_tcb *stcb,
     struct sctp_nets *net)
 {
 	/*-
 	 * Pull the STATE-COOKIE parameter out of m, relabel the copy as a
 	 * COOKIE-ECHO chunk and put it at the FRONT of the control chunk
 	 * queue, addressed to net. The parameter walk starts
 	 * sizeof(struct sctp_init_chunk) bytes past offset.
 	 *
 	 * Returns 0 on success, or a negative code:
 	 *   -2  the cookie could not be copied (no memory)
 	 *   -3  no further parameter could be fetched before a cookie was
 	 *       found
 	 *   -5  no transmit chunk could be allocated
 	 *   -6  a parameter length is smaller than the parameter header
 	 *   -7  the cookie would extend past limit
 	 *   -8  the copied cookie could not be padded to a multiple of 4
 	 * The copied cookie is freed on every failure that occurs after the
 	 * copy was made.
 	 */
 	int at;
 	struct mbuf *cookie;
 	struct sctp_paramhdr param, *phdr;
 	struct sctp_chunkhdr *hdr;
 	struct sctp_tmit_chunk *chk;
 	uint16_t ptype, plen;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	/* First find the cookie in the param area */
 	cookie = NULL;
 	at = offset + sizeof(struct sctp_init_chunk);
 	for (;;) {
 		phdr = sctp_get_next_param(m, at, &param, sizeof(param));
 		if (phdr == NULL) {
 			return (-3);
 		}
 		ptype = ntohs(phdr->param_type);
 		plen = ntohs(phdr->param_length);
 		if (plen < sizeof(struct sctp_paramhdr)) {
 			return (-6);
 		}
 		if (ptype == SCTP_STATE_COOKIE) {
 			int pad;
 
 			/* found the cookie */
 			if (at + plen > limit) {
 				return (-7);
 			}
 			cookie = SCTP_M_COPYM(m, at, plen, M_NOWAIT);
 			if (cookie == NULL) {
 				/* No memory */
 				return (-2);
 			}
 			if ((pad = (plen % 4)) > 0) {
 				pad = 4 - pad;
 			}
 			if (pad > 0) {
 				if (sctp_pad_lastmbuf(cookie, pad, NULL) == NULL) {
 					/*
 					 * The copy belongs to us and nobody
 					 * else references it yet, so release
 					 * it here instead of leaking it.
 					 */
 					sctp_m_freem(cookie);
 					return (-8);
 				}
 			}
 #ifdef SCTP_MBUF_LOGGING
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 				sctp_log_mbc(cookie, SCTP_MBUF_ICOPY);
 			}
 #endif
 			break;
 		}
 		/* Not the cookie: step over this parameter (4-byte aligned). */
 		at += SCTP_SIZE32(plen);
 	}
 	/* ok, we got the cookie lets change it into a cookie echo chunk */
 	/* first the change from param to cookie */
 	hdr = mtod(cookie, struct sctp_chunkhdr *);
 	hdr->chunk_type = SCTP_COOKIE_ECHO;
 	hdr->chunk_flags = 0;
 	/* get the chunk stuff now and place it in the FRONT of the queue */
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		/* no memory */
 		sctp_m_freem(cookie);
 		return (-5);
 	}
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_COOKIE_ECHO;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->flags = CHUNK_FLAGS_FRAGMENT_OK;
 	/* send_size includes the padding added above */
 	chk->send_size = SCTP_SIZE32(plen);
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	chk->asoc = &stcb->asoc;
 	chk->data = cookie;
 	chk->whoTo = net;
 	/* the queued chunk holds a reference on its destination */
 	atomic_add_int(&chk->whoTo->ref_count, 1);
 	TAILQ_INSERT_HEAD(&chk->asoc->control_send_queue, chk, sctp_next);
 	chk->asoc->ctrl_queue_cnt++;
 	return (0);
 }
 
 void
 sctp_send_heartbeat_ack(struct sctp_tcb *stcb,
     struct mbuf *m,
     int offset,
     int chk_length,
     struct sctp_nets *net)
 {
 	/*
 	 * Take a HB request and make it into a HB ack: copy chk_length
 	 * bytes of m starting at offset, relabel the copy as a
 	 * HEARTBEAT-ACK, pad it to a multiple of 4 bytes and append it to
 	 * the control chunk queue addressed to net. Nothing is queued when
 	 * net is NULL or when any allocation or the padding fails.
 	 */
 	struct mbuf *outchain;
 	struct sctp_chunkhdr *chdr;
 	struct sctp_tmit_chunk *chk;
 
 	if (net == NULL) {
 		/* must have a net pointer */
 		return;
 	}
 
 	outchain = SCTP_M_COPYM(m, offset, chk_length, M_NOWAIT);
 	if (outchain == NULL) {
 		/* gak out of memory */
 		return;
 	}
 #ifdef SCTP_MBUF_LOGGING
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 		sctp_log_mbc(outchain, SCTP_MBUF_ICOPY);
 	}
 #endif
 	chdr = mtod(outchain, struct sctp_chunkhdr *);
 	chdr->chunk_type = SCTP_HEARTBEAT_ACK;
 	chdr->chunk_flags = 0;
 	if (chk_length % 4 != 0) {
 		if (sctp_pad_lastmbuf(outchain, 4 - (chk_length % 4), NULL) == NULL) {
 			/*
 			 * Could not pad: do not queue a chunk whose length
 			 * is not a multiple of 4, drop the ack instead.
 			 */
 			sctp_m_freem(outchain);
 			return;
 		}
 	}
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		/* no memory */
 		sctp_m_freem(outchain);
 		return;
 	}
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_HEARTBEAT_ACK;
 	chk->rec.chunk_id.can_take_data = 1;
 	chk->flags = 0;
 	/* send_size is the chunk length as passed in, without the padding */
 	chk->send_size = chk_length;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	chk->asoc = &stcb->asoc;
 	chk->data = outchain;
 	chk->whoTo = net;
 	/* the queued chunk holds a reference on its destination */
 	atomic_add_int(&chk->whoTo->ref_count, 1);
 	TAILQ_INSERT_TAIL(&chk->asoc->control_send_queue, chk, sctp_next);
 	chk->asoc->ctrl_queue_cnt++;
 }
 
 void
 sctp_send_cookie_ack(struct sctp_tcb *stcb)
 {
 	/*
 	 * Build a COOKIE-ACK (a bare chunk header) and append it to the
 	 * control chunk queue. Returns silently if the mbuf or the transmit
 	 * chunk cannot be allocated.
 	 */
 	struct sctp_tmit_chunk *chk;
 	struct sctp_chunkhdr *hdr;
 	struct mbuf *cookie_ack;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 
 	cookie_ack = sctp_get_mbuf_for_msg(sizeof(struct sctp_chunkhdr), 0, M_NOWAIT, 1, MT_HEADER);
 	if (cookie_ack == NULL) {
 		/* no mbuf's */
 		return;
 	}
 	SCTP_BUF_RESV_UF(cookie_ack, SCTP_MIN_OVERHEAD);
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		/* no memory */
 		sctp_m_freem(cookie_ack);
 		return;
 	}
 	chk->asoc = &stcb->asoc;
 	chk->data = cookie_ack;
 	chk->rec.chunk_id.id = SCTP_COOKIE_ACK;
 	chk->rec.chunk_id.can_take_data = 1;
 	chk->copy_by_ref = 0;
 	chk->flags = 0;
 	chk->snd_count = 0;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->send_size = sizeof(struct sctp_chunkhdr);
 	/*
 	 * Address the ack to the net recorded in last_control_chunk_from
 	 * when there is one (taking a reference on it); otherwise leave the
 	 * destination unset.
 	 */
 	if (stcb->asoc.last_control_chunk_from == NULL) {
 		chk->whoTo = NULL;
 	} else {
 		chk->whoTo = stcb->asoc.last_control_chunk_from;
 		atomic_add_int(&chk->whoTo->ref_count, 1);
 	}
 	/* Write the chunk header and size the mbuf to match. */
 	hdr = mtod(cookie_ack, struct sctp_chunkhdr *);
 	hdr->chunk_type = SCTP_COOKIE_ACK;
 	hdr->chunk_flags = 0;
 	hdr->chunk_length = htons(chk->send_size);
 	SCTP_BUF_LEN(cookie_ack) = chk->send_size;
 	TAILQ_INSERT_TAIL(&stcb->asoc.control_send_queue, chk, sctp_next);
 	stcb->asoc.ctrl_queue_cnt++;
 }
 
 void
 sctp_send_shutdown_ack(struct sctp_tcb *stcb, struct sctp_nets *net)
 {
 	/* formulate and queue a SHUTDOWN-ACK back to the sender */
 	struct mbuf *m_shutdown_ack;
 	struct sctp_shutdown_ack_chunk *ack_cp;
 	struct sctp_tmit_chunk *chk;
 
 	m_shutdown_ack = sctp_get_mbuf_for_msg(sizeof(struct sctp_shutdown_ack_chunk), 0, M_NOWAIT, 1, MT_HEADER);
 	if (m_shutdown_ack == NULL) {
 		/* no mbuf's */
 		return;
 	}
 	SCTP_BUF_RESV_UF(m_shutdown_ack, SCTP_MIN_OVERHEAD);
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		/* no memory */
 		sctp_m_freem(m_shutdown_ack);
 		return;
 	}
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_SHUTDOWN_ACK;
 	chk->rec.chunk_id.can_take_data = 1;
 	chk->flags = 0;
 	chk->send_size = sizeof(struct sctp_chunkhdr);
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	chk->asoc = &stcb->asoc;
 	chk->data = m_shutdown_ack;
 	chk->whoTo = net;
 	if (chk->whoTo) {
 		atomic_add_int(&chk->whoTo->ref_count, 1);
 	}
 	ack_cp = mtod(m_shutdown_ack, struct sctp_shutdown_ack_chunk *);
 	ack_cp->ch.chunk_type = SCTP_SHUTDOWN_ACK;
 	ack_cp->ch.chunk_flags = 0;
 	ack_cp->ch.chunk_length = htons(chk->send_size);
 	SCTP_BUF_LEN(m_shutdown_ack) = chk->send_size;
 	TAILQ_INSERT_TAIL(&chk->asoc->control_send_queue, chk, sctp_next);
 	chk->asoc->ctrl_queue_cnt++;
 	return;
 }
 
 void
 sctp_send_shutdown(struct sctp_tcb *stcb, struct sctp_nets *net)
 {
 	/* formulate and queue a SHUTDOWN to the sender */
 	struct mbuf *m_shutdown;
 	struct sctp_shutdown_chunk *shutdown_cp;
 	struct sctp_tmit_chunk *chk;
 
 	TAILQ_FOREACH(chk, &stcb->asoc.control_send_queue, sctp_next) {
 		if (chk->rec.chunk_id.id == SCTP_SHUTDOWN) {
 			/* We already have a SHUTDOWN queued. Reuse it. */
 			if (chk->whoTo) {
 				sctp_free_remote_addr(chk->whoTo);
 				chk->whoTo = NULL;
 			}
 			break;
 		}
 	}
 	if (chk == NULL) {
 		m_shutdown = sctp_get_mbuf_for_msg(sizeof(struct sctp_shutdown_chunk), 0, M_NOWAIT, 1, MT_HEADER);
 		if (m_shutdown == NULL) {
 			/* no mbuf's */
 			return;
 		}
 		SCTP_BUF_RESV_UF(m_shutdown, SCTP_MIN_OVERHEAD);
 		sctp_alloc_a_chunk(stcb, chk);
 		if (chk == NULL) {
 			/* no memory */
 			sctp_m_freem(m_shutdown);
 			return;
 		}
 		chk->copy_by_ref = 0;
 		chk->rec.chunk_id.id = SCTP_SHUTDOWN;
 		chk->rec.chunk_id.can_take_data = 1;
 		chk->flags = 0;
 		chk->send_size = sizeof(struct sctp_shutdown_chunk);
 		chk->sent = SCTP_DATAGRAM_UNSENT;
 		chk->snd_count = 0;
 		chk->asoc = &stcb->asoc;
 		chk->data = m_shutdown;
 		chk->whoTo = net;
 		if (chk->whoTo) {
 			atomic_add_int(&chk->whoTo->ref_count, 1);
 		}
 		shutdown_cp = mtod(m_shutdown, struct sctp_shutdown_chunk *);
 		shutdown_cp->ch.chunk_type = SCTP_SHUTDOWN;
 		shutdown_cp->ch.chunk_flags = 0;
 		shutdown_cp->ch.chunk_length = htons(chk->send_size);
 		shutdown_cp->cumulative_tsn_ack = htonl(stcb->asoc.cumulative_tsn);
 		SCTP_BUF_LEN(m_shutdown) = chk->send_size;
 		TAILQ_INSERT_TAIL(&chk->asoc->control_send_queue, chk, sctp_next);
 		chk->asoc->ctrl_queue_cnt++;
 	} else {
 		TAILQ_REMOVE(&stcb->asoc.control_send_queue, chk, sctp_next);
 		chk->whoTo = net;
 		if (chk->whoTo) {
 			atomic_add_int(&chk->whoTo->ref_count, 1);
 		}
 		shutdown_cp = mtod(chk->data, struct sctp_shutdown_chunk *);
 		shutdown_cp->cumulative_tsn_ack = htonl(stcb->asoc.cumulative_tsn);
 		TAILQ_INSERT_TAIL(&stcb->asoc.control_send_queue, chk, sctp_next);
 	}
 	return;
 }
 
 void
 sctp_send_asconf(struct sctp_tcb *stcb, struct sctp_nets *net, int addr_locked)
 {
 	/*
 	 * formulate and queue an ASCONF to the peer. ASCONF parameters
 	 * should be queued on the assoc queue.
 	 */
 	struct sctp_tmit_chunk *chk;
 	struct mbuf *m_asconf;
 	int len;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 
 	if ((!TAILQ_EMPTY(&stcb->asoc.asconf_send_queue)) &&
 	    (!sctp_is_feature_on(stcb->sctp_ep, SCTP_PCB_FLAGS_MULTIPLE_ASCONFS))) {
 		/* can't send a new one if there is one in flight already */
 		return;
 	}
 
 	/* compose an ASCONF chunk, maximum length is PMTU */
 	m_asconf = sctp_compose_asconf(stcb, &len, addr_locked);
 	if (m_asconf == NULL) {
 		return;
 	}
 
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		/* no memory */
 		sctp_m_freem(m_asconf);
 		return;
 	}
 
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_ASCONF;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->flags = CHUNK_FLAGS_FRAGMENT_OK;
 	chk->data = m_asconf;
 	chk->send_size = len;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	chk->asoc = &stcb->asoc;
 	chk->whoTo = net;
 	if (chk->whoTo) {
 		atomic_add_int(&chk->whoTo->ref_count, 1);
 	}
 	TAILQ_INSERT_TAIL(&chk->asoc->asconf_send_queue, chk, sctp_next);
 	chk->asoc->ctrl_queue_cnt++;
 	return;
 }
 
 void
 sctp_send_asconf_ack(struct sctp_tcb *stcb)
 {
 	/*
 	 * Queue copies of the cached ASCONF-ACKs on the control send queue.
 	 *
 	 * The destination is the net the last control chunk came from; if
 	 * that is unknown, the association's alternate is used, and failing
 	 * that the primary destination.  When the latest ASCONF-ACK was
 	 * already sent to the net the last control chunk came from, this is
 	 * treated as a retransmission and an alternate net is preferred if
 	 * sctp_find_alternate_net() can supply one.
 	 *
 	 * Every entry of asconf_ack_sent that still has data is copied; the
 	 * cached originals are left untouched.  The function stops silently
 	 * at the first mbuf copy or chunk allocation failure (chunks queued
 	 * before the failure stay queued).
 	 */
 	struct sctp_tmit_chunk *chk;
 	struct sctp_asconf_ack *ack, *latest_ack;
 	struct mbuf *m_ack;
 	struct sctp_nets *net, *alt;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	/* Get the latest ASCONF-ACK */
 	latest_ack = TAILQ_LAST(&stcb->asoc.asconf_ack_sent, sctp_asconf_ackhead);
 	if (latest_ack == NULL) {
 		return;
 	}
 
 	/* Default destination: reply towards where the request came from. */
 	if (stcb->asoc.last_control_chunk_from != NULL) {
 		net = stcb->asoc.last_control_chunk_from;
 	} else if (stcb->asoc.alternate != NULL) {
 		net = stcb->asoc.alternate;
 	} else {
 		net = stcb->asoc.primary_destination;
 	}
 
 	if ((latest_ack->last_sent_to != NULL) &&
 	    (latest_ack->last_sent_to == stcb->asoc.last_control_chunk_from)) {
 		/*
 		 * We're doing a retransmission: try a different path.  Here
 		 * last_control_chunk_from is necessarily non-NULL, so when no
 		 * alternate exists the default chosen above (that same net)
 		 * is kept.
 		 */
 		alt = sctp_find_alternate_net(stcb, stcb->asoc.last_control_chunk_from, 0);
 		if (alt != NULL) {
 			net = alt;
 		}
 	}
 	latest_ack->last_sent_to = net;
 
 	TAILQ_FOREACH(ack, &stcb->asoc.asconf_ack_sent, next) {
 		if (ack->data == NULL) {
 			continue;
 		}
 
 		/* copy the asconf_ack */
 		m_ack = SCTP_M_COPYM(ack->data, 0, M_COPYALL, M_NOWAIT);
 		if (m_ack == NULL) {
 			/* couldn't copy it */
 			return;
 		}
 #ifdef SCTP_MBUF_LOGGING
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_MBUF_LOGGING_ENABLE) {
 			sctp_log_mbc(m_ack, SCTP_MBUF_ICOPY);
 		}
 #endif
 
 		sctp_alloc_a_chunk(stcb, chk);
 		if (chk == NULL) {
 			/* no memory; m_ack is known to be non-NULL here */
 			sctp_m_freem(m_ack);
 			return;
 		}
 		chk->copy_by_ref = 0;
 		chk->rec.chunk_id.id = SCTP_ASCONF_ACK;
 		chk->rec.chunk_id.can_take_data = 1;
 		chk->flags = CHUNK_FLAGS_FRAGMENT_OK;
 		/* The chunk holds a reference on its destination. */
 		chk->whoTo = net;
 		if (chk->whoTo) {
 			atomic_add_int(&chk->whoTo->ref_count, 1);
 		}
 		chk->data = m_ack;
 		chk->send_size = ack->len;
 		chk->sent = SCTP_DATAGRAM_UNSENT;
 		chk->snd_count = 0;
 		chk->asoc = &stcb->asoc;
 
 		TAILQ_INSERT_TAIL(&chk->asoc->control_send_queue, chk, sctp_next);
 		chk->asoc->ctrl_queue_cnt++;
 	}
 	return;
 }
 
 /*
  * Send at most one packet worth of retransmissions for an association.
  *
  * Parameters:
  *   inp        - endpoint; handed to the timer and low-level output calls.
  *   stcb       - association control block; its lock must be held.
  *   asoc       - association whose control_send_queue and sent_queue are
  *                scanned.
  *   cnt_out    - out: reset to 0 on entry, then increased by the number of
  *                chunks that were handed to the low-level output.
  *   now,
  *   now_filled - timestamp cache: when *now_filled is 0 the current time is
  *                fetched, stored in *now and *now_filled is set to 1;
  *                otherwise *now is reused as the send time.
  *   fr_done    - out: set to 1 when the data chunk picked for retransmission
  *                has doing_fast_retransmit set (never cleared here).
  *   so_locked  - passed through unchanged to the helpers called from here.
  *
  * Returns:
  *   0                 - both queues were empty, or one packet (control or
  *                       data) was sent, or no chunk was eligible.
  *   1                 - nothing (more) may be sent now: association still
  *                       in COOKIE-WAIT/COOKIE-ECHOED, peer rwnd exhausted,
  *                       nothing fit, or a single-chunk probe was sent.
  *   SCTP_RETRAN_DONE  - no control chunk was sent and the sent_queue is
  *                       empty.
  *   SCTP_RETRAN_EXIT  - the association was aborted because a chunk hit
  *                       the sctp_max_retran_chunk limit.
  *   ENOMEM            - copying a chunk into the outgoing chain failed.
  *   other errno       - error returned by sctp_lowlevel_chunk_output().
  */
 static int
 sctp_chunk_retransmission(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     struct sctp_association *asoc,
     int *cnt_out, struct timeval *now, int *now_filled, int *fr_done, int so_locked)
 {
 	/*-
 	 * send out one MTU of retransmission. If fast_retransmit is
 	 * happening we ignore the cwnd. Otherwise we obey the cwnd and
 	 * rwnd. For a Cookie or Asconf in the control chunk queue we
 	 * retransmit them by themselves.
 	 *
 	 * For data chunks we will pick out the lowest TSN's in the sent_queue
 	 * marked for resend and bundle them all together (up to a MTU of
 	 * destination). The address to send to should have been
 	 * selected/changed where the retransmission was marked (i.e. in FR
 	 * or t3-timeout routines).
 	 */
 	struct sctp_tmit_chunk *data_list[SCTP_MAX_DATA_BUNDLING];
 	struct sctp_tmit_chunk *chk, *fwd;
 	struct mbuf *m, *endofchain;
 	struct sctp_nets *net = NULL;
 	uint32_t tsns_sent = 0;
 	int no_fragmentflg, bundle_at;
 	unsigned int mtu;
 	int error, i, one_chunk, fwd_tsn, ctl_cnt, tmr_started;
 	struct sctp_auth_chunk *auth = NULL;
 	uint32_t auth_offset = 0;
 	uint16_t auth_keyid;
 	int override_ok = 1;
 	int data_auth_reqd = 0;
 	uint32_t dmtu = 0;
 	bool use_zero_crc;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	tmr_started = ctl_cnt = 0;
 	no_fragmentflg = 1;
 	fwd_tsn = 0;
 	*cnt_out = 0;
 	fwd = NULL;
 	endofchain = m = NULL;
 	auth_keyid = stcb->asoc.authinfo.active_keyid;
 #ifdef SCTP_AUDITING_ENABLED
 	sctp_audit_log(0xC3, 1);
 #endif
 	if ((TAILQ_EMPTY(&asoc->sent_queue)) &&
 	    (TAILQ_EMPTY(&asoc->control_send_queue))) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT1, "SCTP hits empty queue with cnt set to %d?\n",
 		    asoc->sent_queue_retran_cnt);
 		asoc->sent_queue_cnt = 0;
 		asoc->sent_queue_cnt_removeable = 0;
 		/* send back 0/0 so we enter normal transmission */
 		*cnt_out = 0;
 		return (0);
 	}
 	/*
 	 * Phase 1: look for the first COOKIE-ECHO, STREAM-RESET or FWD-TSN
 	 * control chunk that is marked for resend.  Only that one chunk is
 	 * copied into the outgoing chain (the loop breaks right after it).
 	 */
 	TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
 		if ((chk->rec.chunk_id.id == SCTP_COOKIE_ECHO) ||
 		    (chk->rec.chunk_id.id == SCTP_STREAM_RESET) ||
 		    (chk->rec.chunk_id.id == SCTP_FORWARD_CUM_TSN)) {
 			if (chk->sent != SCTP_DATAGRAM_RESEND) {
 				continue;
 			}
 			if (chk->rec.chunk_id.id == SCTP_STREAM_RESET) {
 				if (chk != asoc->str_reset) {
 					/*
 					 * not eligible for retran if its
 					 * not ours
 					 */
 					continue;
 				}
 			}
 			ctl_cnt++;
 			if (chk->rec.chunk_id.id == SCTP_FORWARD_CUM_TSN) {
 				fwd_tsn = 1;
 			}
 			/*
 			 * Add an AUTH chunk, if chunk requires it save the
 			 * offset into the chain for AUTH
 			 */
 			if ((auth == NULL) &&
 			    (sctp_auth_is_required_chunk(chk->rec.chunk_id.id,
 			    stcb->asoc.peer_auth_chunks))) {
 				m = sctp_add_auth_chunk(m, &endofchain,
 				    &auth, &auth_offset,
 				    stcb,
 				    chk->rec.chunk_id.id);
 				SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 			}
 			m = sctp_copy_mbufchain(chk->data, m, &endofchain, 0, chk->send_size, chk->copy_by_ref);
 			break;
 		}
 	}
 	one_chunk = 0;
 	/* do we have control chunks to retransmit? */
 	if (m != NULL) {
 		/*
 		 * m is only non-NULL when the loop above stopped via break,
 		 * so chk still points at the control chunk being resent.
 		 */
 		/* Start a timer no matter if we succeed or fail */
 		use_zero_crc = asoc->zero_checksum == 2;
 		if (chk->rec.chunk_id.id == SCTP_COOKIE_ECHO) {
 			sctp_timer_start(SCTP_TIMER_TYPE_COOKIE, inp, stcb, chk->whoTo);
 			use_zero_crc = false;
 		} else if (chk->rec.chunk_id.id == SCTP_ASCONF) {
 			/*
 			 * XXXMT: Can this happen?  The selection loop above
 			 * never picks an SCTP_ASCONF chunk.
 			 */
 			sctp_timer_start(SCTP_TIMER_TYPE_ASCONF, inp, stcb, chk->whoTo);
 			use_zero_crc = false;
 		}
 		chk->snd_count++;	/* update our count */
 		if ((error = sctp_lowlevel_chunk_output(inp, stcb, chk->whoTo,
 		    (struct sockaddr *)&chk->whoTo->ro._l_addr, m,
 		    auth_offset, auth, stcb->asoc.authinfo.active_keyid,
 		    no_fragmentflg, 0, 0,
 		    inp->sctp_lport, stcb->rport, htonl(stcb->asoc.peer_vtag),
 		    chk->whoTo->port, NULL,
 		    0, 0,
 		    use_zero_crc,
 		    so_locked))) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT3, "Gak send error %d\n", error);
 			if (error == ENOBUFS) {
 				asoc->ifp_had_enobuf = 1;
 				SCTP_STAT_INCR(sctps_lowlevelerr);
 			}
 			return (error);
 		} else {
 			asoc->ifp_had_enobuf = 0;
 		}
 		endofchain = NULL;
 		auth = NULL;
 		auth_offset = 0;
 		/*
 		 * We don't want to mark the net->sent time here since
 		 * we use this for HB and retrans cannot measure RTT
 		 */
 		/* (void)SCTP_GETTIME_TIMEVAL(&chk->whoTo->last_sent_time); */
 		*cnt_out += 1;
 		chk->sent = SCTP_DATAGRAM_SENT;
 		sctp_ucount_decr(stcb->asoc.sent_queue_retran_cnt);
 		if (fwd_tsn == 0) {
 			return (0);
 		} else {
 			/* Clean up the fwd-tsn list */
 			sctp_clean_up_ctl(stcb, asoc, so_locked);
 			return (0);
 		}
 	}
 	/*
 	 * Ok, it is just data retransmission we need to do or that and a
 	 * fwd-tsn with it all.
 	 */
 	if (TAILQ_EMPTY(&asoc->sent_queue)) {
 		return (SCTP_RETRAN_DONE);
 	}
 	if ((SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_ECHOED) ||
 	    (SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_WAIT)) {
 		/* not yet open, resend the cookie and that is it */
 		return (1);
 	}
 #ifdef SCTP_AUDITING_ENABLED
 	sctp_auditing(20, inp, stcb, NULL);
 #endif
 	/*
 	 * Phase 2: data retransmission.  Walk the sent_queue for the first
 	 * chunk marked for resend, bundle further resend chunks for the same
 	 * destination behind it and send one packet.
 	 */
 	data_auth_reqd = sctp_auth_is_required_chunk(SCTP_DATA, stcb->asoc.peer_auth_chunks);
 	TAILQ_FOREACH(chk, &asoc->sent_queue, sctp_next) {
 		if (chk->sent != SCTP_DATAGRAM_RESEND) {
 			/* No, not sent to this net or not ready for rtx */
 			continue;
 		}
 		if (chk->data == NULL) {
 			SCTP_PRINTF("TSN:%x chk->snd_count:%d chk->sent:%d can't retran - no data\n",
 			    chk->rec.data.tsn, chk->snd_count, chk->sent);
 			continue;
 		}
 		/*
 		 * A non-zero sctp_max_retran_chunk limits how often a single
 		 * chunk may be sent; once reached the association is aborted.
 		 */
 		if ((SCTP_BASE_SYSCTL(sctp_max_retran_chunk)) &&
 		    (chk->snd_count >= SCTP_BASE_SYSCTL(sctp_max_retran_chunk))) {
 			struct mbuf *op_err;
 			char msg[SCTP_DIAG_INFO_LEN];
 
 			SCTP_SNPRINTF(msg, sizeof(msg), "TSN %8.8x retransmitted %d times, giving up",
 			    chk->rec.data.tsn, chk->snd_count);
 			op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code),
 			    msg);
 			/*
 			 * NOTE(review): the refcnt is raised around the abort
 			 * and the TCB lock is taken again afterwards;
 			 * presumably sctp_abort_an_association() releases the
 			 * lock and the reference keeps stcb valid - confirm
 			 * against that function.
 			 */
 			atomic_add_int(&stcb->asoc.refcnt, 1);
 			sctp_abort_an_association(stcb->sctp_ep, stcb, op_err,
 			    false, so_locked);
 			SCTP_TCB_LOCK(stcb);
 			atomic_subtract_int(&stcb->asoc.refcnt, 1);
 			return (SCTP_RETRAN_EXIT);
 		}
 		/* pick up the net */
 		net = chk->whoTo;
 		/* Payload budget: path MTU minus the per-family minimum overhead. */
 		switch (net->ro._l_addr.sa.sa_family) {
 #ifdef INET
 		case AF_INET:
 			mtu = net->mtu - SCTP_MIN_V4_OVERHEAD;
 			break;
 #endif
 #ifdef INET6
 		case AF_INET6:
 			mtu = net->mtu - SCTP_MIN_OVERHEAD;
 			break;
 #endif
 		default:
 			/* TSNH */
 			mtu = net->mtu;
 			break;
 		}
 
 		if ((asoc->peers_rwnd < mtu) && (asoc->total_flight > 0)) {
 			/* No room in peers rwnd */
 			uint32_t tsn;
 
 			tsn = asoc->last_acked_seq + 1;
 			if (tsn == chk->rec.data.tsn) {
 				/*
 				 * we make a special exception for this
 				 * case. The peer has no rwnd but is missing
 				 * the lowest chunk.. which is probably what
 				 * is holding up the rwnd.
 				 */
 				goto one_chunk_around;
 			}
 			return (1);
 		}
 one_chunk_around:
 		if (asoc->peers_rwnd < mtu) {
 			/* rwnd is short: send this chunk alone, no bundling. */
 			one_chunk = 1;
 			if ((asoc->peers_rwnd == 0) &&
 			    (asoc->total_flight == 0)) {
 				chk->window_probe = 1;
 				chk->whoTo->window_probe = 1;
 			}
 		}
 #ifdef SCTP_AUDITING_ENABLED
 		sctp_audit_log(0xC3, 2);
 #endif
 		bundle_at = 0;
 		m = NULL;
 		net->fast_retran_ip = 0;
 		if (chk->rec.data.doing_fast_retransmit == 0) {
 			/*
 			 * if no FR in progress skip destination that have
 			 * flight_size > cwnd.
 			 */
 			if (net->flight_size >= net->cwnd) {
 				continue;
 			}
 		} else {
 			/*
 			 * Mark the destination net to have FR recovery
 			 * limits put on it.
 			 */
 			*fr_done = 1;
 			net->fast_retran_ip = 1;
 		}
 
 		/*
 		 * if no AUTH is yet included and this chunk requires it,
 		 * make sure to account for it.  We don't apply the size
 		 * until the AUTH chunk is actually added below in case
 		 * there is no room for this chunk.
 		 */
 		if (data_auth_reqd && (auth == NULL)) {
 			dmtu = sctp_get_auth_chunk_len(stcb->asoc.peer_hmac_id);
 		} else
 			dmtu = 0;
 
 		if ((chk->send_size <= (mtu - dmtu)) ||
 		    (chk->flags & CHUNK_FLAGS_FRAGMENT_OK)) {
 			/* ok we will add this one */
 			if (data_auth_reqd) {
 				if (auth == NULL) {
 					m = sctp_add_auth_chunk(m,
 					    &endofchain,
 					    &auth,
 					    &auth_offset,
 					    stcb,
 					    SCTP_DATA);
 					auth_keyid = chk->auth_keyid;
 					override_ok = 0;
 					SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 				} else if (override_ok) {
 					auth_keyid = chk->auth_keyid;
 					override_ok = 0;
 				} else if (chk->auth_keyid != auth_keyid) {
 					/* different keyid, so done bundling */
 					break;
 				}
 			}
 			m = sctp_copy_mbufchain(chk->data, m, &endofchain, 0, chk->send_size, chk->copy_by_ref);
 			if (m == NULL) {
 				SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 				return (ENOMEM);
 			}
 			/* Do clear IP_DF ? */
 			if (chk->flags & CHUNK_FLAGS_FRAGMENT_OK) {
 				no_fragmentflg = 0;
 			}
 			/* update our MTU size */
 			if (mtu > (chk->send_size + dmtu))
 				mtu -= (chk->send_size + dmtu);
 			else
 				mtu = 0;
 			data_list[bundle_at++] = chk;
 			if (one_chunk && (asoc->total_flight <= 0)) {
 				SCTP_STAT_INCR(sctps_windowprobed);
 			}
 		}
 		if (one_chunk == 0) {
 			/*
 			 * now are there anymore forward from chk to pick
 			 * up?
 			 */
 			for (fwd = TAILQ_NEXT(chk, sctp_next); fwd != NULL; fwd = TAILQ_NEXT(fwd, sctp_next)) {
 				if (fwd->sent != SCTP_DATAGRAM_RESEND) {
 					/* Nope, not for retran */
 					continue;
 				}
 				if (fwd->whoTo != net) {
 					/* Nope, not the net in question */
 					continue;
 				}
 				if (data_auth_reqd && (auth == NULL)) {
 					dmtu = sctp_get_auth_chunk_len(stcb->asoc.peer_hmac_id);
 				} else
 					dmtu = 0;
 				if (fwd->send_size <= (mtu - dmtu)) {
 					if (data_auth_reqd) {
 						if (auth == NULL) {
 							m = sctp_add_auth_chunk(m,
 							    &endofchain,
 							    &auth,
 							    &auth_offset,
 							    stcb,
 							    SCTP_DATA);
 							auth_keyid = fwd->auth_keyid;
 							override_ok = 0;
 							SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 						} else if (override_ok) {
 							auth_keyid = fwd->auth_keyid;
 							override_ok = 0;
 						} else if (fwd->auth_keyid != auth_keyid) {
 							/*
 							 * different keyid,
 							 * so done bundling
 							 */
 							break;
 						}
 					}
 					m = sctp_copy_mbufchain(fwd->data, m, &endofchain, 0, fwd->send_size, fwd->copy_by_ref);
 					if (m == NULL) {
 						SCTP_LTRACE_ERR_RET(inp, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 						return (ENOMEM);
 					}
 					/* Do clear IP_DF ? */
 					if (fwd->flags & CHUNK_FLAGS_FRAGMENT_OK) {
 						no_fragmentflg = 0;
 					}
 					/* update our MTU size */
 					if (mtu > (fwd->send_size + dmtu))
 						mtu -= (fwd->send_size + dmtu);
 					else
 						mtu = 0;
 					data_list[bundle_at++] = fwd;
 					/* data_list is full: stop bundling. */
 					if (bundle_at >= SCTP_MAX_DATA_BUNDLING) {
 						break;
 					}
 				} else {
 					/* can't fit so we are done */
 					break;
 				}
 			}
 		}
 		/* Is there something to send for this destination? */
 		if (m) {
 			/*
 			 * No matter if we fail/or succeed we should start a
 			 * timer. A failure is like a lost IP packet :-)
 			 */
 			if (!SCTP_OS_TIMER_PENDING(&net->rxt_timer.timer)) {
 				/*
 				 * no timer running on this destination
 				 * restart it.
 				 */
 				sctp_timer_start(SCTP_TIMER_TYPE_SEND, inp, stcb, net);
 				tmr_started = 1;
 			}
 			/* Now lets send it, if there is anything to send :> */
 			if ((error = sctp_lowlevel_chunk_output(inp, stcb, net,
 			    (struct sockaddr *)&net->ro._l_addr, m,
 			    auth_offset, auth, auth_keyid,
 			    no_fragmentflg, 0, 0,
 			    inp->sctp_lport, stcb->rport, htonl(stcb->asoc.peer_vtag),
 			    net->port, NULL,
 			    0, 0,
 			    asoc->zero_checksum == 2,
 			    so_locked))) {
 				/* error, we could not output */
 				SCTPDBG(SCTP_DEBUG_OUTPUT3, "Gak send error %d\n", error);
 				if (error == ENOBUFS) {
 					asoc->ifp_had_enobuf = 1;
 					SCTP_STAT_INCR(sctps_lowlevelerr);
 				}
 				return (error);
 			} else {
 				asoc->ifp_had_enobuf = 0;
 			}
 			endofchain = NULL;
 			auth = NULL;
 			auth_offset = 0;
 			/* For HB's */
 			/*
 			 * We don't want to mark the net->sent time here
 			 * since we use this for HB and retrans cannot
 			 * measure RTT
 			 */
 			/* (void)SCTP_GETTIME_TIMEVAL(&net->last_sent_time); */
 
 			/* For auto-close */
 			if (*now_filled == 0) {
 				(void)SCTP_GETTIME_TIMEVAL(&asoc->time_last_sent);
 				*now = asoc->time_last_sent;
 				*now_filled = 1;
 			} else {
 				asoc->time_last_sent = *now;
 			}
 			*cnt_out += bundle_at;
 #ifdef SCTP_AUDITING_ENABLED
 			sctp_audit_log(0xC4, bundle_at);
 #endif
 			if (bundle_at) {
 				tsns_sent = data_list[0]->rec.data.tsn;
 			}
 			/* Per-chunk bookkeeping for everything that went out. */
 			for (i = 0; i < bundle_at; i++) {
 				SCTP_STAT_INCR(sctps_sendretransdata);
 				data_list[i]->sent = SCTP_DATAGRAM_SENT;
 				/*
 				 * When we have a revoked data, and we
 				 * retransmit it, then we clear the revoked
 				 * flag since this flag dictates if we
 				 * subtracted from the fs
 				 */
 				if (data_list[i]->rec.data.chunk_was_revoked) {
 					/* Deflate the cwnd */
 					data_list[i]->whoTo->cwnd -= data_list[i]->book_size;
 					data_list[i]->rec.data.chunk_was_revoked = 0;
 				}
 				data_list[i]->snd_count++;
 				sctp_ucount_decr(asoc->sent_queue_retran_cnt);
 				/* record the time */
 				data_list[i]->sent_rcv_time = asoc->time_last_sent;
 				if (data_list[i]->book_size_scale) {
 					/*
 					 * need to double the book size on
 					 * this one
 					 */
 					data_list[i]->book_size_scale = 0;
 					/*
 					 * Since we double the booksize, we
 					 * must also double the output queue
 					 * size, since this get shrunk when
 					 * we free by this amount.
 					 */
 					atomic_add_int(&((asoc)->total_output_queue_size), data_list[i]->book_size);
 					data_list[i]->book_size *= 2;
 				} else {
 					if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_RWND_ENABLE) {
 						sctp_log_rwnd(SCTP_DECREASE_PEER_RWND,
 						    asoc->peers_rwnd, data_list[i]->send_size, SCTP_BASE_SYSCTL(sctp_peer_chunk_oh));
 					}
 					asoc->peers_rwnd = sctp_sbspace_sub(asoc->peers_rwnd,
 					    (uint32_t)(data_list[i]->send_size +
 					    SCTP_BASE_SYSCTL(sctp_peer_chunk_oh)));
 				}
 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_FLIGHT_LOGGING_ENABLE) {
 					sctp_misc_ints(SCTP_FLIGHT_LOG_UP_RSND,
 					    data_list[i]->whoTo->flight_size,
 					    data_list[i]->book_size,
 					    (uint32_t)(uintptr_t)data_list[i]->whoTo,
 					    data_list[i]->rec.data.tsn);
 				}
 				sctp_flight_size_increase(data_list[i]);
 				sctp_total_flight_increase(stcb, data_list[i]);
 				if (asoc->peers_rwnd < stcb->sctp_ep->sctp_ep.sctp_sws_sender) {
 					/* SWS sender side engages */
 					asoc->peers_rwnd = 0;
 				}
 				if ((i == 0) &&
 				    (data_list[i]->rec.data.doing_fast_retransmit)) {
 					SCTP_STAT_INCR(sctps_sendfastretrans);
 					if ((data_list[i] == TAILQ_FIRST(&asoc->sent_queue)) &&
 					    (tmr_started == 0)) {
 						/*-
 						 * ok we just fast-retrans'd
 						 * the lowest TSN, i.e the
 						 * first on the list. In
 						 * this case we want to give
 						 * some more time to get a
 						 * SACK back without a
 						 * t3-expiring.
 						 */
 						sctp_timer_stop(SCTP_TIMER_TYPE_SEND, inp, stcb, net,
 						    SCTP_FROM_SCTP_OUTPUT + SCTP_LOC_2);
 						sctp_timer_start(SCTP_TIMER_TYPE_SEND, inp, stcb, net);
 					}
 				}
 			}
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 				sctp_log_cwnd(stcb, net, tsns_sent, SCTP_CWND_LOG_FROM_RESEND);
 			}
 #ifdef SCTP_AUDITING_ENABLED
 			sctp_auditing(21, inp, stcb, NULL);
 #endif
 		} else {
 			/* None will fit */
 			return (1);
 		}
 		if (asoc->sent_queue_retran_cnt <= 0) {
 			/* all done we have no more to retran */
 			asoc->sent_queue_retran_cnt = 0;
 			break;
 		}
 		if (one_chunk) {
 			/* No more room in rwnd */
 			return (1);
 		}
 		/* stop the for loop here. we sent out a packet */
 		break;
 	}
 	return (0);
 }
 
 static void
 sctp_timer_validation(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     struct sctp_association *asoc)
 {
 	struct sctp_nets *net;
 
 	/* Validate that a timer is running somewhere */
 	TAILQ_FOREACH(net, &asoc->nets, sctp_next) {
 		if (SCTP_OS_TIMER_PENDING(&net->rxt_timer.timer)) {
 			/* Here is a timer */
 			return;
 		}
 	}
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	/* Gak, we did not have a timer somewhere */
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "Deadlock avoided starting timer on a dest at retran\n");
 	if (asoc->alternate) {
 		sctp_timer_start(SCTP_TIMER_TYPE_SEND, inp, stcb, asoc->alternate);
 	} else {
 		sctp_timer_start(SCTP_TIMER_TYPE_SEND, inp, stcb, asoc->primary_destination);
 	}
 	return;
 }
 
 /*
  * Generic output entry point for an association: first service pending
  * retransmissions, then push control and new data through
  * sctp_med_chunk_output() until nothing more can be sent.
  *
  * Parameters:
  *   inp        - endpoint owning the association.
  *   stcb       - association control block; its lock must be held.
  *   from_where - identifies the caller.  The values examined here are
  *                SCTP_OUTPUT_FROM_USR_SEND (Nagle may apply),
  *                SCTP_OUTPUT_FROM_COOKIE_ACK (control only while
  *                retransmissions are pending), SCTP_OUTPUT_FROM_HB_TMR
  *                (no data retransmission) and SCTP_OUTPUT_FROM_T3 (one
  *                retransmission packet only).
  *   so_locked  - passed through unchanged to the helpers called from here.
  *
  * Returns nothing; errors from the lower layers end the send loop and are
  * only logged.
  */
 void
 sctp_chunk_output(struct sctp_inpcb *inp,
     struct sctp_tcb *stcb,
     int from_where,
     int so_locked)
 {
 	/*-
 	 * Ok this is the generic chunk service queue. we must do the
 	 * following:
 	 * - See if there are retransmits pending, if so we must
 	 *   do these first.
 	 * - Service the stream queue that is next, moving any
 	 *   message (note I must get a complete message i.e.
 	 *   FIRST/MIDDLE and LAST to the out queue in one pass) and assigning
 	 *   TSN's
 	 * - Check to see if the cwnd/rwnd allows any output, if so we
 	 *   go ahead and formulate and send the low level chunks. Making sure
 	 *   to combine any control in the control chunk queue also.
 	 */
 	struct sctp_association *asoc;
 	struct sctp_nets *net;
 	int error = 0, num_out, tot_out = 0, ret = 0, reason_code;
 	unsigned int burst_cnt = 0;
 	struct timeval now;
 	int now_filled = 0;
 	int nagle_on;
 	uint32_t frag_point = sctp_get_frag_point(stcb);
 	int un_sent = 0;
 	int fr_done;
 	unsigned int tot_frs = 0;
 
 	asoc = &stcb->asoc;
 	/* Re-entered from the bottom when a stream reset request was queued. */
 do_it_again:
 	/* The Nagle algorithm is only applied when handling a send call. */
 	if (from_where == SCTP_OUTPUT_FROM_USR_SEND) {
 		if (sctp_is_feature_on(inp, SCTP_PCB_FLAGS_NODELAY)) {
 			nagle_on = 0;
 		} else {
 			nagle_on = 1;
 		}
 	} else {
 		nagle_on = 0;
 	}
 	SCTP_TCB_LOCK_ASSERT(stcb);
 
 	un_sent = (stcb->asoc.total_output_queue_size - stcb->asoc.total_flight);
 
 	if ((un_sent <= 0) &&
 	    (TAILQ_EMPTY(&asoc->control_send_queue)) &&
 	    (TAILQ_EMPTY(&asoc->asconf_send_queue)) &&
 	    (asoc->sent_queue_retran_cnt == 0) &&
 	    (asoc->trigger_reset == 0)) {
 		/* Nothing to do unless there is something to be sent left */
 		return;
 	}
 	/*
 	 * Do we have something to send, data or control AND a sack timer
 	 * running, if so piggy-back the sack.
 	 */
 	if (SCTP_OS_TIMER_PENDING(&stcb->asoc.dack_timer.timer)) {
 		sctp_send_sack(stcb, so_locked);
 		sctp_timer_stop(SCTP_TIMER_TYPE_RECV, stcb->sctp_ep, stcb, NULL,
 		    SCTP_FROM_SCTP_OUTPUT + SCTP_LOC_3);
 	}
 	while (asoc->sent_queue_retran_cnt) {
 		/*-
 		 * Ok, it is retransmission time only, we send out only ONE
 		 * packet with a single call off to the retran code.
 		 */
 		if (from_where == SCTP_OUTPUT_FROM_COOKIE_ACK) {
 			/*-
 			 * Special hook for handling cookies discarded
 			 * by peer that carried data. Send cookie-ack only
 			 * and then the next call will get the retran's.
 			 */
 			(void)sctp_med_chunk_output(inp, stcb, asoc, &num_out, &reason_code, 1,
 			    from_where,
 			    &now, &now_filled, frag_point, so_locked);
 			return;
 		} else if (from_where != SCTP_OUTPUT_FROM_HB_TMR) {
 			/* if its not from a HB then do it */
 			fr_done = 0;
 			ret = sctp_chunk_retransmission(inp, stcb, asoc, &num_out, &now, &now_filled, &fr_done, so_locked);
 			if (fr_done) {
 				tot_frs++;
 			}
 		} else {
 			/*
 			 * called from the HB timer: we don't allow retran
 			 * output (only control)
 			 */
 			ret = 1;
 		}
 		if (ret > 0) {
 			/* Can't send anymore */
 			/*-
 			 * now lets push out control by calling med-level
 			 * output once. this assures that we WILL send HB's
 			 * if queued too.
 			 */
 			(void)sctp_med_chunk_output(inp, stcb, asoc, &num_out, &reason_code, 1,
 			    from_where,
 			    &now, &now_filled, frag_point, so_locked);
 #ifdef SCTP_AUDITING_ENABLED
 			sctp_auditing(8, inp, stcb, NULL);
 #endif
 			sctp_timer_validation(inp, stcb, asoc);
 			return;
 		}
 		if (ret < 0) {
 			/*-
 			 * The count was off.. retran is not happening so do
 			 * the normal transmission below, unless the retran
 			 * code asked us to exit.
 			 */
 #ifdef SCTP_AUDITING_ENABLED
 			sctp_auditing(9, inp, stcb, NULL);
 #endif
 			if (ret == SCTP_RETRAN_EXIT) {
 				return;
 			}
 			break;
 		}
 		if (from_where == SCTP_OUTPUT_FROM_T3) {
 			/* Only one transmission allowed out of a timeout */
 #ifdef SCTP_AUDITING_ENABLED
 			sctp_auditing(10, inp, stcb, NULL);
 #endif
 			/* Push out any control */
 			(void)sctp_med_chunk_output(inp, stcb, asoc, &num_out, &reason_code, 1, from_where,
 			    &now, &now_filled, frag_point, so_locked);
 			return;
 		}
 		if ((asoc->fr_max_burst > 0) && (tot_frs >= asoc->fr_max_burst)) {
 			/* Hit FR burst limit */
 			return;
 		}
 		if ((num_out == 0) && (ret == 0)) {
 			/* No more retrans to send */
 			break;
 		}
 	}
 #ifdef SCTP_AUDITING_ENABLED
 	sctp_auditing(12, inp, stcb, NULL);
 #endif
 	/* Check for bad destinations, if they exist move chunks around. */
 	TAILQ_FOREACH(net, &asoc->nets, sctp_next) {
 		if ((net->dest_state & SCTP_ADDR_REACHABLE) == 0) {
 			/*-
 			 * if possible move things off of this address we
 			 * still may send below due to the dormant state but
 			 * we try to find an alternate address to send to
 			 * and if we have one we move all queued data on the
 			 * out wheel to this alternate address.
 			 */
 			if (net->ref_count > 1)
 				sctp_move_chunks_from_net(stcb, net);
 		} else {
 			/*-
 			 * if ((asoc->sat_network) || (net->addr_is_local))
 			 * { burst_limit = asoc->max_burst *
 			 * SCTP_SAT_NETWORK_BURST_INCR; }
 			 */
 			if (asoc->max_burst > 0) {
 				if (SCTP_BASE_SYSCTL(sctp_use_cwnd_based_maxburst)) {
 					if ((net->flight_size + (asoc->max_burst * net->mtu)) < net->cwnd) {
 						/*
 						 * JRS - Use the congestion
 						 * control given in the
 						 * congestion control module
 						 */
 						asoc->cc_functions.sctp_cwnd_update_after_output(stcb, net, asoc->max_burst);
 						if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_MAXBURST_ENABLE) {
 							sctp_log_maxburst(stcb, net, 0, asoc->max_burst, SCTP_MAX_BURST_APPLIED);
 						}
 						SCTP_STAT_INCR(sctps_maxburstqueued);
 					}
 					net->fast_retran_ip = 0;
 				} else {
 					if (net->flight_size == 0) {
 						/*
 						 * Should be decaying the
 						 * cwnd here (intentionally
 						 * left empty)
 						 */
 						;
 					}
 				}
 			}
 		}
 	}
 	/*
 	 * Main send loop: each pass asks the med-level output for one round
 	 * and stops on error, when nothing went out, when Nagle holds data
 	 * back, when the queues are drained or when the count-based burst
 	 * limit is reached.
 	 */
 	burst_cnt = 0;
 	do {
 		error = sctp_med_chunk_output(inp, stcb, asoc, &num_out,
 		    &reason_code, 0, from_where,
 		    &now, &now_filled, frag_point, so_locked);
 		if (error) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT1, "Error %d was returned from med-c-op\n", error);
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_MAXBURST_ENABLE) {
 				sctp_log_maxburst(stcb, asoc->primary_destination, error, burst_cnt, SCTP_MAX_BURST_ERROR_STOP);
 			}
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 				sctp_log_cwnd(stcb, NULL, error, SCTP_SEND_NOW_COMPLETES);
 				sctp_log_cwnd(stcb, NULL, 0xdeadbeef, SCTP_SEND_NOW_COMPLETES);
 			}
 			break;
 		}
 		SCTPDBG(SCTP_DEBUG_OUTPUT3, "m-c-o put out %d\n", num_out);
 
 		tot_out += num_out;
 		burst_cnt++;
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 			sctp_log_cwnd(stcb, NULL, num_out, SCTP_SEND_NOW_COMPLETES);
 			if (num_out == 0) {
 				sctp_log_cwnd(stcb, NULL, reason_code, SCTP_SEND_NOW_COMPLETES);
 			}
 		}
 		if (nagle_on) {
 			/*
 			 * When the Nagle algorithm is used, look at how
 			 * much is unsent, then if its smaller than an MTU
 			 * and we have data in flight we stop, except if we
 			 * are handling a fragmented user message.
 			 */
 			un_sent = stcb->asoc.total_output_queue_size - stcb->asoc.total_flight;
 			if ((un_sent < (int)(stcb->asoc.smallest_mtu - SCTP_MIN_OVERHEAD)) &&
 			    (stcb->asoc.total_flight > 0)) {
 /*	&&		     sctp_is_feature_on(inp, SCTP_PCB_FLAGS_EXPLICIT_EOR))) {*/
 				break;
 			}
 		}
 		if (TAILQ_EMPTY(&asoc->control_send_queue) &&
 		    TAILQ_EMPTY(&asoc->send_queue) &&
 		    sctp_is_there_unsent_data(stcb, so_locked) == 0) {
 			/* Nothing left to send */
 			break;
 		}
 		if ((stcb->asoc.total_output_queue_size - stcb->asoc.total_flight) <= 0) {
 			/* Nothing left to send */
 			break;
 		}
 	} while (num_out &&
 	    ((asoc->max_burst == 0) ||
 	    SCTP_BASE_SYSCTL(sctp_use_cwnd_based_maxburst) ||
 	    (burst_cnt < asoc->max_burst)));
 
 	/* Record whether the count-based burst limit ended the loop. */
 	if (SCTP_BASE_SYSCTL(sctp_use_cwnd_based_maxburst) == 0) {
 		if ((asoc->max_burst > 0) && (burst_cnt >= asoc->max_burst)) {
 			SCTP_STAT_INCR(sctps_maxburstqueued);
 			asoc->burst_limit_applied = 1;
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_MAXBURST_ENABLE) {
 				sctp_log_maxburst(stcb, asoc->primary_destination, 0, burst_cnt, SCTP_MAX_BURST_APPLIED);
 			}
 		} else {
 			asoc->burst_limit_applied = 0;
 		}
 	}
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_CWND_LOGGING_ENABLE) {
 		sctp_log_cwnd(stcb, NULL, tot_out, SCTP_SEND_NOW_COMPLETES);
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "Ok, we have put out %d chunks\n",
 	    tot_out);
 
 	/*-
 	 * Now we need to clean up the control chunk chain if a ECNE is on
 	 * it. It must be marked as UNSENT again so next call will continue
 	 * to send it until such time that we get a CWR, to remove it.
 	 */
 	if (stcb->asoc.ecn_echo_cnt_onq)
 		sctp_fix_ecn_echo(asoc);
 
 	/*
 	 * A stream reset is waiting to be triggered: if a request could be
 	 * queued (helper returned 0), run the whole output pass again.
 	 */
 	if (stcb->asoc.trigger_reset) {
 		if (sctp_send_stream_reset_out_if_possible(stcb, so_locked) == 0) {
 			goto do_it_again;
 		}
 	}
 	return;
 }
 
 /*
  * Thin front end to sctp_sosend(): validate that the endpoint exists and
  * is attached to a socket, then hand the data (m), destination address,
  * control mbuf, flags and thread straight to sctp_sosend() with no uio.
  * Returns EINVAL when inp or its socket is NULL, otherwise whatever
  * sctp_sosend() returns.
  */
 int
 sctp_output(
     struct sctp_inpcb *inp,
     struct mbuf *m,
     struct sockaddr *addr,
     struct mbuf *control,
     struct thread *p,
     int flags)
 {
 	struct socket *so;
 
 	/* No endpoint at all. */
 	if (inp == NULL) {
 		SCTP_LTRACE_ERR_RET_PKT(m, inp, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 		return (EINVAL);
 	}
 
 	/* Endpoint exists but is not attached to a socket. */
 	so = inp->sctp_socket;
 	if (so == NULL) {
 		SCTP_LTRACE_ERR_RET_PKT(m, inp, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 		return (EINVAL);
 	}
 
 	return (sctp_sosend(so, addr, (struct uio *)NULL, m, control, flags, p));
 }
 
 void
 send_forward_tsn(struct sctp_tcb *stcb,
     struct sctp_association *asoc)
 {
 	struct sctp_tmit_chunk *chk, *at, *tp1, *last;
 	struct sctp_forward_tsn_chunk *fwdtsn;
 	struct sctp_strseq *strseq;
 	struct sctp_strseq_mid *strseq_m;
 	uint32_t advance_peer_ack_point;
 	unsigned int cnt_of_space, i, ovh;
 	unsigned int space_needed;
 	unsigned int cnt_of_skipped = 0;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
 		if (chk->rec.chunk_id.id == SCTP_FORWARD_CUM_TSN) {
 			/* mark it to unsent */
 			chk->sent = SCTP_DATAGRAM_UNSENT;
 			chk->snd_count = 0;
 			/* Do we correct its output location? */
 			if (chk->whoTo) {
 				sctp_free_remote_addr(chk->whoTo);
 				chk->whoTo = NULL;
 			}
 			goto sctp_fill_in_rest;
 		}
 	}
 	/* Ok if we reach here we must build one */
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		return;
 	}
 	asoc->fwd_tsn_cnt++;
 	chk->copy_by_ref = 0;
 	/*
 	 * We don't do the old thing here since this is used not for on-wire
 	 * but to tell if we are sending a fwd-tsn by the stack during
 	 * output. And if its a IFORWARD or a FORWARD it is a fwd-tsn.
 	 */
 	chk->rec.chunk_id.id = SCTP_FORWARD_CUM_TSN;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->flags = 0;
 	chk->asoc = asoc;
 	chk->whoTo = NULL;
 	chk->data = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_DATA);
 	if (chk->data == NULL) {
 		sctp_free_a_chunk(stcb, chk, SCTP_SO_NOT_LOCKED);
 		return;
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	TAILQ_INSERT_TAIL(&asoc->control_send_queue, chk, sctp_next);
 	asoc->ctrl_queue_cnt++;
 sctp_fill_in_rest:
 	/*-
 	 * Here we go through and fill out the part that deals with
 	 * stream/seq of the ones we skip.
 	 */
 	SCTP_BUF_LEN(chk->data) = 0;
 	TAILQ_FOREACH(at, &asoc->sent_queue, sctp_next) {
 		if ((at->sent != SCTP_FORWARD_TSN_SKIP) &&
 		    (at->sent != SCTP_DATAGRAM_NR_ACKED)) {
 			/* no more to look at */
 			break;
 		}
 		if (!asoc->idata_supported && (at->rec.data.rcv_flags & SCTP_DATA_UNORDERED)) {
 			/* We don't report these */
 			continue;
 		}
 		cnt_of_skipped++;
 	}
 	if (asoc->idata_supported) {
 		space_needed = (sizeof(struct sctp_forward_tsn_chunk) +
 		    (cnt_of_skipped * sizeof(struct sctp_strseq_mid)));
 	} else {
 		space_needed = (sizeof(struct sctp_forward_tsn_chunk) +
 		    (cnt_of_skipped * sizeof(struct sctp_strseq)));
 	}
 	cnt_of_space = (unsigned int)M_TRAILINGSPACE(chk->data);
 
 	if (stcb->sctp_ep->sctp_flags & SCTP_PCB_FLAGS_BOUND_V6) {
 		ovh = SCTP_MIN_OVERHEAD;
 	} else {
 		ovh = SCTP_MIN_V4_OVERHEAD;
 	}
 	if (cnt_of_space > (asoc->smallest_mtu - ovh)) {
 		/* trim to a mtu size */
 		cnt_of_space = asoc->smallest_mtu - ovh;
 	}
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_TRY_ADVANCE) {
 		sctp_misc_ints(SCTP_FWD_TSN_CHECK,
 		    0xff, 0, cnt_of_skipped,
 		    asoc->advanced_peer_ack_point);
 	}
 	advance_peer_ack_point = asoc->advanced_peer_ack_point;
 	if (cnt_of_space < space_needed) {
 		/*-
 		 * ok we must trim down the chunk by lowering the
 		 * advance peer ack point.
 		 */
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_TRY_ADVANCE) {
 			sctp_misc_ints(SCTP_FWD_TSN_CHECK,
 			    0xff, 0xff, cnt_of_space,
 			    space_needed);
 		}
 		cnt_of_skipped = cnt_of_space - sizeof(struct sctp_forward_tsn_chunk);
 		if (asoc->idata_supported) {
 			cnt_of_skipped /= sizeof(struct sctp_strseq_mid);
 		} else {
 			cnt_of_skipped /= sizeof(struct sctp_strseq);
 		}
 		/*-
 		 * Go through and find the TSN that will be the one
 		 * we report.
 		 */
 		at = TAILQ_FIRST(&asoc->sent_queue);
 		if (at != NULL) {
 			for (i = 0; i < cnt_of_skipped; i++) {
 				tp1 = TAILQ_NEXT(at, sctp_next);
 				if (tp1 == NULL) {
 					break;
 				}
 				at = tp1;
 			}
 		}
 		if (at && SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LOG_TRY_ADVANCE) {
 			sctp_misc_ints(SCTP_FWD_TSN_CHECK,
 			    0xff, cnt_of_skipped, at->rec.data.tsn,
 			    asoc->advanced_peer_ack_point);
 		}
 		last = at;
 		/*-
 		 * last now points to last one I can report, update
 		 * peer ack point
 		 */
 		if (last) {
 			advance_peer_ack_point = last->rec.data.tsn;
 		}
 		if (asoc->idata_supported) {
 			space_needed = sizeof(struct sctp_forward_tsn_chunk) +
 			    cnt_of_skipped * sizeof(struct sctp_strseq_mid);
 		} else {
 			space_needed = sizeof(struct sctp_forward_tsn_chunk) +
 			    cnt_of_skipped * sizeof(struct sctp_strseq);
 		}
 	}
 	chk->send_size = space_needed;
 	/* Setup the chunk */
 	fwdtsn = mtod(chk->data, struct sctp_forward_tsn_chunk *);
 	fwdtsn->ch.chunk_length = htons(chk->send_size);
 	fwdtsn->ch.chunk_flags = 0;
 	if (asoc->idata_supported) {
 		fwdtsn->ch.chunk_type = SCTP_IFORWARD_CUM_TSN;
 	} else {
 		fwdtsn->ch.chunk_type = SCTP_FORWARD_CUM_TSN;
 	}
 	fwdtsn->new_cumulative_tsn = htonl(advance_peer_ack_point);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	fwdtsn++;
 	/*-
 	 * Move pointer to after the fwdtsn and transfer to the
 	 * strseq pointer.
 	 */
 	if (asoc->idata_supported) {
 		strseq_m = (struct sctp_strseq_mid *)fwdtsn;
 		strseq = NULL;
 	} else {
 		strseq = (struct sctp_strseq *)fwdtsn;
 		strseq_m = NULL;
 	}
 	/*-
 	 * Now populate the strseq list. This is done blindly
 	 * without pulling out duplicate stream info. This is
 	 * inefficient but won't harm the process since the peer will
 	 * look at these in sequence and will thus release anything.
 	 * It could mean we exceed the PMTU and chop off some that
 	 * we could have included.. but this is unlikely (aka 1432/4
 	 * would mean 300+ stream seq's would have to be reported in
 	 * one FWD-TSN. With a bit of work we can later FIX this to
 	 * optimize and pull out duplicates.. but it does add more
 	 * overhead. So for now... not!
 	 */
 	i = 0;
 	TAILQ_FOREACH(at, &asoc->sent_queue, sctp_next) {
 		if (i >= cnt_of_skipped) {
 			break;
 		}
 		if (!asoc->idata_supported && (at->rec.data.rcv_flags & SCTP_DATA_UNORDERED)) {
 			/* We don't report these */
 			continue;
 		}
 		if (at->rec.data.tsn == advance_peer_ack_point) {
 			at->rec.data.fwd_tsn_cnt = 0;
 		}
 		if (asoc->idata_supported) {
 			strseq_m->sid = htons(at->rec.data.sid);
 			if (at->rec.data.rcv_flags & SCTP_DATA_UNORDERED) {
 				strseq_m->flags = htons(PR_SCTP_UNORDERED_FLAG);
 			} else {
 				strseq_m->flags = 0;
 			}
 			strseq_m->mid = htonl(at->rec.data.mid);
 			strseq_m++;
 		} else {
 			strseq->sid = htons(at->rec.data.sid);
 			strseq->ssn = htons((uint16_t)at->rec.data.mid);
 			strseq++;
 		}
 		i++;
 	}
 	return;
 }
 
 /*
  * Build a SACK (or an NR-SACK when the association has NR-SACK support)
  * and append it to the tail of the association's control send queue.
  *
  * A chunk of the same type that is already sitting on the control queue is
  * unlinked and its chunk structure is reused; otherwise a new chunk is
  * allocated.  Gap ack blocks are derived from the mapping arrays one byte
  * at a time through the sack_array lookup table, duplicate TSNs are
  * appended afterwards, and both are bounded by the smaller of the mbuf's
  * trailing space and the destination MTU minus SCTP_MIN_OVERHEAD.
  *
  * Nothing is queued when no data chunk has been received yet
  * (asoc->last_data_chunk_from == NULL).  When a chunk or mbuf cannot be
  * obtained, the RECV timer is restarted if delayed_ack is set, otherwise
  * asoc.send_sack is set to 1.
  *
  * stcb:      association control block; SCTP_TCB_LOCK_ASSERT() is applied.
  * so_locked: handed through to sctp_free_a_chunk() on the failure path.
  */
 void
 sctp_send_sack(struct sctp_tcb *stcb, int so_locked)
 {
 	/*-
 	 * Queue up a SACK or NR-SACK in the control queue.
 	 * We must first check to see if a SACK or NR-SACK is
 	 * somehow on the control queue.
 	 * If so, we will take and remove the old one.
 	 */
 	struct sctp_association *asoc;
 	struct sctp_tmit_chunk *chk, *a_chk;
 	struct sctp_sack_chunk *sack;
 	struct sctp_nr_sack_chunk *nr_sack;
 	struct sctp_gap_ack_block *gap_descriptor;
 	const struct sack_track *selector;
 	int mergeable = 0;
 	int offset;
 	caddr_t limit;
 	uint32_t *dup;
 	int limit_reached = 0;
 	unsigned int i, siz, j;
 	unsigned int num_gap_blocks = 0, num_nr_gap_blocks = 0, space;
 	int num_dups = 0;
 	int space_req;
 	uint32_t highest_tsn;
 	uint8_t flags;
 	uint8_t type;
 	uint8_t tsn_map;
 
 	/* The chunk type follows the association's NR-SACK support flag. */
 	if (stcb->asoc.nrsack_supported == 1) {
 		type = SCTP_NR_SELECTIVE_ACK;
 	} else {
 		type = SCTP_SELECTIVE_ACK;
 	}
 	a_chk = NULL;
 	asoc = &stcb->asoc;
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	if (asoc->last_data_chunk_from == NULL) {
 		/* Hmm we never received anything */
 		return;
 	}
 	sctp_slide_mapping_arrays(stcb);
 	sctp_set_rwnd(stcb, asoc);
 	TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
 		if (chk->rec.chunk_id.id == type) {
 			/* Hmm, found a sack already on queue, remove it */
 			TAILQ_REMOVE(&asoc->control_send_queue, chk, sctp_next);
 			asoc->ctrl_queue_cnt--;
 			a_chk = chk;
 			/* Drop the stale payload and destination; both are rebuilt below. */
 			if (a_chk->data) {
 				sctp_m_freem(a_chk->data);
 				a_chk->data = NULL;
 			}
 			if (a_chk->whoTo) {
 				sctp_free_remote_addr(a_chk->whoTo);
 				a_chk->whoTo = NULL;
 			}
 			break;
 		}
 	}
 	if (a_chk == NULL) {
 		sctp_alloc_a_chunk(stcb, a_chk);
 		if (a_chk == NULL) {
 			/* No memory so we drop the idea, and set a timer */
 			if (stcb->asoc.delayed_ack) {
 				sctp_timer_stop(SCTP_TIMER_TYPE_RECV,
 				    stcb->sctp_ep, stcb, NULL,
 				    SCTP_FROM_SCTP_OUTPUT + SCTP_LOC_4);
 				sctp_timer_start(SCTP_TIMER_TYPE_RECV,
 				    stcb->sctp_ep, stcb, NULL);
 			} else {
 				stcb->asoc.send_sack = 1;
 			}
 			return;
 		}
 		a_chk->copy_by_ref = 0;
 		a_chk->rec.chunk_id.id = type;
 		a_chk->rec.chunk_id.can_take_data = 1;
 	}
 	/* Clear our pkt counts */
 	asoc->data_pkts_seen = 0;
 
 	a_chk->flags = 0;
 	a_chk->asoc = asoc;
 	a_chk->snd_count = 0;
 	a_chk->send_size = 0;	/* fill in later */
 	a_chk->sent = SCTP_DATAGRAM_UNSENT;
 	a_chk->whoTo = NULL;
 
 	if ((asoc->last_data_chunk_from->dest_state & SCTP_ADDR_REACHABLE) == 0) {
 		/*-
 		 * Ok, the destination for the SACK is unreachable, lets see if
 		 * we can select an alternate to asoc->last_data_chunk_from
 		 */
 		a_chk->whoTo = sctp_find_alternate_net(stcb, asoc->last_data_chunk_from, 0);
 		if (a_chk->whoTo == NULL) {
 			/* Nope, no alternate */
 			a_chk->whoTo = asoc->last_data_chunk_from;
 		}
 	} else {
 		a_chk->whoTo = asoc->last_data_chunk_from;
 	}
 	/* The chunk holds its own reference on the chosen destination. */
 	if (a_chk->whoTo) {
 		atomic_add_int(&a_chk->whoTo->ref_count, 1);
 	}
 	/* highest_tsn is the later of the two map high-water marks. */
 	if (SCTP_TSN_GT(asoc->highest_tsn_inside_map, asoc->highest_tsn_inside_nr_map)) {
 		highest_tsn = asoc->highest_tsn_inside_map;
 	} else {
 		highest_tsn = asoc->highest_tsn_inside_nr_map;
 	}
 	if (highest_tsn == asoc->cumulative_tsn) {
 		/* no gaps */
 		if (type == SCTP_SELECTIVE_ACK) {
 			space_req = sizeof(struct sctp_sack_chunk);
 		} else {
 			space_req = sizeof(struct sctp_nr_sack_chunk);
 		}
 	} else {
 		/* gaps get a cluster */
 		space_req = MCLBYTES;
 	}
 	/* Ok now lets formulate a MBUF with our sack */
 	a_chk->data = sctp_get_mbuf_for_msg(space_req, 0, M_NOWAIT, 1, MT_DATA);
 	if ((a_chk->data == NULL) ||
 	    (a_chk->whoTo == NULL)) {
 		/* rats, no mbuf memory */
 		if (a_chk->data) {
 			/* was a problem with the destination */
 			sctp_m_freem(a_chk->data);
 			a_chk->data = NULL;
 		}
 		sctp_free_a_chunk(stcb, a_chk, so_locked);
 		/* sa_ignore NO_NULL_CHK */
 		if (stcb->asoc.delayed_ack) {
 			sctp_timer_stop(SCTP_TIMER_TYPE_RECV,
 			    stcb->sctp_ep, stcb, NULL,
 			    SCTP_FROM_SCTP_OUTPUT + SCTP_LOC_5);
 			sctp_timer_start(SCTP_TIMER_TYPE_RECV,
 			    stcb->sctp_ep, stcb, NULL);
 		} else {
 			stcb->asoc.send_sack = 1;
 		}
 		return;
 	}
 	/* ok, lets go through and fill it in */
 	SCTP_BUF_RESV_UF(a_chk->data, SCTP_MIN_OVERHEAD);
 	space = (unsigned int)M_TRAILINGSPACE(a_chk->data);
 	if (space > (a_chk->whoTo->mtu - SCTP_MIN_OVERHEAD)) {
 		space = (a_chk->whoTo->mtu - SCTP_MIN_OVERHEAD);
 	}
 	/* limit is the first byte past the region the chunk may occupy. */
 	limit = mtod(a_chk->data, caddr_t);
 	limit += space;
 
 	flags = 0;
 
 	if ((asoc->sctp_cmt_on_off > 0) &&
 	    SCTP_BASE_SYSCTL(sctp_cmt_use_dac)) {
 		/*-
 		 * CMT DAC algorithm: If 2 (i.e., 0x10) packets have been
 		 * received, then set high bit to 1, else 0. Reset
 		 * pkts_rcvd.
 		 */
 		flags |= (asoc->cmt_dac_pkts_rcvd << 6);
 		asoc->cmt_dac_pkts_rcvd = 0;
 	}
 #ifdef SCTP_ASOCLOG_OF_TSNS
 	stcb->asoc.cumack_logsnt[stcb->asoc.cumack_log_atsnt] = asoc->cumulative_tsn;
 	stcb->asoc.cumack_log_atsnt++;
 	if (stcb->asoc.cumack_log_atsnt >= SCTP_TSN_LOG_SIZE) {
 		stcb->asoc.cumack_log_atsnt = 0;
 	}
 #endif
 	/* reset the readers interpretation */
 	stcb->freed_by_sorcv_sincelast = 0;
 
 	/*
 	 * Locate the first gap block slot right behind the fixed header and
 	 * work out siz, the number of mapping-array bytes to scan.  The else
 	 * branches of the siz computation cover a high-water mark that is not
 	 * numerically above the base (presumably TSN wrap-around -- confirm).
 	 */
 	if (type == SCTP_SELECTIVE_ACK) {
 		sack = mtod(a_chk->data, struct sctp_sack_chunk *);
 		nr_sack = NULL;
 		gap_descriptor = (struct sctp_gap_ack_block *)((caddr_t)sack + sizeof(struct sctp_sack_chunk));
 		if (highest_tsn > asoc->mapping_array_base_tsn) {
 			siz = (((highest_tsn - asoc->mapping_array_base_tsn) + 1) + 7) / 8;
 		} else {
 			siz = (((MAX_TSN - asoc->mapping_array_base_tsn) + 1) + highest_tsn + 7) / 8;
 		}
 	} else {
 		sack = NULL;
 		nr_sack = mtod(a_chk->data, struct sctp_nr_sack_chunk *);
 		gap_descriptor = (struct sctp_gap_ack_block *)((caddr_t)nr_sack + sizeof(struct sctp_nr_sack_chunk));
 		if (asoc->highest_tsn_inside_map > asoc->mapping_array_base_tsn) {
 			siz = (((asoc->highest_tsn_inside_map - asoc->mapping_array_base_tsn) + 1) + 7) / 8;
 		} else {
 			siz = (((MAX_TSN - asoc->mapping_array_base_tsn) + 1) + asoc->highest_tsn_inside_map + 7) / 8;
 		}
 	}
 
 	/*
 	 * offset is added to the per-byte gap positions taken from sack_array
 	 * and grows by 8 for every mapping-array byte consumed.
 	 */
 	if (SCTP_TSN_GT(asoc->mapping_array_base_tsn, asoc->cumulative_tsn)) {
 		offset = 1;
 	} else {
 		offset = asoc->mapping_array_base_tsn - asoc->cumulative_tsn;
 	}
 	if (((type == SCTP_SELECTIVE_ACK) &&
 	    SCTP_TSN_GT(highest_tsn, asoc->cumulative_tsn)) ||
 	    ((type == SCTP_NR_SELECTIVE_ACK) &&
 	    SCTP_TSN_GT(asoc->highest_tsn_inside_map, asoc->cumulative_tsn))) {
 		/* we have a gap .. maybe */
 		for (i = 0; i < siz; i++) {
 			tsn_map = asoc->mapping_array[i];
 			/* A plain SACK reports both maps combined. */
 			if (type == SCTP_SELECTIVE_ACK) {
 				tsn_map |= asoc->nr_mapping_array[i];
 			}
 			if (i == 0) {
 				/*
 				 * Clear all bits corresponding to TSNs
 				 * smaller or equal to the cumulative TSN.
 				 */
 				tsn_map &= (~0U << (1 - offset));
 			}
 			selector = &sack_array[tsn_map];
 			if (mergeable && selector->right_edge) {
 				/*
 				 * Backup, left and right edges were ok to
 				 * merge.
 				 */
 				num_gap_blocks--;
 				gap_descriptor--;
 			}
 			if (selector->num_entries == 0)
 				mergeable = 0;
 			else {
 				for (j = 0; j < selector->num_entries; j++) {
 					if (mergeable && selector->right_edge) {
 						/*
 						 * do a merge by NOT setting
 						 * the left side
 						 */
 						mergeable = 0;
 					} else {
 						/*
 						 * no merge, set the left
 						 * side
 						 */
 						mergeable = 0;
 						gap_descriptor->start = htons((selector->gaps[j].start + offset));
 					}
 					gap_descriptor->end = htons((selector->gaps[j].end + offset));
 					num_gap_blocks++;
 					gap_descriptor++;
 					/* Stop once another full block would cross limit. */
 					if (((caddr_t)gap_descriptor + sizeof(struct sctp_gap_ack_block)) > limit) {
 						/* no more room */
 						limit_reached = 1;
 						break;
 					}
 				}
 				if (selector->left_edge) {
 					mergeable = 1;
 				}
 			}
 			if (limit_reached) {
 				/* Reached the limit stop */
 				break;
 			}
 			offset += 8;
 		}
 	}
 	/*
 	 * Second pass, NR-SACK only: the same walk over nr_mapping_array,
 	 * counted separately in num_nr_gap_blocks.
 	 */
 	if ((type == SCTP_NR_SELECTIVE_ACK) &&
 	    (limit_reached == 0)) {
 		mergeable = 0;
 
 		if (asoc->highest_tsn_inside_nr_map > asoc->mapping_array_base_tsn) {
 			siz = (((asoc->highest_tsn_inside_nr_map - asoc->mapping_array_base_tsn) + 1) + 7) / 8;
 		} else {
 			siz = (((MAX_TSN - asoc->mapping_array_base_tsn) + 1) + asoc->highest_tsn_inside_nr_map + 7) / 8;
 		}
 
 		if (SCTP_TSN_GT(asoc->mapping_array_base_tsn, asoc->cumulative_tsn)) {
 			offset = 1;
 		} else {
 			offset = asoc->mapping_array_base_tsn - asoc->cumulative_tsn;
 		}
 		if (SCTP_TSN_GT(asoc->highest_tsn_inside_nr_map, asoc->cumulative_tsn)) {
 			/* we have a gap .. maybe */
 			for (i = 0; i < siz; i++) {
 				tsn_map = asoc->nr_mapping_array[i];
 				if (i == 0) {
 					/*
 					 * Clear all bits corresponding to
 					 * TSNs smaller or equal to the
 					 * cumulative TSN.
 					 */
 					tsn_map &= (~0U << (1 - offset));
 				}
 				selector = &sack_array[tsn_map];
 				if (mergeable && selector->right_edge) {
 					/*
 					 * Backup, left and right edges were
 					 * ok to merge.
 					 */
 					num_nr_gap_blocks--;
 					gap_descriptor--;
 				}
 				if (selector->num_entries == 0)
 					mergeable = 0;
 				else {
 					for (j = 0; j < selector->num_entries; j++) {
 						if (mergeable && selector->right_edge) {
 							/*
 							 * do a merge by NOT
 							 * setting the left
 							 * side
 							 */
 							mergeable = 0;
 						} else {
 							/*
 							 * no merge, set the
 							 * left side
 							 */
 							mergeable = 0;
 							gap_descriptor->start = htons((selector->gaps[j].start + offset));
 						}
 						gap_descriptor->end = htons((selector->gaps[j].end + offset));
 						num_nr_gap_blocks++;
 						gap_descriptor++;
 						if (((caddr_t)gap_descriptor + sizeof(struct sctp_gap_ack_block)) > limit) {
 							/* no more room */
 							limit_reached = 1;
 							break;
 						}
 					}
 					if (selector->left_edge) {
 						mergeable = 1;
 					}
 				}
 				if (limit_reached) {
 					/* Reached the limit stop */
 					break;
 				}
 				offset += 8;
 			}
 		}
 	}
 	/* now we must add any dups we are going to report. */
 	if ((limit_reached == 0) && (asoc->numduptsns)) {
 		dup = (uint32_t *)gap_descriptor;
 		for (i = 0; i < asoc->numduptsns; i++) {
 			*dup = htonl(asoc->dup_tsns[i]);
 			dup++;
 			num_dups++;
 			if (((caddr_t)dup + sizeof(uint32_t)) > limit) {
 				/* no more room */
 				break;
 			}
 		}
 		/* The pending list is reset even when not every entry fit. */
 		asoc->numduptsns = 0;
 	}
 	/*
 	 * now that the chunk is prepared queue it to the control chunk
 	 * queue.
 	 */
 	if (type == SCTP_SELECTIVE_ACK) {
 		/* num_nr_gap_blocks stays 0 here: the NR pass only runs for NR-SACK. */
 		a_chk->send_size = (uint16_t)(sizeof(struct sctp_sack_chunk) +
 		    (num_gap_blocks + num_nr_gap_blocks) * sizeof(struct sctp_gap_ack_block) +
 		    num_dups * sizeof(int32_t));
 		SCTP_BUF_LEN(a_chk->data) = a_chk->send_size;
 		sack->sack.cum_tsn_ack = htonl(asoc->cumulative_tsn);
 		sack->sack.a_rwnd = htonl(asoc->my_rwnd);
 		sack->sack.num_gap_ack_blks = htons(num_gap_blocks);
 		sack->sack.num_dup_tsns = htons(num_dups);
 		sack->ch.chunk_type = type;
 		sack->ch.chunk_flags = flags;
 		sack->ch.chunk_length = htons(a_chk->send_size);
 	} else {
 		a_chk->send_size = (uint16_t)(sizeof(struct sctp_nr_sack_chunk) +
 		    (num_gap_blocks + num_nr_gap_blocks) * sizeof(struct sctp_gap_ack_block) +
 		    num_dups * sizeof(int32_t));
 		SCTP_BUF_LEN(a_chk->data) = a_chk->send_size;
 		nr_sack->nr_sack.cum_tsn_ack = htonl(asoc->cumulative_tsn);
 		nr_sack->nr_sack.a_rwnd = htonl(asoc->my_rwnd);
 		nr_sack->nr_sack.num_gap_ack_blks = htons(num_gap_blocks);
 		nr_sack->nr_sack.num_nr_gap_ack_blks = htons(num_nr_gap_blocks);
 		nr_sack->nr_sack.num_dup_tsns = htons(num_dups);
 		nr_sack->nr_sack.reserved = 0;
 		nr_sack->ch.chunk_type = type;
 		nr_sack->ch.chunk_flags = flags;
 		nr_sack->ch.chunk_length = htons(a_chk->send_size);
 	}
 	TAILQ_INSERT_TAIL(&asoc->control_send_queue, a_chk, sctp_next);
 	/* Remember the window we just advertised and clear the pending flag. */
 	asoc->my_last_reported_rwnd = asoc->my_rwnd;
 	asoc->ctrl_queue_cnt++;
 	asoc->send_sack = 0;
 	SCTP_STAT_INCR(sctps_sendsacks);
 	return;
 }
 
 void
 sctp_send_abort_tcb(struct sctp_tcb *stcb, struct mbuf *operr, int so_locked)
 {
 	struct mbuf *m_abort, *m, *m_last;
 	struct mbuf *m_out, *m_end = NULL;
 	struct sctp_abort_chunk *abort;
 	struct sctp_auth_chunk *auth = NULL;
 	struct sctp_nets *net;
 	uint32_t vtag;
 	uint32_t auth_offset = 0;
 	int error;
 	uint16_t cause_len, chunk_len, padding_len;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	/*-
 	 * Add an AUTH chunk, if chunk requires it and save the offset into
 	 * the chain for AUTH
 	 */
 	if (sctp_auth_is_required_chunk(SCTP_ABORT_ASSOCIATION,
 	    stcb->asoc.peer_auth_chunks)) {
 		m_out = sctp_add_auth_chunk(NULL, &m_end, &auth, &auth_offset,
 		    stcb, SCTP_ABORT_ASSOCIATION);
 		SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 	} else {
 		m_out = NULL;
 	}
 	m_abort = sctp_get_mbuf_for_msg(sizeof(struct sctp_abort_chunk), 0, M_NOWAIT, 1, MT_HEADER);
 	if (m_abort == NULL) {
 		if (m_out) {
 			sctp_m_freem(m_out);
 		}
 		if (operr) {
 			sctp_m_freem(operr);
 		}
 		return;
 	}
 	/* link in any error */
 	SCTP_BUF_NEXT(m_abort) = operr;
 	cause_len = 0;
 	m_last = NULL;
 	for (m = operr; m; m = SCTP_BUF_NEXT(m)) {
 		cause_len += (uint16_t)SCTP_BUF_LEN(m);
 		if (SCTP_BUF_NEXT(m) == NULL) {
 			m_last = m;
 		}
 	}
 	SCTP_BUF_LEN(m_abort) = sizeof(struct sctp_abort_chunk);
 	chunk_len = (uint16_t)sizeof(struct sctp_abort_chunk) + cause_len;
 	padding_len = SCTP_SIZE32(chunk_len) - chunk_len;
 	if (m_out == NULL) {
 		/* NO Auth chunk prepended, so reserve space in front */
 		SCTP_BUF_RESV_UF(m_abort, SCTP_MIN_OVERHEAD);
 		m_out = m_abort;
 	} else {
 		/* Put AUTH chunk at the front of the chain */
 		SCTP_BUF_NEXT(m_end) = m_abort;
 	}
 	if (stcb->asoc.alternate) {
 		net = stcb->asoc.alternate;
 	} else {
 		net = stcb->asoc.primary_destination;
 	}
 	/* Fill in the ABORT chunk header. */
 	abort = mtod(m_abort, struct sctp_abort_chunk *);
 	abort->ch.chunk_type = SCTP_ABORT_ASSOCIATION;
 	if (stcb->asoc.peer_vtag == 0) {
 		/* This happens iff the assoc is in COOKIE-WAIT state. */
 		vtag = stcb->asoc.my_vtag;
 		abort->ch.chunk_flags = SCTP_HAD_NO_TCB;
 	} else {
 		vtag = stcb->asoc.peer_vtag;
 		abort->ch.chunk_flags = 0;
 	}
 	abort->ch.chunk_length = htons(chunk_len);
 	/* Add padding, if necessary. */
 	if (padding_len > 0) {
 		if ((m_last == NULL) ||
 		    (sctp_add_pad_tombuf(m_last, padding_len) == NULL)) {
 			sctp_m_freem(m_out);
 			return;
 		}
 	}
 	if ((error = sctp_lowlevel_chunk_output(stcb->sctp_ep, stcb, net,
 	    (struct sockaddr *)&net->ro._l_addr,
 	    m_out, auth_offset, auth, stcb->asoc.authinfo.active_keyid, 1, 0, 0,
 	    stcb->sctp_ep->sctp_lport, stcb->rport, htonl(vtag),
 	    stcb->asoc.primary_destination->port, NULL,
 	    0, 0,
 	    stcb->asoc.zero_checksum == 2,
 	    so_locked))) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT3, "Gak send error %d\n", error);
 		if (error == ENOBUFS) {
 			stcb->asoc.ifp_had_enobuf = 1;
 			SCTP_STAT_INCR(sctps_lowlevelerr);
 		}
 	} else {
 		stcb->asoc.ifp_had_enobuf = 0;
 	}
 	SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 }
 
 void
 sctp_send_shutdown_complete(struct sctp_tcb *stcb,
     struct sctp_nets *net,
     int reflect_vtag)
 {
 	/* formulate and SEND a SHUTDOWN-COMPLETE */
 	struct mbuf *m_shutdown_comp;
 	struct sctp_shutdown_complete_chunk *shutdown_complete;
 	uint32_t vtag;
 	int error;
 	uint8_t flags;
 
 	m_shutdown_comp = sctp_get_mbuf_for_msg(sizeof(struct sctp_chunkhdr), 0, M_NOWAIT, 1, MT_HEADER);
 	if (m_shutdown_comp == NULL) {
 		/* no mbuf's */
 		return;
 	}
 	if (reflect_vtag) {
 		flags = SCTP_HAD_NO_TCB;
 		vtag = stcb->asoc.my_vtag;
 	} else {
 		flags = 0;
 		vtag = stcb->asoc.peer_vtag;
 	}
 	shutdown_complete = mtod(m_shutdown_comp, struct sctp_shutdown_complete_chunk *);
 	shutdown_complete->ch.chunk_type = SCTP_SHUTDOWN_COMPLETE;
 	shutdown_complete->ch.chunk_flags = flags;
 	shutdown_complete->ch.chunk_length = htons(sizeof(struct sctp_shutdown_complete_chunk));
 	SCTP_BUF_LEN(m_shutdown_comp) = sizeof(struct sctp_shutdown_complete_chunk);
 	if ((error = sctp_lowlevel_chunk_output(stcb->sctp_ep, stcb, net,
 	    (struct sockaddr *)&net->ro._l_addr,
 	    m_shutdown_comp, 0, NULL, 0, 1, 0, 0,
 	    stcb->sctp_ep->sctp_lport, stcb->rport,
 	    htonl(vtag),
 	    net->port, NULL,
 	    0, 0,
 	    stcb->asoc.zero_checksum == 2,
 	    SCTP_SO_NOT_LOCKED))) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT3, "Gak send error %d\n", error);
 		if (error == ENOBUFS) {
 			stcb->asoc.ifp_had_enobuf = 1;
 			SCTP_STAT_INCR(sctps_lowlevelerr);
 		}
 	} else {
 		stcb->asoc.ifp_had_enobuf = 0;
 	}
 	SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 	return;
 }
 
 /*
  * Build and transmit a stand-alone SCTP packet holding a single chunk of
  * the given type, addressed back to the sender of a received packet.  No
  * association state is used; everything comes from the arguments.
  *
  * src, dst:  addresses of the received packet.  The reply is sent from dst
  *            to src; dst->sa_family selects the IP version.
  * sh:        SCTP common header of the received packet; its ports are
  *            swapped into the reply.
  * vtag:      when non-zero it is the verification tag of the reply and the
  *            chunk flags are 0.  When zero, sh->v_tag is copied and the
  *            chunk carries SCTP_HAD_NO_TCB.
  * type:      chunk type to emit.
  * cause:     optional mbuf chain appended after the chunk header.  It is
  *            freed explicitly on the early failure paths and otherwise
  *            linked behind the header mbuf (later frees go through
  *            sctp_m_freem(mout), presumably releasing the whole chain).
  * mflowtype, mflowid, fibnum: copied into the outgoing mbuf's packet header.
  * vrf_id:    passed to the IP output macros.
  * port:      non-zero requests UDP encapsulation with this destination
  *            port.  It is stored as-is, so it is presumably already in
  *            network byte order -- confirm with callers.
  */
 static void
 sctp_send_resp_msg(struct sockaddr *src, struct sockaddr *dst,
     struct sctphdr *sh, uint32_t vtag,
     uint8_t type, struct mbuf *cause,
     uint8_t mflowtype, uint32_t mflowid, uint16_t fibnum,
     uint32_t vrf_id, uint16_t port)
 {
 	struct mbuf *o_pak;
 	struct mbuf *mout;
 	struct sctphdr *shout;
 	struct sctp_chunkhdr *ch;
 #if defined(INET) || defined(INET6)
 	struct udphdr *udp;
 #endif
 	int ret, len, cause_len, padding_len;
 #ifdef INET
 	struct sockaddr_in *src_sin, *dst_sin;
 	struct ip *ip;
 #endif
 #ifdef INET6
 	struct sockaddr_in6 *src_sin6, *dst_sin6;
 	struct ip6_hdr *ip6;
 #endif
 
 	/* Compute the length of the cause and add final padding. */
 	cause_len = 0;
 	if (cause != NULL) {
 		struct mbuf *m_at, *m_last = NULL;
 
 		for (m_at = cause; m_at; m_at = SCTP_BUF_NEXT(m_at)) {
 			if (SCTP_BUF_NEXT(m_at) == NULL)
 				m_last = m_at;
 			cause_len += SCTP_BUF_LEN(m_at);
 		}
 		/*
 		 * Round up to a multiple of 4.  The pad bytes are tracked in
 		 * padding_len only; cause_len (and thus the chunk length
 		 * field) stays unpadded.
 		 */
 		padding_len = cause_len % 4;
 		if (padding_len != 0) {
 			padding_len = 4 - padding_len;
 		}
 		if (padding_len != 0) {
 			if (sctp_add_pad_tombuf(m_last, padding_len) == NULL) {
 				sctp_m_freem(cause);
 				return;
 			}
 		}
 	} else {
 		padding_len = 0;
 	}
 	/* Get an mbuf for the header. */
 	len = sizeof(struct sctphdr) + sizeof(struct sctp_chunkhdr);
 	switch (dst->sa_family) {
 #ifdef INET
 	case AF_INET:
 		len += sizeof(struct ip);
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		len += sizeof(struct ip6_hdr);
 		break;
 #endif
 	default:
 		break;
 	}
 #if defined(INET) || defined(INET6)
 	if (port) {
 		len += sizeof(struct udphdr);
 	}
 #endif
 	mout = sctp_get_mbuf_for_msg(len + max_linkhdr, 1, M_NOWAIT, 1, MT_DATA);
 	if (mout == NULL) {
 		if (cause) {
 			sctp_m_freem(cause);
 		}
 		return;
 	}
 	/* Leave room for a link-layer header, then chain the cause behind. */
 	SCTP_BUF_RESV_UF(mout, max_linkhdr);
 	SCTP_BUF_LEN(mout) = len;
 	SCTP_BUF_NEXT(mout) = cause;
 	M_SETFIB(mout, fibnum);
 	mout->m_pkthdr.flowid = mflowid;
 	M_HASHTYPE_SET(mout, mflowtype);
 #ifdef INET
 	ip = NULL;
 #endif
 #ifdef INET6
 	ip6 = NULL;
 #endif
 	/*
 	 * Fill in the IP header.  From here on len is reused as a running
 	 * total of the header bytes written so far.
 	 */
 	switch (dst->sa_family) {
 #ifdef INET
 	case AF_INET:
 		src_sin = (struct sockaddr_in *)src;
 		dst_sin = (struct sockaddr_in *)dst;
 		ip = mtod(mout, struct ip *);
 		ip->ip_v = IPVERSION;
 		ip->ip_hl = (sizeof(struct ip) >> 2);
 		ip->ip_tos = 0;
 		ip->ip_off = htons(IP_DF);
 		ip_fillid(ip);
 		ip->ip_ttl = MODULE_GLOBAL(ip_defttl);
 		if (port) {
 			ip->ip_p = IPPROTO_UDP;
 		} else {
 			ip->ip_p = IPPROTO_SCTP;
 		}
 		/* Reply direction: received dst becomes our source. */
 		ip->ip_src.s_addr = dst_sin->sin_addr.s_addr;
 		ip->ip_dst.s_addr = src_sin->sin_addr.s_addr;
 		ip->ip_sum = 0;
 		len = sizeof(struct ip);
 		shout = (struct sctphdr *)((caddr_t)ip + len);
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		src_sin6 = (struct sockaddr_in6 *)src;
 		dst_sin6 = (struct sockaddr_in6 *)dst;
 		ip6 = mtod(mout, struct ip6_hdr *);
 		ip6->ip6_flow = htonl(0x60000000);
 		if (V_ip6_auto_flowlabel) {
 			ip6->ip6_flow |= (htonl(ip6_randomflowlabel()) & IPV6_FLOWLABEL_MASK);
 		}
 		ip6->ip6_hlim = MODULE_GLOBAL(ip6_defhlim);
 		if (port) {
 			ip6->ip6_nxt = IPPROTO_UDP;
 		} else {
 			ip6->ip6_nxt = IPPROTO_SCTP;
 		}
 		/* Reply direction: received dst becomes our source. */
 		ip6->ip6_src = dst_sin6->sin6_addr;
 		ip6->ip6_dst = src_sin6->sin6_addr;
 		len = sizeof(struct ip6_hdr);
 		shout = (struct sctphdr *)((caddr_t)ip6 + len);
 		break;
 #endif
 	default:
 		len = 0;
 		shout = mtod(mout, struct sctphdr *);
 		break;
 	}
 #if defined(INET) || defined(INET6)
 	if (port) {
 		/* Without a configured local tunneling port nothing is sent. */
 		if (htons(SCTP_BASE_SYSCTL(sctp_udp_tunneling_port)) == 0) {
 			sctp_m_freem(mout);
 			return;
 		}
 		/* The UDP header sits where the SCTP header would have been. */
 		udp = (struct udphdr *)shout;
 		udp->uh_sport = htons(SCTP_BASE_SYSCTL(sctp_udp_tunneling_port));
 		udp->uh_dport = port;
 		udp->uh_sum = 0;
 		udp->uh_ulen = htons((uint16_t)(sizeof(struct udphdr) +
 		    sizeof(struct sctphdr) +
 		    sizeof(struct sctp_chunkhdr) +
 		    cause_len + padding_len));
 		len += sizeof(struct udphdr);
 		shout = (struct sctphdr *)((caddr_t)shout + sizeof(struct udphdr));
 	} else {
 		udp = NULL;
 	}
 #endif
 	/* SCTP common header: ports swapped relative to the received packet. */
 	shout->src_port = sh->dest_port;
 	shout->dest_port = sh->src_port;
 	shout->checksum = 0;
 	if (vtag) {
 		shout->v_tag = htonl(vtag);
 	} else {
 		/* No tag supplied: reflect the one from the received packet. */
 		shout->v_tag = sh->v_tag;
 	}
 	len += sizeof(struct sctphdr);
 	ch = (struct sctp_chunkhdr *)((caddr_t)shout + sizeof(struct sctphdr));
 	ch->chunk_type = type;
 	if (vtag) {
 		ch->chunk_flags = 0;
 	} else {
 		ch->chunk_flags = SCTP_HAD_NO_TCB;
 	}
 	ch->chunk_length = htons((uint16_t)(sizeof(struct sctp_chunkhdr) + cause_len));
 	len += sizeof(struct sctp_chunkhdr);
 	len += cause_len + padding_len;
 
 	if (SCTP_GET_HEADER_FOR_OUTPUT(o_pak)) {
 		sctp_m_freem(mout);
 		return;
 	}
 	SCTP_ATTACH_CHAIN(o_pak, mout, len);
 	/* Finish length/checksum fields per address family and transmit. */
 	switch (dst->sa_family) {
 #ifdef INET
 	case AF_INET:
 		if (port) {
 			if (V_udp_cksum) {
 				udp->uh_sum = in_pseudo(ip->ip_src.s_addr, ip->ip_dst.s_addr, udp->uh_ulen + htons(IPPROTO_UDP));
 			} else {
 				udp->uh_sum = 0;
 			}
 		}
 		ip->ip_len = htons(len);
 		if (port) {
 			/* Encapsulated: the SCTP checksum is computed here. */
 			shout->checksum = sctp_calculate_cksum(mout, sizeof(struct ip) + sizeof(struct udphdr));
 			SCTP_STAT_INCR(sctps_sendswcrc);
 			if (V_udp_cksum) {
 				SCTP_ENABLE_UDP_CSUM(o_pak);
 			}
 		} else {
 			/* Plain SCTP: request checksum insertion via csum_flags. */
 			mout->m_pkthdr.csum_flags = CSUM_SCTP;
 			mout->m_pkthdr.csum_data = offsetof(struct sctphdr, checksum);
 			SCTP_STAT_INCR(sctps_sendhwcrc);
 		}
 #ifdef SCTP_PACKET_LOGGING
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LAST_PACKET_TRACING) {
 			sctp_packet_log(o_pak);
 		}
 #endif
 		SCTP_PROBE5(send, NULL, NULL, ip, NULL, shout);
 		SCTP_IP_OUTPUT(ret, o_pak, NULL, NULL, vrf_id);
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		ip6->ip6_plen = htons((uint16_t)(len - sizeof(struct ip6_hdr)));
 		if (port) {
 			shout->checksum = sctp_calculate_cksum(mout, sizeof(struct ip6_hdr) + sizeof(struct udphdr));
 			SCTP_STAT_INCR(sctps_sendswcrc);
 			/* A computed UDP checksum of 0 is sent as 0xffff. */
 			if ((udp->uh_sum = in6_cksum(o_pak, IPPROTO_UDP, sizeof(struct ip6_hdr), len - sizeof(struct ip6_hdr))) == 0) {
 				udp->uh_sum = 0xffff;
 			}
 		} else {
 			mout->m_pkthdr.csum_flags = CSUM_SCTP_IPV6;
 			mout->m_pkthdr.csum_data = offsetof(struct sctphdr, checksum);
 			SCTP_STAT_INCR(sctps_sendhwcrc);
 		}
 #ifdef SCTP_PACKET_LOGGING
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_LAST_PACKET_TRACING) {
 			sctp_packet_log(o_pak);
 		}
 #endif
 		SCTP_PROBE5(send, NULL, NULL, ip6, NULL, shout);
 		SCTP_IP6_OUTPUT(ret, o_pak, NULL, NULL, NULL, vrf_id);
 		break;
 #endif
 	default:
 		/* Unsupported address family: discard the packet unsent. */
 		SCTPDBG(SCTP_DEBUG_OUTPUT1, "Unknown protocol (TSNH) type %d\n",
 		    dst->sa_family);
 		sctp_m_freem(mout);
 		SCTP_LTRACE_ERR_RET_PKT(mout, NULL, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, EFAULT);
 		return;
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT3, "return from send is %d\n", ret);
 	if (port) {
 		UDPSTAT_INC(udps_opackets);
 	}
 	SCTP_STAT_INCR(sctps_sendpackets);
 	SCTP_STAT_INCR_COUNTER64(sctps_outpackets);
 	SCTP_STAT_INCR_COUNTER64(sctps_outcontrolchunks);
 	if (ret) {
 		SCTP_STAT_INCR(sctps_senderrors);
 	}
 	return;
 }
 
 /*
  * Send a SHUTDOWN-COMPLETE in reply to a received packet without using any
  * association state.  This is a thin wrapper around sctp_send_resp_msg()
  * that supplies a zero verification tag and no error cause; all remaining
  * arguments are forwarded unchanged.
  */
 void
 sctp_send_shutdown_complete2(struct sockaddr *src, struct sockaddr *dst,
     struct sctphdr *sh,
     uint8_t mflowtype, uint32_t mflowid, uint16_t fibnum,
     uint32_t vrf_id, uint16_t port)
 {
 	const uint32_t no_vtag = 0;
 	struct mbuf *const no_cause = NULL;
 
 	sctp_send_resp_msg(src, dst, sh,
 	    no_vtag, SCTP_SHUTDOWN_COMPLETE, no_cause,
 	    mflowtype, mflowid, fibnum, vrf_id, port);
 }
 
 void
 sctp_send_hb(struct sctp_tcb *stcb, struct sctp_nets *net, int so_locked)
 {
 	struct sctp_tmit_chunk *chk;
 	struct sctp_heartbeat_chunk *hb;
 	struct timeval now;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	if (net == NULL) {
 		return;
 	}
 	(void)SCTP_GETTIME_TIMEVAL(&now);
 	switch (net->ro._l_addr.sa.sa_family) {
 #ifdef INET
 	case AF_INET:
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		break;
 #endif
 	default:
 		return;
 	}
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		SCTPDBG(SCTP_DEBUG_OUTPUT4, "Gak, can't get a chunk for hb\n");
 		return;
 	}
 
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_HEARTBEAT_REQUEST;
 	chk->rec.chunk_id.can_take_data = 1;
 	chk->flags = 0;
 	chk->asoc = &stcb->asoc;
 	chk->send_size = sizeof(struct sctp_heartbeat_chunk);
 
 	chk->data = sctp_get_mbuf_for_msg(chk->send_size, 0, M_NOWAIT, 1, MT_HEADER);
 	if (chk->data == NULL) {
 		sctp_free_a_chunk(stcb, chk, so_locked);
 		return;
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	chk->whoTo = net;
 	atomic_add_int(&chk->whoTo->ref_count, 1);
 	/* Now we have a mbuf that we can fill in with the details */
 	hb = mtod(chk->data, struct sctp_heartbeat_chunk *);
 	memset(hb, 0, sizeof(struct sctp_heartbeat_chunk));
 	/* fill out chunk header */
 	hb->ch.chunk_type = SCTP_HEARTBEAT_REQUEST;
 	hb->ch.chunk_flags = 0;
 	hb->ch.chunk_length = htons(chk->send_size);
 	/* Fill out hb parameter */
 	hb->heartbeat.hb_info.ph.param_type = htons(SCTP_HEARTBEAT_INFO);
 	hb->heartbeat.hb_info.ph.param_length = htons(sizeof(struct sctp_heartbeat_info_param));
 	hb->heartbeat.hb_info.time_value_1 = (uint32_t)now.tv_sec;
 	hb->heartbeat.hb_info.time_value_2 = now.tv_usec;
 	/* Did our user request this one, put it in */
 	hb->heartbeat.hb_info.addr_family = (uint8_t)net->ro._l_addr.sa.sa_family;
 	hb->heartbeat.hb_info.addr_len = net->ro._l_addr.sa.sa_len;
 	if (net->dest_state & SCTP_ADDR_UNCONFIRMED) {
 		/*
 		 * we only take from the entropy pool if the address is not
 		 * confirmed.
 		 */
 		net->heartbeat_random1 = hb->heartbeat.hb_info.random_value1 = sctp_select_initial_TSN(&stcb->sctp_ep->sctp_ep);
 		net->heartbeat_random2 = hb->heartbeat.hb_info.random_value2 = sctp_select_initial_TSN(&stcb->sctp_ep->sctp_ep);
 	} else {
 		net->heartbeat_random1 = hb->heartbeat.hb_info.random_value1 = 0;
 		net->heartbeat_random2 = hb->heartbeat.hb_info.random_value2 = 0;
 	}
 	switch (net->ro._l_addr.sa.sa_family) {
 #ifdef INET
 	case AF_INET:
 		memcpy(hb->heartbeat.hb_info.address,
 		    &net->ro._l_addr.sin.sin_addr,
 		    sizeof(net->ro._l_addr.sin.sin_addr));
 		break;
 #endif
 #ifdef INET6
 	case AF_INET6:
 		memcpy(hb->heartbeat.hb_info.address,
 		    &net->ro._l_addr.sin6.sin6_addr,
 		    sizeof(net->ro._l_addr.sin6.sin6_addr));
 		break;
 #endif
 	default:
 		if (chk->data) {
 			sctp_m_freem(chk->data);
 			chk->data = NULL;
 		}
 		sctp_free_a_chunk(stcb, chk, so_locked);
 		return;
 		break;
 	}
 	net->hb_responded = 0;
 	TAILQ_INSERT_TAIL(&stcb->asoc.control_send_queue, chk, sctp_next);
 	stcb->asoc.ctrl_queue_cnt++;
 	SCTP_STAT_INCR(sctps_sendheartbeat);
 	return;
 }
 
 /*
  * Queue an ECN-ECHO chunk for net, or refresh one that is already queued.
  *
  * stcb:     association; SCTP_TCB_LOCK_ASSERT() is applied.
  * net:      destination the ECNE is bound to; NULL makes this a no-op.
  * high_tsn: TSN to report.
  *
  * When an ECN-ECHO for the same destination already sits on the control
  * send queue, its TSN is raised to high_tsn if that is newer and its
  * num_pkts_since_cwr counter is incremented.  Otherwise a new chunk with a
  * count of 1 is inserted at the head of the control send queue.
  */
 void
 sctp_send_ecn_echo(struct sctp_tcb *stcb, struct sctp_nets *net,
     uint32_t high_tsn)
 {
 	struct sctp_association *asoc;
 	struct sctp_tmit_chunk *chk;
 	struct sctp_ecne_chunk *ecne;
 
 	if (net == NULL) {
 		return;
 	}
 	asoc = &stcb->asoc;
 	SCTP_TCB_LOCK_ASSERT(stcb);
 
 	/* Look for an ECNE towards this destination that can be updated. */
 	TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
 		uint32_t queued_tsn, pkt_cnt;
 
 		if ((chk->rec.chunk_id.id != SCTP_ECN_ECHO) ||
 		    (chk->whoTo != net)) {
 			continue;
 		}
 		ecne = mtod(chk->data, struct sctp_ecne_chunk *);
 		queued_tsn = ntohl(ecne->tsn);
 		if (SCTP_TSN_GT(high_tsn, queued_tsn)) {
 			ecne->tsn = htonl(high_tsn);
 			SCTP_STAT_INCR(sctps_queue_upd_ecne);
 		}
 		pkt_cnt = ntohl(ecne->num_pkts_since_cwr);
 		pkt_cnt++;
 		ecne->num_pkts_since_cwr = htonl(pkt_cnt);
 		return;
 	}
 
 	/* Nothing to update, so a fresh chunk has to be built. */
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		return;
 	}
 	SCTP_STAT_INCR(sctps_queue_upd_ecne);
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_ECN_ECHO;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->flags = 0;
 	chk->asoc = asoc;
 	chk->send_size = sizeof(struct sctp_ecne_chunk);
 	chk->data = sctp_get_mbuf_for_msg(chk->send_size, 0, M_NOWAIT, 1,
 	    MT_HEADER);
 	if (chk->data == NULL) {
 		sctp_free_a_chunk(stcb, chk, SCTP_SO_NOT_LOCKED);
 		return;
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	/* The queued chunk keeps a reference on its destination. */
 	chk->whoTo = net;
 	atomic_add_int(&chk->whoTo->ref_count, 1);
 
 	asoc->ecn_echo_cnt_onq++;
 
 	/* Fill in the wire format. */
 	ecne = mtod(chk->data, struct sctp_ecne_chunk *);
 	ecne->ch.chunk_type = SCTP_ECN_ECHO;
 	ecne->ch.chunk_flags = 0;
 	ecne->ch.chunk_length = htons(sizeof(struct sctp_ecne_chunk));
 	ecne->tsn = htonl(high_tsn);
 	ecne->num_pkts_since_cwr = htonl(1);
 
 	/* Placed at the head of the control queue rather than the tail. */
 	TAILQ_INSERT_HEAD(&asoc->control_send_queue, chk, sctp_next);
 	asoc->ctrl_queue_cnt++;
 }
 
 /*
  * Queue a PACKET-DROPPED chunk that reflects (part of) a received packet
  * back to the peer.
  *
  * stcb    - association the report is queued on; NULL makes this a no-op.
  * net     - destination for the report; when non-NULL a reference is
  *           taken on it, otherwise the chunk is queued with whoTo == NULL.
  * m       - mbuf chain holding the received packet.
  * len     - packet length; iphlen is subtracted from it below, so it is
  *           presumably the length including the IP header (confirm with
  *           callers).
  * iphlen  - offset in `m` at which the SCTP common header starts.
  * bad_crc - non-zero sets the SCTP_BADCRC flag in the report.
  *
  * Nothing is sent when the peer did not declare PKT-DROP support, when
  * the socket is gone, when the packet contains a PACKET-DROPPED, ABORT or
  * INIT-ACK chunk, or when a chunk/mbuf cannot be allocated.  The reflected
  * data is truncated so that the report fits in
  * min(smallest_mtu, MCLBYTES).
  */
 void
 sctp_send_packet_dropped(struct sctp_tcb *stcb, struct sctp_nets *net,
     struct mbuf *m, int len, int iphlen, int bad_crc)
 {
 	struct sctp_association *asoc;
 	struct sctp_pktdrop_chunk *drp;
 	struct sctp_tmit_chunk *chk;
 	uint8_t *datap;
 	int was_trunc = 0;
 	int fullsz = 0;
 	long spc;
 	int offset;
 	struct sctp_chunkhdr *ch, chunk_buf;
 	unsigned int chk_length;
 
 	if (!stcb) {
 		return;
 	}
 	asoc = &stcb->asoc;
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	if (asoc->pktdrop_supported == 0) {
 		/*-
 		 * The peer must declare support before we send one.
 		 */
 		return;
 	}
 	if (stcb->sctp_socket == NULL) {
 		/* The socket is dereferenced below for the buffer numbers. */
 		return;
 	}
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		return;
 	}
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_PACKET_DROPPED;
 	chk->rec.chunk_id.can_take_data = 1;
 	chk->flags = 0;
 	/* From here on len no longer includes the first iphlen bytes. */
 	len -= iphlen;
 	chk->send_size = len;
 	/*
 	 * Walk the chunk headers of the received packet, starting right
 	 * after the SCTP common header, to validate that we do not have an
 	 * ABORT (or another chunk type we must not answer) in here.
 	 */
 	offset = iphlen + sizeof(struct sctphdr);
 	ch = (struct sctp_chunkhdr *)sctp_m_getptr(m, offset,
 	    sizeof(*ch), (uint8_t *)&chunk_buf);
 	while (ch != NULL) {
 		chk_length = ntohs(ch->chunk_length);
 		if (chk_length < sizeof(*ch)) {
 			/* Malformed length: stop scanning and go on. */
 			break;
 		}
 		switch (ch->chunk_type) {
 		case SCTP_PACKET_DROPPED:
 		case SCTP_ABORT_ASSOCIATION:
 		case SCTP_INITIATION_ACK:
 			/*
 			 * We don't respond with a PKT-DROP to an ABORT
 			 * or PKT-DROP. We also do not respond to an
 			 * INIT-ACK, because we can't know if the initiation
 			 * tag is correct or not.
 			 */
 			sctp_free_a_chunk(stcb, chk, SCTP_SO_NOT_LOCKED);
 			return;
 		default:
 			break;
 		}
 		/* Advance by the chunk length rounded up via SCTP_SIZE32(). */
 		offset += SCTP_SIZE32(chk_length);
 		ch = (struct sctp_chunkhdr *)sctp_m_getptr(m, offset,
 		    sizeof(*ch), (uint8_t *)&chunk_buf);
 	}
 
 	if ((len + SCTP_MAX_OVERHEAD + sizeof(struct sctp_pktdrop_chunk)) >
 	    min(stcb->asoc.smallest_mtu, MCLBYTES)) {
 		/*
 		 * Only send one MTU worth; trim off the excess on the end.
 		 * The untruncated length is remembered for trunc_len.
 		 */
 		fullsz = len;
 		len = min(stcb->asoc.smallest_mtu, MCLBYTES) - SCTP_MAX_OVERHEAD;
 		was_trunc = 1;
 	}
 	chk->asoc = &stcb->asoc;
 	chk->data = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_DATA);
 	if (chk->data == NULL) {
 		/*
 		 * Shared failure exit: also reached by the goto below, after
 		 * chk->data has been freed and cleared.
 		 */
 jump_out:
 		sctp_free_a_chunk(stcb, chk, SCTP_SO_NOT_LOCKED);
 		return;
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 	drp = mtod(chk->data, struct sctp_pktdrop_chunk *);
 	if (drp == NULL) {
 		/* Defensive check on the mbuf data pointer. */
 		sctp_m_freem(chk->data);
 		chk->data = NULL;
 		goto jump_out;
 	}
 	/*
 	 * Note that book_size is computed from the send_size assigned before
 	 * any truncation was applied.
 	 */
 	chk->book_size = SCTP_SIZE32((chk->send_size + sizeof(struct sctp_pktdrop_chunk) +
 	    sizeof(struct sctphdr) + SCTP_MED_OVERHEAD));
 	chk->book_size_scale = 0;
 	if (was_trunc) {
 		drp->ch.chunk_flags = SCTP_PACKET_TRUNCATED;
 		drp->trunc_len = htons(fullsz);
 		/*
 		 * len is already adjusted to size minus overhead above; take
 		 * out the pkt_drop chunk header itself from it.
 		 */
 		chk->send_size = (uint16_t)(len - sizeof(struct sctp_pktdrop_chunk));
 		len = chk->send_size;
 	} else {
 		/* No truncation needed. */
 		drp->ch.chunk_flags = 0;
 		drp->trunc_len = htons(0);
 	}
 	if (bad_crc) {
 		drp->ch.chunk_flags |= SCTP_BADCRC;
 	}
 	/* send_size now covers the chunk header plus the reflected bytes. */
 	chk->send_size += sizeof(struct sctp_pktdrop_chunk);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	if (net) {
 		/* We should hit here; the chunk holds a reference on net. */
 		chk->whoTo = net;
 		atomic_add_int(&chk->whoTo->ref_count, 1);
 	} else {
 		chk->whoTo = NULL;
 	}
 	drp->ch.chunk_type = SCTP_PACKET_DROPPED;
 	drp->ch.chunk_length = htons(chk->send_size);
 	/* Report the receive buffer limit, clamped at zero, as bottle_bw. */
 	spc = SCTP_SB_LIMIT_RCV(stcb->sctp_socket);
 	if (spc < 0) {
 		spc = 0;
 	}
 	drp->bottle_bw = htonl(spc);
 	if (asoc->my_rwnd) {
 		drp->current_onq = htonl(asoc->size_on_reasm_queue +
 		    asoc->size_on_all_streams +
 		    asoc->my_rwnd_control_len +
 		    SCTP_SBAVAIL(&stcb->sctp_socket->so_rcv));
 	} else {
 		/*-
 		 * If my rwnd is 0, possibly from mbuf depletion as well as
 		 * space used, tell the peer there is NO space aka onq == bw
 		 */
 		drp->current_onq = htonl(spc);
 	}
 	drp->reserved = 0;
 	/* Copy len bytes of the received packet, starting at iphlen. */
 	datap = drp->data;
 	m_copydata(m, iphlen, len, (caddr_t)datap);
 	TAILQ_INSERT_TAIL(&stcb->asoc.control_send_queue, chk, sctp_next);
 	asoc->ctrl_queue_cnt++;
 }
 
 /*
  * Queue a CWR chunk for destination `net` carrying `high_tsn`.
  *
  * A CWR already queued for the same destination is updated instead of
  * adding a second one: its TSN only moves forward, and the
  * SCTP_CWR_REDUCE_OVERRIDE flag is OR-ed in when `override` carries it.
  * Otherwise a new chunk, with `override` as its flags, is appended to the
  * control send queue.  Nothing is done when `net` is NULL or when a
  * chunk/mbuf cannot be allocated.
  */
 void
 sctp_send_cwr(struct sctp_tcb *stcb, struct sctp_nets *net, uint32_t high_tsn, uint8_t override)
 {
 	struct sctp_association *asoc;
 	struct sctp_tmit_chunk *chk;
 	struct sctp_cwr_chunk *cwr;
 	uint32_t queued_tsn;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	if (net == NULL) {
 		return;
 	}
 	asoc = &stcb->asoc;
 
 	/* Reuse a CWR that is still waiting for the same destination. */
 	TAILQ_FOREACH(chk, &asoc->control_send_queue, sctp_next) {
 		if ((chk->rec.chunk_id.id != SCTP_ECN_CWR) || (chk->whoTo != net)) {
 			continue;
 		}
 		cwr = mtod(chk->data, struct sctp_cwr_chunk *);
 		queued_tsn = ntohl(cwr->tsn);
 		if (SCTP_TSN_GT(high_tsn, queued_tsn)) {
 			cwr->tsn = htonl(high_tsn);
 		}
 		if (override & SCTP_CWR_REDUCE_OVERRIDE) {
 			/* The override request must not get lost. */
 			cwr->ch.chunk_flags |= SCTP_CWR_REDUCE_OVERRIDE;
 		}
 		return;
 	}
 
 	/* None queued yet, so build one. */
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		return;
 	}
 	chk->copy_by_ref = 0;
 	chk->flags = 0;
 	chk->rec.chunk_id.id = SCTP_ECN_CWR;
 	chk->rec.chunk_id.can_take_data = 1;
 	chk->asoc = asoc;
 	chk->send_size = sizeof(struct sctp_cwr_chunk);
 	chk->data = sctp_get_mbuf_for_msg(chk->send_size, 0, M_NOWAIT, 1, MT_HEADER);
 	if (chk->data == NULL) {
 		sctp_free_a_chunk(stcb, chk, SCTP_SO_NOT_LOCKED);
 		return;
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	/* The queued chunk holds a reference on its destination. */
 	chk->whoTo = net;
 	atomic_add_int(&net->ref_count, 1);
 
 	/* Fill in the wire format. */
 	cwr = mtod(chk->data, struct sctp_cwr_chunk *);
 	cwr->ch.chunk_type = SCTP_ECN_CWR;
 	cwr->ch.chunk_flags = override;
 	cwr->ch.chunk_length = htons(sizeof(struct sctp_cwr_chunk));
 	cwr->tsn = htonl(high_tsn);
 
 	TAILQ_INSERT_TAIL(&asoc->control_send_queue, chk, sctp_next);
 	asoc->ctrl_queue_cnt++;
 }
 
 /*
  * Append an Outgoing SSN Reset Request parameter to the stream reset
  * chunk held in chk->data.
  *
  * A stream is included when it is in state SCTP_STREAM_RESET_PENDING and
  * has neither chunks on queues nor anything in its outqueue.  When every
  * outgoing stream qualifies the stream list is left empty and all streams
  * are marked; otherwise at most SCTP_MAX_STREAMS_AT_ONCE_RESET streams are
  * listed.  Every stream covered by the request is moved to
  * SCTP_STREAM_RESET_IN_FLIGHT.
  *
  * Returns 1 when a parameter was added (chunk length, book_size, send_size
  * and the mbuf length are updated), or 0 when no stream qualifies, in
  * which case the chunk is left untouched.
  */
 static int
 sctp_add_stream_reset_out(struct sctp_tcb *stcb, struct sctp_tmit_chunk *chk,
     uint32_t seq, uint32_t resp_seq, uint32_t last_sent)
 {
 	struct sctp_association *asoc;
 	struct sctp_stream_out *strm;
 	struct sctp_stream_reset_out_request *req_out;
 	struct sctp_chunkhdr *ch;
 	uint16_t len, old_len, i;
 	int number_entries, at;
 
 	asoc = &stcb->asoc;
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	old_len = len = SCTP_SIZE32(ntohs(ch->chunk_length));
 	/* The new parameter starts right behind the padded chunk content. */
 	req_out = (struct sctp_stream_reset_out_request *)((caddr_t)ch + len);
 
 	/* Count the streams that can be reset right now. */
 	number_entries = 0;
 	for (i = 0; i < asoc->streamoutcnt; i++) {
 		strm = &asoc->strmout[i];
 		if ((strm->state == SCTP_STREAM_RESET_PENDING) &&
 		    (strm->chunks_on_queues == 0) &&
 		    TAILQ_EMPTY(&strm->outqueue)) {
 			number_entries++;
 		}
 	}
 	if (number_entries == 0) {
 		return (0);
 	}
 	if (number_entries == asoc->streamoutcnt) {
 		/* All streams: send the request with an empty list. */
 		number_entries = 0;
 	}
 	if (number_entries > SCTP_MAX_STREAMS_AT_ONCE_RESET) {
 		number_entries = SCTP_MAX_STREAMS_AT_ONCE_RESET;
 	}
 
 	/* Fixed part of the parameter. */
 	len = (uint16_t)(sizeof(struct sctp_stream_reset_out_request) + (sizeof(uint16_t) * number_entries));
 	req_out->ph.param_type = htons(SCTP_STR_RESET_OUT_REQUEST);
 	req_out->ph.param_length = htons(len);
 	req_out->request_seq = htonl(seq);
 	req_out->response_seq = htonl(resp_seq);
 	req_out->send_reset_at_tsn = htonl(last_sent);
 
 	if (number_entries == 0) {
 		/* Empty list: every outgoing stream is covered. */
 		for (i = 0; i < asoc->streamoutcnt; i++) {
 			asoc->strmout[i].state = SCTP_STREAM_RESET_IN_FLIGHT;
 		}
 	} else {
 		/* List qualifying streams until the list is full. */
 		at = 0;
 		for (i = 0; (i < asoc->streamoutcnt) && (at < number_entries); i++) {
 			strm = &asoc->strmout[i];
 			if ((strm->state != SCTP_STREAM_RESET_PENDING) ||
 			    (strm->chunks_on_queues != 0) ||
 			    !TAILQ_EMPTY(&strm->outqueue)) {
 				continue;
 			}
 			req_out->list_of_streams[at] = htons(i);
 			at++;
 			strm->state = SCTP_STREAM_RESET_IN_FLIGHT;
 		}
 	}
 	if (SCTP_SIZE32(len) > len) {
 		/*-
 		 * The parameter is either 4 byte aligned or 2 bytes off, so
 		 * clearing one more 16-bit slot zeroes the padding.
 		 */
 		req_out->list_of_streams[number_entries] = 0;
 	}
 
 	/* Account for the new parameter in the chunk. */
 	ch->chunk_length = htons(len + old_len);
 	chk->book_size = len + old_len;
 	chk->book_size_scale = 0;
 	chk->send_size = SCTP_SIZE32(chk->book_size);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	return (1);
 }
 
 /*
  * Append an Incoming SSN Reset Request parameter with request sequence
  * number `seq` to the stream reset chunk held in chk->data.
  *
  * The `number_entries` stream ids in `list` are copied into the parameter
  * in network byte order.  The chunk length, book_size, send_size and the
  * mbuf length are updated to cover the new parameter.
  */
 static void
 sctp_add_stream_reset_in(struct sctp_tmit_chunk *chk,
     int number_entries, uint16_t *list,
     uint32_t seq)
 {
 	struct sctp_stream_reset_in_request *req_in;
 	struct sctp_chunkhdr *ch;
 	uint16_t len, old_len, i;
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	old_len = len = SCTP_SIZE32(ntohs(ch->chunk_length));
 	/* The new parameter starts right behind the padded chunk content. */
 	req_in = (struct sctp_stream_reset_in_request *)((caddr_t)ch + len);
 
 	/* Fixed part followed by one 16-bit entry per stream. */
 	len = (uint16_t)(sizeof(struct sctp_stream_reset_in_request) + (sizeof(uint16_t) * number_entries));
 	req_in->ph.param_type = htons(SCTP_STR_RESET_IN_REQUEST);
 	req_in->ph.param_length = htons(len);
 	req_in->request_seq = htonl(seq);
 	for (i = 0; i < number_entries; i++) {
 		req_in->list_of_streams[i] = htons(list[i]);
 	}
 	if (SCTP_SIZE32(len) > len) {
 		/*-
 		 * The parameter is either 4 byte aligned or 2 bytes off, so
 		 * clearing one more 16-bit slot zeroes the padding.
 		 */
 		req_in->list_of_streams[number_entries] = 0;
 	}
 
 	/* Account for the new parameter in the chunk. */
 	ch->chunk_length = htons(len + old_len);
 	chk->book_size = len + old_len;
 	chk->book_size_scale = 0;
 	chk->send_size = SCTP_SIZE32(chk->book_size);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 }
 
 /*
  * Append an SSN/TSN Reset Request parameter with request sequence number
  * `seq` to the stream reset chunk held in chk->data, and update the chunk
  * length, send_size, book_size and the mbuf length accordingly.
  */
 static void
 sctp_add_stream_reset_tsn(struct sctp_tmit_chunk *chk,
     uint32_t seq)
 {
 	struct sctp_stream_reset_tsn_request *req_tsn;
 	struct sctp_chunkhdr *ch;
 	uint16_t len, old_len;
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	old_len = len = SCTP_SIZE32(ntohs(ch->chunk_length));
 	/* The new parameter starts right behind the padded chunk content. */
 	req_tsn = (struct sctp_stream_reset_tsn_request *)((caddr_t)ch + len);
 
 	/* This parameter has a fixed size. */
 	len = sizeof(struct sctp_stream_reset_tsn_request);
 	req_tsn->ph.param_type = htons(SCTP_STR_RESET_TSN_REQUEST);
 	req_tsn->ph.param_length = htons(len);
 	req_tsn->request_seq = htonl(seq);
 
 	/* Account for the new parameter in the chunk. */
 	ch->chunk_length = htons(len + old_len);
 	chk->send_size = len + old_len;
 	chk->book_size = SCTP_SIZE32(chk->send_size);
 	chk->book_size_scale = 0;
 	SCTP_BUF_LEN(chk->data) = SCTP_SIZE32(chk->send_size);
 }
 
 /*
  * Append a Re-configuration Response parameter to the stream reset chunk
  * held in chk->data.
  *
  * chk      - chunk whose mbuf starts with the stream reset chunk header.
  * resp_seq - sequence number of the request being answered.
  * result   - result code, in host byte order.
  *
  * The parameter is written right behind the current (padded) chunk
  * content and the chunk length, book_size, send_size and the mbuf length
  * are updated to cover it.  No bounds check is done here; the mbuf is
  * assumed to have room for the parameter (callers in this file allocate
  * MCLBYTES).
  */
 void
 sctp_add_stream_reset_result(struct sctp_tmit_chunk *chk,
     uint32_t resp_seq, uint32_t result)
 {
 	uint16_t len, old_len;
 	struct sctp_stream_reset_response *resp;
 	struct sctp_chunkhdr *ch;
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	old_len = len = SCTP_SIZE32(ntohs(ch->chunk_length));
 
 	/* get to new offset for the param. */
 	resp = (struct sctp_stream_reset_response *)((caddr_t)ch + len);
 	/* now how long will this param be? */
 	len = sizeof(struct sctp_stream_reset_response);
 	resp->ph.param_type = htons(SCTP_STR_RESET_RESPONSE);
 	resp->ph.param_length = htons(len);
 	resp->response_seq = htonl(resp_seq);
 	/*
 	 * Host to network conversion: this value goes onto the wire, so
 	 * htonl() is the right direction (as in
 	 * sctp_add_stream_reset_result_tsn()).
 	 */
 	resp->result = htonl(result);
 
 	/* now fix the chunk length */
 	ch->chunk_length = htons(len + old_len);
 	chk->book_size = len + old_len;
 	chk->book_size_scale = 0;
 	chk->send_size = SCTP_SIZE32(chk->book_size);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	return;
 }
 
 /*
  * Send the response to a stream reset request whose answer had been
  * deferred.
  *
  * `response` is recorded in asoc->last_reset_action[0] first, so that a
  * retransmitted request from the peer is answered with the new result
  * even if queuing the chunk fails here.  If one of our own stream reset
  * requests is outstanding, or a chunk/mbuf cannot be allocated, nothing
  * is queued.  Otherwise a STREAM-RESET chunk holding a single response
  * parameter for ent->seq is appended to the control send queue, addressed
  * to the alternate destination if one is set and to the primary
  * destination otherwise.
  */
 void
 sctp_send_deferred_reset_response(struct sctp_tcb *stcb,
     struct sctp_stream_reset_list *ent,
     int response)
 {
 	struct sctp_association *asoc;
 	struct sctp_tmit_chunk *chk;
 	struct sctp_chunkhdr *ch;
 
 	asoc = &stcb->asoc;
 
 	/* Remember the new result before anything can fail. */
 	asoc->last_reset_action[0] = response;
 	if (asoc->stream_reset_outstanding) {
 		return;
 	}
 
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return;
 	}
 	chk->copy_by_ref = 0;
 	chk->flags = 0;
 	chk->rec.chunk_id.id = SCTP_STREAM_RESET;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->asoc = asoc;
 	/* Start out with a bare chunk header; the parameter follows below. */
 	chk->book_size = sizeof(struct sctp_chunkhdr);
 	chk->book_size_scale = 0;
 	chk->send_size = SCTP_SIZE32(chk->book_size);
 	chk->data = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_DATA);
 	if (chk->data == NULL) {
 		sctp_free_a_chunk(stcb, chk, SCTP_SO_LOCKED);
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return;
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	/* Prefer the alternate destination when there is one. */
 	chk->whoTo = (asoc->alternate != NULL) ?
 	    asoc->alternate : asoc->primary_destination;
 	atomic_add_int(&chk->whoTo->ref_count, 1);
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	ch->chunk_type = SCTP_STREAM_RESET;
 	ch->chunk_flags = 0;
 	ch->chunk_length = htons(chk->book_size);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 	sctp_add_stream_reset_result(chk, ent->seq, response);
 
 	/* Hand the chunk over to the control send queue. */
 	TAILQ_INSERT_TAIL(&asoc->control_send_queue, chk, sctp_next);
 	asoc->ctrl_queue_cnt++;
 }
 
 /*
  * Append a Re-configuration Response parameter that also carries the
  * sender's and receiver's next TSN to the stream reset chunk held in
  * chk->data, and update the chunk length, book_size, send_size and the
  * mbuf length accordingly.  All values are passed in host byte order.
  */
 void
 sctp_add_stream_reset_result_tsn(struct sctp_tmit_chunk *chk,
     uint32_t resp_seq, uint32_t result,
     uint32_t send_una, uint32_t recv_next)
 {
 	struct sctp_stream_reset_response_tsn *resp;
 	struct sctp_chunkhdr *ch;
 	uint16_t len, old_len;
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	old_len = len = SCTP_SIZE32(ntohs(ch->chunk_length));
 	/* The new parameter starts right behind the padded chunk content. */
 	resp = (struct sctp_stream_reset_response_tsn *)((caddr_t)ch + len);
 
 	/* This parameter has a fixed size. */
 	len = sizeof(struct sctp_stream_reset_response_tsn);
 	resp->ph.param_type = htons(SCTP_STR_RESET_RESPONSE);
 	resp->ph.param_length = htons(len);
 	resp->response_seq = htonl(resp_seq);
 	resp->result = htonl(result);
 	resp->senders_next_tsn = htonl(send_una);
 	resp->receivers_next_tsn = htonl(recv_next);
 
 	/* Account for the new parameter in the chunk. */
 	ch->chunk_length = htons(len + old_len);
 	chk->book_size = len + old_len;
 	chk->send_size = SCTP_SIZE32(chk->book_size);
 	chk->book_size_scale = 0;
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 }
 
 /*
  * Append an Add Outgoing Streams Request parameter, asking for `adding`
  * more streams with request sequence number `seq`, to the stream reset
  * chunk held in chk->data.  The chunk length, send_size, book_size and
  * the mbuf length are updated accordingly.
  */
 static void
 sctp_add_an_out_stream(struct sctp_tmit_chunk *chk,
     uint32_t seq,
     uint16_t adding)
 {
 	struct sctp_stream_reset_add_strm *addstr;
 	struct sctp_chunkhdr *ch;
 	uint16_t len, old_len;
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	old_len = len = SCTP_SIZE32(ntohs(ch->chunk_length));
 	/* The new parameter starts right behind the padded chunk content. */
 	addstr = (struct sctp_stream_reset_add_strm *)((caddr_t)ch + len);
 
 	/* This parameter has a fixed size. */
 	len = sizeof(struct sctp_stream_reset_add_strm);
 	addstr->ph.param_type = htons(SCTP_STR_RESET_ADD_OUT_STREAMS);
 	addstr->ph.param_length = htons(len);
 	addstr->request_seq = htonl(seq);
 	addstr->number_of_streams = htons(adding);
 	addstr->reserved = 0;
 
 	/* Account for the new parameter in the chunk. */
 	ch->chunk_length = htons(len + old_len);
 	chk->send_size = len + old_len;
 	chk->book_size = SCTP_SIZE32(chk->send_size);
 	chk->book_size_scale = 0;
 	SCTP_BUF_LEN(chk->data) = SCTP_SIZE32(chk->send_size);
 }
 
 /*
  * Append an Add Incoming Streams Request parameter, asking for `adding`
  * more streams with request sequence number `seq`, to the stream reset
  * chunk held in chk->data.  The chunk length, send_size, book_size and
  * the mbuf length are updated accordingly.
  */
 static void
 sctp_add_an_in_stream(struct sctp_tmit_chunk *chk,
     uint32_t seq,
     uint16_t adding)
 {
 	struct sctp_stream_reset_add_strm *addstr;
 	struct sctp_chunkhdr *ch;
 	uint16_t len, old_len;
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	old_len = len = SCTP_SIZE32(ntohs(ch->chunk_length));
 	/* The new parameter starts right behind the padded chunk content. */
 	addstr = (struct sctp_stream_reset_add_strm *)((caddr_t)ch + len);
 
 	/* This parameter has a fixed size. */
 	len = sizeof(struct sctp_stream_reset_add_strm);
 	addstr->ph.param_type = htons(SCTP_STR_RESET_ADD_IN_STREAMS);
 	addstr->ph.param_length = htons(len);
 	addstr->request_seq = htonl(seq);
 	addstr->number_of_streams = htons(adding);
 	addstr->reserved = 0;
 
 	/* Account for the new parameter in the chunk. */
 	ch->chunk_length = htons(len + old_len);
 	chk->send_size = len + old_len;
 	chk->book_size = SCTP_SIZE32(chk->send_size);
 	chk->book_size_scale = 0;
 	SCTP_BUF_LEN(chk->data) = SCTP_SIZE32(chk->send_size);
 }
 
 /*
  * Try to send an Outgoing SSN Reset Request for the streams that are
  * waiting for one.
  *
  * asoc->trigger_reset is cleared unconditionally.  On success the
  * STREAM-RESET chunk is remembered in asoc->str_reset, appended to the
  * control send queue, a SACK is queued when asoc->send_sack is set, and
  * the stream reset timer is started for the chunk's destination.
  *
  * Returns 0 on success, EALREADY when a stream reset is already
  * outstanding, ENOMEM when a chunk/mbuf cannot be allocated and ENOENT
  * when no stream is ready to be reset.
  */
 int
 sctp_send_stream_reset_out_if_possible(struct sctp_tcb *stcb, int so_locked)
 {
 	struct sctp_association *asoc;
 	struct sctp_tmit_chunk *chk;
 	struct sctp_chunkhdr *ch;
 
 	asoc = &stcb->asoc;
 	asoc->trigger_reset = 0;
 	if (asoc->stream_reset_outstanding) {
 		return (EALREADY);
 	}
 
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return (ENOMEM);
 	}
 	chk->copy_by_ref = 0;
 	chk->flags = 0;
 	chk->rec.chunk_id.id = SCTP_STREAM_RESET;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->asoc = asoc;
 	/* Start out with a bare chunk header; the parameter follows below. */
 	chk->book_size = sizeof(struct sctp_chunkhdr);
 	chk->book_size_scale = 0;
 	chk->send_size = SCTP_SIZE32(chk->book_size);
 	chk->data = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_DATA);
 	if (chk->data == NULL) {
 		sctp_free_a_chunk(stcb, chk, so_locked);
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return (ENOMEM);
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	/* Prefer the alternate destination when there is one. */
 	chk->whoTo = (asoc->alternate != NULL) ?
 	    asoc->alternate : asoc->primary_destination;
 	atomic_add_int(&chk->whoTo->ref_count, 1);
 
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	ch->chunk_type = SCTP_STREAM_RESET;
 	ch->chunk_flags = 0;
 	ch->chunk_length = htons(chk->book_size);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 
 	if (!sctp_add_stream_reset_out(stcb, chk, asoc->str_reset_seq_out,
 	    (asoc->str_reset_seq_in - 1), (asoc->sending_seq - 1))) {
 		/* No stream is ready, so there is nothing to send. */
 		m_freem(chk->data);
 		chk->data = NULL;
 		sctp_free_a_chunk(stcb, chk, so_locked);
 		return (ENOENT);
 	}
 	asoc->stream_reset_outstanding++;
 	asoc->str_reset = chk;
 
 	/* Hand the chunk over to the control send queue. */
 	TAILQ_INSERT_TAIL(&asoc->control_send_queue, chk, sctp_next);
 	asoc->ctrl_queue_cnt++;
 
 	if (asoc->send_sack) {
 		sctp_send_sack(stcb, so_locked);
 	}
 	sctp_timer_start(SCTP_TIMER_TYPE_STRRESET, stcb->sctp_ep, stcb, chk->whoTo);
 	return (0);
 }
 
 /*
  * Build and queue a STREAM-RESET chunk holding one or more request
  * parameters.
  *
  * stcb           - association; its TCB lock is asserted.
  * number_entries - number of stream ids in `list` (used for the incoming
  *                  reset request).
  * list           - stream ids for the incoming reset request.
  * send_in_req    - non-zero: add an Incoming SSN Reset Request; this also
  *                  makes the function try to add an Outgoing SSN Reset
  *                  Request first.
  * send_tsn_req   - non-zero: add an SSN/TSN Reset Request; must not be
  *                  combined with send_in_req.
  * add_stream     - bit 0 (value 1): request `adding_o` more outgoing
  *                  streams; bit 1 (value 2): request `adding_i` more
  *                  incoming streams.
  * adding_o       - number of outgoing streams to add.
  * adding_i       - number of incoming streams to add.
  * peer_asked     - stored in asoc->peer_req_out when outgoing streams are
  *                  added.
  *
  * Each parameter added bumps asoc->stream_reset_outstanding.  When more
  * outgoing streams are requested than the strmout array has spare room
  * for, the array is reallocated and the existing streams are moved over;
  * if that allocation fails the "add outgoing streams" request is silently
  * dropped and the remaining parameters are still sent.
  *
  * Returns 0 when the chunk was queued, EBUSY when a stream reset is
  * already outstanding, EINVAL for an empty or contradictory request and
  * ENOMEM when `list` cannot fit or a chunk/mbuf cannot be allocated.
  */
 int
 sctp_send_str_reset_req(struct sctp_tcb *stcb,
     uint16_t number_entries, uint16_t *list,
     uint8_t send_in_req,
     uint8_t send_tsn_req,
     uint8_t add_stream,
     uint16_t adding_o,
     uint16_t adding_i, uint8_t peer_asked)
 {
 	struct sctp_association *asoc;
 	struct sctp_tmit_chunk *chk;
 	struct sctp_chunkhdr *ch;
 	int can_send_out_req = 0;
 	uint32_t seq;
 
 	SCTP_TCB_LOCK_ASSERT(stcb);
 
 	asoc = &stcb->asoc;
 	if (asoc->stream_reset_outstanding) {
 		/*-
 		 * Already one pending, must get ACK back to clear the flag.
 		 */
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EBUSY);
 		return (EBUSY);
 	}
 	if ((send_in_req == 0) && (send_tsn_req == 0) &&
 	    (add_stream == 0)) {
 		/* nothing to do */
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 		return (EINVAL);
 	}
 	if (send_tsn_req && send_in_req) {
 		/* error, can't do that */
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 		return (EINVAL);
 	} else if (send_in_req) {
 		/* An incoming reset request is paired with an outgoing one. */
 		can_send_out_req = 1;
 	}
 	/*
 	 * Refuse a stream list that would not fit into the single
 	 * MCLBYTES-sized mbuf allocated below.
 	 */
 	if (number_entries > (MCLBYTES -
 	    SCTP_MIN_OVERHEAD -
 	    sizeof(struct sctp_chunkhdr) -
 	    sizeof(struct sctp_stream_reset_out_request)) /
 	    sizeof(uint16_t)) {
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return (ENOMEM);
 	}
 	sctp_alloc_a_chunk(stcb, chk);
 	if (chk == NULL) {
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return (ENOMEM);
 	}
 	chk->copy_by_ref = 0;
 	chk->rec.chunk_id.id = SCTP_STREAM_RESET;
 	chk->rec.chunk_id.can_take_data = 0;
 	chk->flags = 0;
 	chk->asoc = &stcb->asoc;
 	/* Start with a bare chunk header; parameters are appended below. */
 	chk->book_size = sizeof(struct sctp_chunkhdr);
 	chk->send_size = SCTP_SIZE32(chk->book_size);
 	chk->book_size_scale = 0;
 	chk->data = sctp_get_mbuf_for_msg(MCLBYTES, 0, M_NOWAIT, 1, MT_DATA);
 	if (chk->data == NULL) {
 		sctp_free_a_chunk(stcb, chk, SCTP_SO_LOCKED);
 		SCTP_LTRACE_ERR_RET(NULL, stcb, NULL, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		return (ENOMEM);
 	}
 	SCTP_BUF_RESV_UF(chk->data, SCTP_MIN_OVERHEAD);
 
 	/* setup chunk parameters */
 	chk->sent = SCTP_DATAGRAM_UNSENT;
 	chk->snd_count = 0;
 	/* Prefer the alternate destination when there is one. */
 	if (stcb->asoc.alternate) {
 		chk->whoTo = stcb->asoc.alternate;
 	} else {
 		chk->whoTo = stcb->asoc.primary_destination;
 	}
 	atomic_add_int(&chk->whoTo->ref_count, 1);
 	ch = mtod(chk->data, struct sctp_chunkhdr *);
 	ch->chunk_type = SCTP_STREAM_RESET;
 	ch->chunk_flags = 0;
 	ch->chunk_length = htons(chk->book_size);
 	SCTP_BUF_LEN(chk->data) = chk->send_size;
 
 	/* Each parameter added below consumes one request sequence number. */
 	seq = stcb->asoc.str_reset_seq_out;
 	if (can_send_out_req) {
 		int ret;
 
 		ret = sctp_add_stream_reset_out(stcb, chk, seq, (stcb->asoc.str_reset_seq_in - 1), (stcb->asoc.sending_seq - 1));
 		if (ret) {
 			seq++;
 			asoc->stream_reset_outstanding++;
 		}
 	}
 	if ((add_stream & 1) &&
 	    ((stcb->asoc.strm_realoutsize - stcb->asoc.streamoutcnt) < adding_o)) {
 		/* Need to allocate more */
 		struct sctp_stream_out *oldstream;
 		struct sctp_stream_queue_pending *sp, *nsp;
 		int i;
 #if defined(SCTP_DETAILED_STR_STATS)
 		int j;
 #endif
 
 		oldstream = stcb->asoc.strmout;
 		/* get some more */
 		SCTP_MALLOC(stcb->asoc.strmout, struct sctp_stream_out *,
 		    (stcb->asoc.streamoutcnt + adding_o) * sizeof(struct sctp_stream_out),
 		    SCTP_M_STRMO);
 		if (stcb->asoc.strmout == NULL) {
 			uint8_t x;
 
 			/* Keep using the old array and drop this request. */
 			stcb->asoc.strmout = oldstream;
 			/* Turn off the bit */
 			x = add_stream & 0xfe;
 			add_stream = x;
 			goto skip_stuff;
 		}
 		/*
 		 * Ok now we proceed with copying the old out stuff and
 		 * initializing the new stuff.
 		 */
 		stcb->asoc.ss_functions.sctp_ss_clear(stcb, &stcb->asoc, false);
 		for (i = 0; i < stcb->asoc.streamoutcnt; i++) {
 			TAILQ_INIT(&stcb->asoc.strmout[i].outqueue);
 			/* FIX ME FIX ME */
 			/*
 			 * This should be a SS_COPY operation FIX ME STREAM
 			 * SCHEDULER EXPERT
 			 */
 			stcb->asoc.ss_functions.sctp_ss_init_stream(stcb, &stcb->asoc.strmout[i], &oldstream[i]);
 			stcb->asoc.strmout[i].chunks_on_queues = oldstream[i].chunks_on_queues;
 #if defined(SCTP_DETAILED_STR_STATS)
 			for (j = 0; j < SCTP_PR_SCTP_MAX + 1; j++) {
 				stcb->asoc.strmout[i].abandoned_sent[j] = oldstream[i].abandoned_sent[j];
 				stcb->asoc.strmout[i].abandoned_unsent[j] = oldstream[i].abandoned_unsent[j];
 			}
 #else
 			stcb->asoc.strmout[i].abandoned_sent[0] = oldstream[i].abandoned_sent[0];
 			stcb->asoc.strmout[i].abandoned_unsent[0] = oldstream[i].abandoned_unsent[0];
 #endif
 			stcb->asoc.strmout[i].next_mid_ordered = oldstream[i].next_mid_ordered;
 			stcb->asoc.strmout[i].next_mid_unordered = oldstream[i].next_mid_unordered;
 			stcb->asoc.strmout[i].last_msg_incomplete = oldstream[i].last_msg_incomplete;
 			stcb->asoc.strmout[i].sid = i;
 			stcb->asoc.strmout[i].state = oldstream[i].state;
 			/* now anything on those queues? Move it to the new entry. */
 			TAILQ_FOREACH_SAFE(sp, &oldstream[i].outqueue, next, nsp) {
 				TAILQ_REMOVE(&oldstream[i].outqueue, sp, next);
 				TAILQ_INSERT_TAIL(&stcb->asoc.strmout[i].outqueue, sp, next);
 			}
 		}
 		/* now the new streams */
 		stcb->asoc.ss_functions.sctp_ss_init(stcb, &stcb->asoc);
 		for (i = stcb->asoc.streamoutcnt; i < (stcb->asoc.streamoutcnt + adding_o); i++) {
 			TAILQ_INIT(&stcb->asoc.strmout[i].outqueue);
 			stcb->asoc.strmout[i].chunks_on_queues = 0;
 #if defined(SCTP_DETAILED_STR_STATS)
 			for (j = 0; j < SCTP_PR_SCTP_MAX + 1; j++) {
 				stcb->asoc.strmout[i].abandoned_sent[j] = 0;
 				stcb->asoc.strmout[i].abandoned_unsent[j] = 0;
 			}
 #else
 			stcb->asoc.strmout[i].abandoned_sent[0] = 0;
 			stcb->asoc.strmout[i].abandoned_unsent[0] = 0;
 #endif
 			stcb->asoc.strmout[i].next_mid_ordered = 0;
 			stcb->asoc.strmout[i].next_mid_unordered = 0;
 			stcb->asoc.strmout[i].sid = i;
 			stcb->asoc.strmout[i].last_msg_incomplete = 0;
 			stcb->asoc.ss_functions.sctp_ss_init_stream(stcb, &stcb->asoc.strmout[i], NULL);
 			/* New streams stay closed for now. */
 			stcb->asoc.strmout[i].state = SCTP_STREAM_CLOSED;
 		}
 		/* streamoutcnt itself is not changed here, only the capacity. */
 		stcb->asoc.strm_realoutsize = stcb->asoc.streamoutcnt + adding_o;
 		SCTP_FREE(oldstream, SCTP_M_STRMO);
 	}
 skip_stuff:
 	/* Append the remaining request parameters, one sequence number each. */
 	if ((add_stream & 1) && (adding_o > 0)) {
 		asoc->strm_pending_add_size = adding_o;
 		asoc->peer_req_out = peer_asked;
 		sctp_add_an_out_stream(chk, seq, adding_o);
 		seq++;
 		asoc->stream_reset_outstanding++;
 	}
 	if ((add_stream & 2) && (adding_i > 0)) {
 		sctp_add_an_in_stream(chk, seq, adding_i);
 		seq++;
 		asoc->stream_reset_outstanding++;
 	}
 	if (send_in_req) {
 		sctp_add_stream_reset_in(chk, number_entries, list, seq);
 		seq++;
 		asoc->stream_reset_outstanding++;
 	}
 	if (send_tsn_req) {
 		sctp_add_stream_reset_tsn(chk, seq);
 		asoc->stream_reset_outstanding++;
 	}
 	/* Remember the request chunk on the association. */
 	asoc->str_reset = chk;
 	/* insert the chunk for sending */
 	TAILQ_INSERT_TAIL(&asoc->control_send_queue,
 	    chk,
 	    sctp_next);
 	asoc->ctrl_queue_cnt++;
 	if (stcb->asoc.send_sack) {
 		sctp_send_sack(stcb, SCTP_SO_LOCKED);
 	}
 	sctp_timer_start(SCTP_TIMER_TYPE_STRRESET, stcb->sctp_ep, stcb, chk->whoTo);
 	return (0);
 }
 
 /*
  * Answer the packet in `m` with an ABORT carrying the optional error
  * cause chain `cause`.
  *
  * An ABORT is never answered with an ABORT: when
  * sctp_is_there_an_abort_here() reports one in the packet, `cause` is
  * freed and nothing is sent.  That check is handed a pointer to `vtag`,
  * so the tag finally used may differ from the one passed in (presumably;
  * see sctp_is_there_an_abort_here()).
  */
 void
 sctp_send_abort(struct mbuf *m, int iphlen, struct sockaddr *src, struct sockaddr *dst,
     struct sctphdr *sh, uint32_t vtag, struct mbuf *cause,
     uint8_t mflowtype, uint32_t mflowid, uint16_t fibnum,
     uint32_t vrf_id, uint16_t port)
 {
 	if (!sctp_is_there_an_abort_here(m, iphlen, &vtag)) {
 		sctp_send_resp_msg(src, dst, sh, vtag, SCTP_ABORT_ASSOCIATION, cause,
 		    mflowtype, mflowid, fibnum,
 		    vrf_id, port);
 		return;
 	}
 	/* Nothing is sent, so the cause chain has to be released here. */
 	if (cause != NULL) {
 		sctp_m_freem(cause);
 	}
 }
 
 /*
  * Send an OPERATION-ERROR chunk carrying `cause` from `dst` back to `src`.
  * This is a thin wrapper that hands all arguments to sctp_send_resp_msg()
  * with the chunk type fixed to SCTP_OPERATION_ERROR.
  */
 void
 sctp_send_operr_to(struct sockaddr *src, struct sockaddr *dst,
     struct sctphdr *sh, uint32_t vtag, struct mbuf *cause,
     uint8_t mflowtype, uint32_t mflowid, uint16_t fibnum,
     uint32_t vrf_id, uint16_t port)
 {
 	sctp_send_resp_msg(src, dst, sh, vtag, SCTP_OPERATION_ERROR, cause,
 	    mflowtype, mflowid, fibnum, vrf_id, port);
 }
 
 /*
  * Copy up to `max_send_len` further bytes of user data from `uio` into a
  * new mbuf chain with a packet header; M_EOR is set on it when
  * `user_marks_eor` is non-zero.
  *
  * On success the chain is returned, *sndout receives its length and
  * *new_tail its last mbuf.  On failure NULL is returned and *error is set
  * to EFAULT; *sndout and *new_tail are left untouched.
  */
 static struct mbuf *
 sctp_copy_resume(struct uio *uio,
     int max_send_len,
     int user_marks_eor,
     int *error,
     uint32_t *sndout,
     struct mbuf **new_tail)
 {
 	struct mbuf *m;
 	int mflags;
 
 	mflags = M_PKTHDR;
 	if (user_marks_eor) {
 		mflags |= M_EOR;
 	}
 	m = m_uiotombuf(uio, M_WAITOK, max_send_len, 0, mflags);
 	if (m == NULL) {
 		/* The only possible error is EFAULT. */
 		SCTP_LTRACE_ERR_RET(NULL, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, EFAULT);
 		*error = EFAULT;
 		return (NULL);
 	}
 	*sndout = m_length(m, NULL);
 	*new_tail = m_last(m);
 	return (m);
 }
 
 /*
  * Copy sp->length bytes of user data from `uio` into a new mbuf chain,
  * leaving `resv_upfront` bytes of leading space, and attach the chain to
  * `sp` (sp->data and sp->tail_mbuf).
  *
  * Returns 0 on success or EFAULT when the copy fails, in which case
  * sp->data is NULL and sp->tail_mbuf is not modified.
  */
 static int
 sctp_copy_one(struct sctp_stream_queue_pending *sp,
     struct uio *uio,
     int resv_upfront)
 {
 	struct mbuf *m;
 
 	m = m_uiotombuf(uio, M_WAITOK, sp->length, resv_upfront, 0);
 	sp->data = m;
 	if (m == NULL) {
 		/* The only possible error is EFAULT. */
 		SCTP_LTRACE_ERR_RET(NULL, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, EFAULT);
 		return (EFAULT);
 	}
 	sp->tail_mbuf = m_last(m);
 	return (0);
 }
 
 /*
  * Allocate a stream queue entry and fill it with up to `max_send_len`
  * bytes of user data from `uio`, using the send parameters in `srcv`.
  *
  * The message is marked complete when this entry takes everything left
  * in `uio` and either explicit EOR mode is off (`user_marks_eor` == 0)
  * or the caller set SCTP_EOF or SCTP_EOR.  With SCTP_ADDR_OVER set, a
  * reference on `net` is taken and stored in the entry.
  *
  * Returns the new entry with *error == 0, or NULL with *error set to
  * ENOMEM (no entry available) or to the error of the data copy.
  *
  * This routine must be very careful in its work: protocol processing is
  * up and running while the data is being copied in.
  */
 static struct sctp_stream_queue_pending *
 sctp_copy_it_in(struct sctp_tcb *stcb,
     struct sctp_association *asoc,
     struct sctp_nonpad_sndrcvinfo *srcv,
     struct uio *uio,
     struct sctp_nets *net,
     ssize_t max_send_len,
     int user_marks_eor,
     int *error)
 {
 	struct sctp_stream_queue_pending *sp;
 	int resv_in_first;
 
 	*error = 0;
 	sctp_alloc_a_strmoq(stcb, sp);
 	if (sp == NULL) {
 		SCTP_LTRACE_ERR_RET(NULL, stcb, net, SCTP_FROM_SCTP_OUTPUT, ENOMEM);
 		*error = ENOMEM;
 		return (NULL);
 	}
 
 	/* Take over the per-message send parameters. */
 	sp->act_flags = 0;
 	sp->sinfo_flags = srcv->sinfo_flags;
 	sp->timetolive = srcv->sinfo_timetolive;
 	sp->ppid = srcv->sinfo_ppid;
 	sp->context = srcv->sinfo_context;
 	sp->fsn = 0;
 	(void)SCTP_GETTIME_TIMEVAL(&sp->ts);
 	sp->sid = srcv->sinfo_stream;
 	sp->length = (uint32_t)min(uio->uio_resid, max_send_len);
 
 	/* Is this the whole message or only a first part of it? */
 	sp->msg_is_complete = 0;
 	if (sp->length == (uint32_t)uio->uio_resid) {
 		if ((user_marks_eor == 0) ||
 		    (srcv->sinfo_flags & (SCTP_EOF | SCTP_EOR))) {
 			sp->msg_is_complete = 1;
 		}
 	}
 	sp->sender_all_done = 0;
 	sp->some_taken = 0;
 	sp->put_last_out = 0;
 	resv_in_first = SCTP_DATA_CHUNK_OVERHEAD(stcb);
 	sp->data = sp->tail_mbuf = NULL;
 
 	if (sp->length != 0) {
 		/* Pick the key id and pin the key if DATA must be signed. */
 		if (srcv->sinfo_keynumber_valid) {
 			sp->auth_keyid = srcv->sinfo_keynumber;
 		} else {
 			sp->auth_keyid = stcb->asoc.authinfo.active_keyid;
 		}
 		if (sctp_auth_is_required_chunk(SCTP_DATA, stcb->asoc.peer_auth_chunks)) {
 			sctp_auth_key_acquire(stcb, sp->auth_keyid);
 			sp->holds_key_ref = 1;
 		}
 		*error = sctp_copy_one(sp, uio, resv_in_first);
 	}
 	if (*error) {
 		sctp_free_a_strmoq(stcb, sp, SCTP_SO_LOCKED);
 		return (NULL);
 	}
 
 	if (sp->sinfo_flags & SCTP_ADDR_OVER) {
 		/* The entry holds a reference on the requested destination. */
 		sp->net = net;
 		atomic_add_int(&sp->net->ref_count, 1);
 	} else {
 		sp->net = NULL;
 	}
 	sctp_set_prsctp_policy(sp);
 	return (sp);
 }
 
 /*
  * Socket-layer send entry point: prepares the arguments and hands the
  * work to sctp_lower_sosend().
  *
  * If `control` is given it is searched for SCTP_SNDRCV information, which
  * is passed on when found.  When both INET and INET6 are compiled in, an
  * AF_INET6 destination holding an IPv4-mapped address is converted to a
  * sockaddr_in first; an AF_INET6 address with a wrong sa_len yields
  * EINVAL.
  *
  * Returns EINVAL as described above, otherwise whatever
  * sctp_lower_sosend() returns.
  */
 int
 sctp_sosend(struct socket *so,
     struct sockaddr *addr,
     struct uio *uio,
     struct mbuf *top,
     struct mbuf *control,
     int flags,
     struct thread *p)
 {
 	struct sctp_sndrcvinfo sndrcvninfo;
 	struct sctp_sndrcvinfo *srcv;
 	struct sockaddr *addr_to_use;
 #if defined(INET) && defined(INET6)
 	struct sockaddr_in sin;
 	struct sockaddr_in6 *sin6;
 #endif
 
 	/* process cmsg snd/rcv info (maybe a assoc-id) */
 	srcv = NULL;
 	if ((control != NULL) &&
 	    sctp_find_cmsg(SCTP_SNDRCV, (void *)&sndrcvninfo, control, sizeof(sndrcvninfo))) {
 		srcv = &sndrcvninfo;
 	}
 
 	/* By default the address is used as given. */
 	addr_to_use = addr;
 #if defined(INET) && defined(INET6)
 	if ((addr != NULL) && (addr->sa_family == AF_INET6)) {
 		if (addr->sa_len != sizeof(struct sockaddr_in6)) {
 			SCTP_LTRACE_ERR_RET(NULL, NULL, NULL, SCTP_FROM_SCTP_OUTPUT, EINVAL);
 			return (EINVAL);
 		}
 		sin6 = (struct sockaddr_in6 *)addr;
 		if (IN6_IS_ADDR_V4MAPPED(&sin6->sin6_addr)) {
 			/* Use the embedded IPv4 address instead. */
 			in6_sin6_2_sin(&sin, sin6);
 			addr_to_use = (struct sockaddr *)&sin;
 		}
 	}
 #endif
 	return (sctp_lower_sosend(so, addr_to_use, uio, top, control, flags,
 	    srcv, p));
 }
 
 int
 sctp_lower_sosend(struct socket *so,
     struct sockaddr *addr,
     struct uio *uio,
     struct mbuf *top,
     struct mbuf *control,
     int flags,
     struct sctp_sndrcvinfo *srcv,
     struct thread *p)
 {
 	struct sctp_nonpad_sndrcvinfo sndrcvninfo_buf;
 	struct epoch_tracker et;
 	struct timeval now;
 	struct sctp_block_entry be;
 	struct sctp_inpcb *inp;
 	struct sctp_tcb *stcb = NULL;
 	struct sctp_nets *net;
 	struct sctp_association *asoc;
 	struct sctp_inpcb *t_inp;
 	struct sctp_nonpad_sndrcvinfo *sndrcvninfo;
 	ssize_t sndlen = 0, max_len, local_add_more;
 	ssize_t local_soresv = 0;
 	sctp_assoc_t sinfo_assoc_id;
 	int user_marks_eor;
 	int nagle_applies = 0;
 	int error;
 	int queue_only = 0, queue_only_for_init = 0;
 	int un_sent;
 	int now_filled = 0;
 	unsigned int inqueue_bytes = 0;
 	uint16_t port;
 	uint16_t sinfo_flags;
 	uint16_t sinfo_stream;
 	bool create_lock_applied = false;
 	bool free_cnt_applied = false;
 	bool some_on_control;
 	bool got_all_of_the_send = false;
 	bool non_blocking = false;
 
 	error = 0;
 	net = NULL;
 	stcb = NULL;
 
 	if ((uio == NULL) && (top == NULL)) {
 		error = EINVAL;
 		goto out_unlocked;
 	}
 	if (addr != NULL) {
 		union sctp_sockstore *raddr = (union sctp_sockstore *)addr;
 
 		switch (raddr->sa.sa_family) {
 #ifdef INET
 		case AF_INET:
 			if (raddr->sin.sin_len != sizeof(struct sockaddr_in)) {
 				error = EINVAL;
 				goto out_unlocked;
 			}
 			port = raddr->sin.sin_port;
 			break;
 #endif
 #ifdef INET6
 		case AF_INET6:
 			if (raddr->sin6.sin6_len != sizeof(struct sockaddr_in6)) {
 				error = EINVAL;
 				goto out_unlocked;
 			}
 			port = raddr->sin6.sin6_port;
 			break;
 #endif
 		default:
 			error = EAFNOSUPPORT;
 			goto out_unlocked;
 		}
 	} else {
 		port = 0;
 	}
 	if (uio != NULL) {
 		if (uio->uio_resid < 0) {
 			error = EINVAL;
 			goto out_unlocked;
 		}
 		sndlen = uio->uio_resid;
 	} else {
 		sndlen = SCTP_HEADER_LEN(top);
 	}
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "Send called addr:%p send length %zd\n",
 	    (void *)addr, sndlen);
 
 	t_inp = inp = (struct sctp_inpcb *)so->so_pcb;
 	if (inp == NULL) {
 		error = EINVAL;
 		goto out_unlocked;
 	}
 	user_marks_eor = sctp_is_feature_on(inp, SCTP_PCB_FLAGS_EXPLICIT_EOR);
 	if ((uio == NULL) && (user_marks_eor != 0)) {
 		/*-
 		 * We do not support eeor mode for
 		 * sending with mbuf chains (like sendfile).
 		 */
 		error = EINVAL;
 		goto out_unlocked;
 	}
 	if ((inp->sctp_flags & SCTP_PCB_FLAGS_TCPTYPE) &&
 	    SCTP_IS_LISTENING(inp)) {
 		/* The listener can NOT send. */
 		error = EINVAL;
 		goto out_unlocked;
 	}
 	atomic_add_int(&inp->total_sends, 1);
 
 	if (srcv != NULL) {
 		sndrcvninfo = (struct sctp_nonpad_sndrcvinfo *)srcv;
 		sinfo_assoc_id = sndrcvninfo->sinfo_assoc_id;
 		sinfo_flags = sndrcvninfo->sinfo_flags;
 		if (INVALID_SINFO_FLAG(sinfo_flags) ||
 		    PR_SCTP_INVALID_POLICY(sinfo_flags)) {
 			error = EINVAL;
 			goto out_unlocked;
 		}
 		if (sinfo_flags != 0) {
 			SCTP_STAT_INCR(sctps_sends_with_flags);
 		}
 	} else {
 		sndrcvninfo = NULL;
 		sinfo_flags = inp->def_send.sinfo_flags;
 		sinfo_assoc_id = inp->def_send.sinfo_assoc_id;
 	}
 	if (flags & MSG_EOR) {
 		sinfo_flags |= SCTP_EOR;
 	}
 	if (flags & MSG_EOF) {
 		sinfo_flags |= SCTP_EOF;
 	}
 	if ((sinfo_flags & SCTP_ADDR_OVER) && (addr == NULL)) {
 		error = EINVAL;
 		goto out_unlocked;
 	}
 	SCTP_INP_RLOCK(inp);
 	if ((sinfo_flags & SCTP_SENDALL) &&
 	    (inp->sctp_flags & SCTP_PCB_FLAGS_UDPTYPE)) {
 		SCTP_INP_RUNLOCK(inp);
 		error = sctp_sendall(inp, uio, top, sndrcvninfo);
 		top = NULL;
 		goto out_unlocked;
 	}
 	/* Now we must find the association. */
 	if ((inp->sctp_flags & SCTP_PCB_FLAGS_CONNECTED) ||
 	    (inp->sctp_flags & SCTP_PCB_FLAGS_IN_TCPPOOL)) {
 		stcb = LIST_FIRST(&inp->sctp_asoc_list);
 		if (stcb != NULL) {
 			SCTP_TCB_LOCK(stcb);
 		}
 		SCTP_INP_RUNLOCK(inp);
 	} else if (sinfo_assoc_id > SCTP_ALL_ASSOC) {
 		stcb = sctp_findasoc_ep_asocid_locked(inp, sinfo_assoc_id, 1);
 		SCTP_INP_RUNLOCK(inp);
 		if (stcb != NULL) {
 			SCTP_TCB_LOCK_ASSERT(stcb);
 		}
 	} else if (addr != NULL) {
 		/*-
 		 * Since we did not use findep we must
 		 * increment it, and if we don't find a tcb
 		 * decrement it.
 		 */
 		SCTP_INP_INCR_REF(inp);
 		SCTP_INP_RUNLOCK(inp);
 		stcb = sctp_findassociation_ep_addr(&t_inp, addr, &net, NULL, NULL);
 		if (stcb == NULL) {
 			SCTP_INP_WLOCK(inp);
 			SCTP_INP_DECR_REF(inp);
 			SCTP_INP_WUNLOCK(inp);
 		} else {
 			SCTP_TCB_LOCK_ASSERT(stcb);
 		}
 	} else {
 		SCTP_INP_RUNLOCK(inp);
 	}
 
 #ifdef INVARIANTS
 	if (stcb != NULL) {
 		SCTP_TCB_LOCK_ASSERT(stcb);
 	}
 #endif
 
 	if ((stcb == NULL) && (addr != NULL)) {
 		/* Possible implicit send? */
 		SCTP_ASOC_CREATE_LOCK(inp);
 		create_lock_applied = true;
 		if ((inp->sctp_flags & SCTP_PCB_FLAGS_SOCKET_GONE) ||
 		    (inp->sctp_flags & SCTP_PCB_FLAGS_SOCKET_ALLGONE)) {
 			error = EINVAL;
 			goto out_unlocked;
 		}
 		if (((inp->sctp_flags & SCTP_PCB_FLAGS_BOUND_V6) == 0) &&
 		    (addr->sa_family == AF_INET6)) {
 			error = EINVAL;
 			goto out_unlocked;
 		}
 		SCTP_INP_WLOCK(inp);
 		SCTP_INP_INCR_REF(inp);
 		SCTP_INP_WUNLOCK(inp);
 		/* With the lock applied look again */
 		stcb = sctp_findassociation_ep_addr(&t_inp, addr, &net, NULL, NULL);
 #if defined(INET) || defined(INET6)
 		if ((stcb == NULL) && (control != NULL) && (port > 0)) {
 			stcb = sctp_findassociation_cmsgs(&t_inp, port, control, &net, &error);
 		}
 #endif
 		if (stcb == NULL) {
 			SCTP_INP_WLOCK(inp);
 			SCTP_INP_DECR_REF(inp);
 			SCTP_INP_WUNLOCK(inp);
 		} else {
 			SCTP_TCB_LOCK_ASSERT(stcb);
 			SCTP_ASOC_CREATE_UNLOCK(inp);
 			create_lock_applied = false;
 		}
 		if (error != 0) {
 			goto out_unlocked;
 		}
 		if (t_inp != inp) {
 			error = ENOTCONN;
 			goto out_unlocked;
 		}
 	}
 	if (stcb == NULL) {
 		if (addr == NULL) {
 			error = ENOENT;
 			goto out_unlocked;
 		} else {
 			/* We must go ahead and start the INIT process */
 			uint32_t vrf_id;
 
 			if ((sinfo_flags & SCTP_ABORT) ||
 			    ((sinfo_flags & SCTP_EOF) && (sndlen == 0))) {
 				/*-
 				 * User asks to abort a non-existent assoc,
 				 * or EOF a non-existent assoc with no data
 				 */
 				error = ENOENT;
 				goto out_unlocked;
 			}
 			/* get an asoc/stcb struct */
 			vrf_id = inp->def_vrf_id;
 			KASSERT(create_lock_applied, ("create_lock_applied is false"));
 			stcb = sctp_aloc_assoc_connected(inp, addr, &error, 0, 0, vrf_id,
 			    inp->sctp_ep.pre_open_stream_count,
 			    inp->sctp_ep.port,
 			    p,
 			    SCTP_INITIALIZE_AUTH_PARAMS);
 			if (stcb == NULL) {
 				/* error is setup for us in the call. */
 				KASSERT(error != 0, ("error is 0 although stcb is NULL"));
 				goto out_unlocked;
 			}
 			SCTP_TCB_LOCK_ASSERT(stcb);
 			SCTP_ASOC_CREATE_UNLOCK(inp);
 			create_lock_applied = false;
 			/*
 			 * Turn on queue only flag to prevent data from
 			 * being sent
 			 */
 			queue_only = 1;
 			SCTP_SET_STATE(stcb, SCTP_STATE_COOKIE_WAIT);
 			(void)SCTP_GETTIME_TIMEVAL(&stcb->asoc.time_entered);
 			if (control != NULL) {
 				if (sctp_process_cmsgs_for_init(stcb, control, &error)) {
 					sctp_free_assoc(inp, stcb, SCTP_NORMAL_PROC,
 					    SCTP_FROM_SCTP_OUTPUT + SCTP_LOC_6);
 					stcb = NULL;
 					KASSERT(error != 0,
 					    ("error is 0 although sctp_process_cmsgs_for_init() indicated an error"));
 					goto out_unlocked;
 				}
 			}
 			/* out with the INIT */
 			queue_only_for_init = 1;
 			/*-
 			 * we may want to dig in after this call and adjust the MTU
 			 * value. It defaulted to 1500 (constant) but the ro
 			 * structure may now have an update and thus we may need to
 			 * change it BEFORE we append the message.
 			 */
 		}
 	}
 
 	KASSERT(!create_lock_applied, ("create_lock_applied is true"));
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 
 	asoc = &stcb->asoc;
 	if ((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) ||
 	    (asoc->state & SCTP_STATE_WAS_ABORTED)) {
 		if (asoc->state & SCTP_STATE_WAS_ABORTED) {
 			/* XXX: Could also be ECONNABORTED, not enough info. */
 			error = ECONNRESET;
 		} else {
 			error = ENOTCONN;
 		}
 		goto out_unlocked;
 	}
 	if ((SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_WAIT) ||
 	    (SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_ECHOED)) {
 		queue_only = 1;
 	}
 	/* Keep the stcb from being freed under our feet. */
 	atomic_add_int(&asoc->refcnt, 1);
 	free_cnt_applied = true;
 	if (sndrcvninfo == NULL) {
 		/* Use a local copy to have a consistent view. */
 		sndrcvninfo_buf = asoc->def_send;
 		sndrcvninfo = &sndrcvninfo_buf;
 		sinfo_flags = sndrcvninfo->sinfo_flags;
 		if (flags & MSG_EOR) {
 			sinfo_flags |= SCTP_EOR;
 		}
 		if (flags & MSG_EOF) {
 			sinfo_flags |= SCTP_EOF;
 		}
 	}
 	/* Are we aborting? */
 	if (sinfo_flags & SCTP_ABORT) {
 		struct mbuf *mm;
 		struct sctp_paramhdr *ph;
 		ssize_t tot_demand, tot_out = 0, max_out;
 
 		SCTP_STAT_INCR(sctps_sends_with_abort);
 		if ((SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_WAIT) ||
 		    (SCTP_GET_STATE(stcb) == SCTP_STATE_COOKIE_ECHOED)) {
 			/* It has to be up before we abort. */
 			error = EINVAL;
 			goto out_unlocked;
 		}
 		/* How big is the user initiated abort? */
 		if (top != NULL) {
 			struct mbuf *cntm;
 
 			if (sndlen != 0) {
 				for (cntm = top; cntm; cntm = SCTP_BUF_NEXT(cntm)) {
 					tot_out += SCTP_BUF_LEN(cntm);
 				}
 			}
 			mm = sctp_get_mbuf_for_msg(sizeof(struct sctp_paramhdr), 0, M_NOWAIT, 1, MT_DATA);
 		} else {
 			/* Must fit in a MTU */
 			tot_out = sndlen;
 			tot_demand = (tot_out + sizeof(struct sctp_paramhdr));
 			if (tot_demand > SCTP_DEFAULT_ADD_MORE) {
 				error = EMSGSIZE;
 				goto out_unlocked;
 			}
 			mm = sctp_get_mbuf_for_msg((unsigned int)tot_demand, 0, M_NOWAIT, 1, MT_DATA);
 		}
 		if (mm == NULL) {
 			error = ENOMEM;
 			goto out_unlocked;
 		}
 		max_out = asoc->smallest_mtu - sizeof(struct sctp_paramhdr);
 		max_out -= sizeof(struct sctp_abort_msg);
 		if (tot_out > max_out) {
 			tot_out = max_out;
 		}
 		ph = mtod(mm, struct sctp_paramhdr *);
 		ph->param_type = htons(SCTP_CAUSE_USER_INITIATED_ABT);
 		ph->param_length = htons((uint16_t)(sizeof(struct sctp_paramhdr) + tot_out));
 		ph++;
 		SCTP_BUF_LEN(mm) = (int)(tot_out + sizeof(struct sctp_paramhdr));
 		if (top == NULL) {
 			SCTP_TCB_UNLOCK(stcb);
 			error = uiomove((caddr_t)ph, (int)tot_out, uio);
 			SCTP_TCB_LOCK(stcb);
 			if ((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) ||
 			    (asoc->state & SCTP_STATE_WAS_ABORTED)) {
 				sctp_m_freem(mm);
 				if (asoc->state & SCTP_STATE_WAS_ABORTED) {
 					/*
 					 * XXX: Could also be ECONNABORTED,
 					 * not enough info.
 					 */
 					error = ECONNRESET;
 				} else {
 					error = ENOTCONN;
 				}
 				goto out_unlocked;
 			}
 			if (error != 0) {
 				/*-
 				 * Here if we can't get his data we
 				 * still abort we just don't get to
 				 * send the users note :-0
 				 */
 				sctp_m_freem(mm);
 				mm = NULL;
 				error = 0;
 			}
 		} else {
 			if (sndlen != 0) {
 				SCTP_BUF_NEXT(mm) = top;
 			}
 		}
 		atomic_subtract_int(&asoc->refcnt, 1);
 		free_cnt_applied = false;
 		/* release this lock, otherwise we hang on ourselves */
 		NET_EPOCH_ENTER(et);
 		sctp_abort_an_association(stcb->sctp_ep, stcb, mm, false, SCTP_SO_LOCKED);
 		NET_EPOCH_EXIT(et);
 		stcb = NULL;
 		/*
 		 * In this case top is already chained to mm avoid double
 		 * free, since we free it below if top != NULL and driver
 		 * would free it after sending the packet out
 		 */
 		if (sndlen != 0) {
 			top = NULL;
 		}
 		goto out_unlocked;
 	}
 
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 	if (sinfo_flags & SCTP_ADDR_OVER) {
 		if (addr != NULL) {
 			net = sctp_findnet(stcb, addr);
 		} else {
 			net = NULL;
 		}
 		if ((net == NULL) ||
 		    ((port != 0) && (port != stcb->rport))) {
 			error = EINVAL;
 			goto out_unlocked;
 		}
 	} else {
 		if (asoc->alternate != NULL) {
 			net = asoc->alternate;
 		} else {
 			net = asoc->primary_destination;
 		}
 	}
 	if (sndlen == 0) {
 		if (sinfo_flags & SCTP_EOF) {
 			got_all_of_the_send = true;
 			goto dataless_eof;
 		} else {
 			error = EINVAL;
 			goto out_unlocked;
 		}
 	}
 	if (sctp_is_feature_on(inp, SCTP_PCB_FLAGS_NO_FRAGMENT)) {
 		if (sndlen > (ssize_t)asoc->smallest_mtu) {
 			error = EMSGSIZE;
 			goto out_unlocked;
 		}
 	}
 	sinfo_stream = sndrcvninfo->sinfo_stream;
 	/* Is the stream no. valid? */
 	if (sinfo_stream >= asoc->streamoutcnt) {
 		/* Invalid stream number */
 		error = EINVAL;
 		goto out_unlocked;
 	}
 	if ((asoc->strmout[sinfo_stream].state != SCTP_STREAM_OPEN) &&
 	    (asoc->strmout[sinfo_stream].state != SCTP_STREAM_OPENING)) {
 		/*
 		 * Can't queue any data while stream reset is underway.
 		 */
 		if (asoc->strmout[sinfo_stream].state > SCTP_STREAM_OPEN) {
 			error = EAGAIN;
 		} else {
 			error = EINVAL;
 		}
 		goto out_unlocked;
 	}
 	atomic_add_int(&stcb->total_sends, 1);
 	if (SCTP_SO_IS_NBIO(so) || (flags & (MSG_NBIO | MSG_DONTWAIT)) != 0) {
 		non_blocking = true;
 	}
 	if (non_blocking) {
 		ssize_t amount;
 
 		inqueue_bytes = asoc->total_output_queue_size - (asoc->chunks_on_out_queue * SCTP_DATA_CHUNK_OVERHEAD(stcb));
 		if (user_marks_eor == 0) {
 			amount = sndlen;
 		} else {
 			amount = 1;
 		}
 		if ((SCTP_SB_LIMIT_SND(so) < (amount + inqueue_bytes + asoc->sb_send_resv)) ||
 		    (asoc->chunks_on_out_queue >= SCTP_BASE_SYSCTL(sctp_max_chunks_on_queue))) {
 			if ((sndlen > (ssize_t)SCTP_SB_LIMIT_SND(so)) &&
 			    (user_marks_eor == 0)) {
 				error = EMSGSIZE;
 			} else {
 				error = EWOULDBLOCK;
 			}
 			goto out_unlocked;
 		}
 	}
 	atomic_add_int(&asoc->sb_send_resv, (int)sndlen);
 	local_soresv = sndlen;
 
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 	/* Ok, we will attempt a msgsnd :> */
 	if (p != NULL) {
 		p->td_ru.ru_msgsnd++;
 	}
 	/* Calculate the maximum we can send */
 	inqueue_bytes = asoc->total_output_queue_size - (asoc->chunks_on_out_queue * SCTP_DATA_CHUNK_OVERHEAD(stcb));
 	if (SCTP_SB_LIMIT_SND(so) > inqueue_bytes) {
 		max_len = SCTP_SB_LIMIT_SND(so) - inqueue_bytes;
 	} else {
 		max_len = 0;
 	}
 	/* Unless E_EOR mode is on, we must make a send FIT in one call. */
 	if ((user_marks_eor == 0) &&
 	    (sndlen > (ssize_t)SCTP_SB_LIMIT_SND(stcb->sctp_socket))) {
 		/* It will NEVER fit. */
 		error = EMSGSIZE;
 		goto out_unlocked;
 	}
 	if (user_marks_eor != 0) {
 		local_add_more = (ssize_t)min(SCTP_SB_LIMIT_SND(so), SCTP_BASE_SYSCTL(sctp_add_more_threshold));
 	} else {
 		/*-
 		 * For non-eeor the whole message must fit in
 		 * the socket send buffer.
 		 */
 		local_add_more = sndlen;
 	}
 	if (non_blocking) {
 		goto skip_preblock;
 	}
 	if (((max_len <= local_add_more) && ((ssize_t)SCTP_SB_LIMIT_SND(so) >= local_add_more)) ||
 	    (max_len == 0) ||
 	    ((asoc->chunks_on_out_queue + asoc->stream_queue_cnt) >= SCTP_BASE_SYSCTL(sctp_max_chunks_on_queue))) {
 		/* No room right now! */
 		inqueue_bytes = asoc->total_output_queue_size - (asoc->chunks_on_out_queue * SCTP_DATA_CHUNK_OVERHEAD(stcb));
 		SOCKBUF_LOCK(&so->so_snd);
 		while ((SCTP_SB_LIMIT_SND(so) < (inqueue_bytes + local_add_more)) ||
 		    ((asoc->stream_queue_cnt + asoc->chunks_on_out_queue) >= SCTP_BASE_SYSCTL(sctp_max_chunks_on_queue))) {
 			SCTPDBG(SCTP_DEBUG_OUTPUT1, "pre_block limit:%u <(inq:%d + %zd) || (%d+%d > %d)\n",
 			    (unsigned int)SCTP_SB_LIMIT_SND(so),
 			    inqueue_bytes,
 			    local_add_more,
 			    asoc->stream_queue_cnt,
 			    asoc->chunks_on_out_queue,
 			    SCTP_BASE_SYSCTL(sctp_max_chunks_on_queue));
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_BLK_LOGGING_ENABLE) {
 				sctp_log_block(SCTP_BLOCK_LOG_INTO_BLKA, asoc, sndlen);
 			}
 			be.error = 0;
 			stcb->block_entry = &be;
 			SCTP_TCB_UNLOCK(stcb);
 			error = sbwait(so, SO_SND);
 			if (error == 0) {
 				if (so->so_error != 0) {
 					error = so->so_error;
 				}
 				if (be.error != 0) {
 					error = be.error;
 				}
 			}
 			SOCKBUF_UNLOCK(&so->so_snd);
 			SCTP_TCB_LOCK(stcb);
 			stcb->block_entry = NULL;
 			if (error != 0) {
 				goto out_unlocked;
 			}
 			if ((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) ||
 			    (asoc->state & SCTP_STATE_WAS_ABORTED)) {
 				if (asoc->state & SCTP_STATE_WAS_ABORTED) {
 					/*
 					 * XXX: Could also be ECONNABORTED,
 					 * not enough info.
 					 */
 					error = ECONNRESET;
 				} else {
 					error = ENOTCONN;
 				}
 				goto out_unlocked;
 			}
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_BLK_LOGGING_ENABLE) {
 				sctp_log_block(SCTP_BLOCK_LOG_OUTOF_BLK,
 				    asoc, asoc->total_output_queue_size);
 			}
 			inqueue_bytes = asoc->total_output_queue_size - (asoc->chunks_on_out_queue * SCTP_DATA_CHUNK_OVERHEAD(stcb));
 			SOCKBUF_LOCK(&so->so_snd);
 		}
 		if (SCTP_SB_LIMIT_SND(so) > inqueue_bytes) {
 			max_len = SCTP_SB_LIMIT_SND(so) - inqueue_bytes;
 		} else {
 			max_len = 0;
 		}
 		SOCKBUF_UNLOCK(&so->so_snd);
 	}
 
 skip_preblock:
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 	/*
 	 * sndlen covers for mbuf case uio_resid covers for the non-mbuf
 	 * case NOTE: uio will be null when top/mbuf is passed
 	 */
 	if (top == NULL) {
 		struct sctp_stream_queue_pending *sp;
 		struct sctp_stream_out *strm;
 		uint32_t sndout;
 
 		if ((asoc->stream_locked) &&
 		    (asoc->stream_locked_on != sinfo_stream)) {
 			error = EINVAL;
 			goto out;
 		}
 		strm = &asoc->strmout[sinfo_stream];
 		if (strm->last_msg_incomplete == 0) {
 	do_a_copy_in:
 			SCTP_TCB_UNLOCK(stcb);
 			sp = sctp_copy_it_in(stcb, asoc, sndrcvninfo, uio, net, max_len, user_marks_eor, &error);
 			SCTP_TCB_LOCK(stcb);
 			if ((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) ||
 			    (asoc->state & SCTP_STATE_WAS_ABORTED)) {
 				if (asoc->state & SCTP_STATE_WAS_ABORTED) {
 					/*
 					 * XXX: Could also be ECONNABORTED,
 					 * not enough info.
 					 */
 					error = ECONNRESET;
 				} else {
 					error = ENOTCONN;
 				}
 				goto out;
 			}
 			if (error != 0) {
 				goto out;
 			}
 			/*
 			 * Reject the sending of a new user message, if the
 			 * association is about to be shut down.
 			 */
 			if ((SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_SENT) ||
 			    (SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_RECEIVED) ||
 			    (SCTP_GET_STATE(stcb) == SCTP_STATE_SHUTDOWN_ACK_SENT) ||
 			    (asoc->state & SCTP_STATE_SHUTDOWN_PENDING)) {
 				if (sp->data != 0) {
 					sctp_m_freem(sp->data);
 					sp->data = NULL;
 					sp->tail_mbuf = NULL;
 					sp->length = 0;
 				}
 				if (sp->net != NULL) {
 					sctp_free_remote_addr(sp->net);
 					sp->net = NULL;
 				}
 				sctp_free_a_strmoq(stcb, sp, SCTP_SO_LOCKED);
 				error = EPIPE;
 				goto out_unlocked;
 			}
 			/* The out streams might be reallocated. */
 			strm = &asoc->strmout[sinfo_stream];
 			if (sp->msg_is_complete) {
 				strm->last_msg_incomplete = 0;
 				asoc->stream_locked = 0;
 			} else {
 				/*
 				 * Just got locked to this guy in case of an
 				 * interrupt.
 				 */
 				strm->last_msg_incomplete = 1;
 				if (asoc->idata_supported == 0) {
 					asoc->stream_locked = 1;
 					asoc->stream_locked_on = sinfo_stream;
 				}
 				sp->sender_all_done = 0;
 			}
 			sctp_snd_sb_alloc(stcb, sp->length);
 			atomic_add_int(&asoc->stream_queue_cnt, 1);
 			if (sinfo_flags & SCTP_UNORDERED) {
 				SCTP_STAT_INCR(sctps_sends_with_unord);
 			}
 			sp->processing = 1;
 			TAILQ_INSERT_TAIL(&strm->outqueue, sp, next);
 			asoc->ss_functions.sctp_ss_add_to_stream(stcb, asoc, strm, sp);
 		} else {
 			sp = TAILQ_LAST(&strm->outqueue, sctp_streamhead);
 			if (sp == NULL) {
 				/* ???? Huh ??? last msg is gone */
 #ifdef INVARIANTS
 				panic("Warning: Last msg marked incomplete, yet nothing left?");
 #else
 				SCTP_PRINTF("Warning: Last msg marked incomplete, yet nothing left?\n");
 				strm->last_msg_incomplete = 0;
 #endif
 				goto do_a_copy_in;
 			}
 			if (sp->processing != 0) {
 				error = EINVAL;
 				goto out;
 			} else {
 				sp->processing = 1;
 			}
 		}
 
 		KASSERT(stcb != NULL, ("stcb is NULL"));
 		SCTP_TCB_LOCK_ASSERT(stcb);
 		KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 		    ("Association about to be freed"));
 		KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 		    ("Association was aborted"));
 
 		while (uio->uio_resid > 0) {
 			/* How much room do we have? */
 			struct mbuf *new_tail, *mm;
 
 			inqueue_bytes = asoc->total_output_queue_size - (asoc->chunks_on_out_queue * SCTP_DATA_CHUNK_OVERHEAD(stcb));
 			if (SCTP_SB_LIMIT_SND(so) > inqueue_bytes) {
 				max_len = SCTP_SB_LIMIT_SND(so) - inqueue_bytes;
 			} else {
 				max_len = 0;
 			}
 			if ((max_len > (ssize_t)SCTP_BASE_SYSCTL(sctp_add_more_threshold)) ||
 			    ((max_len > 0) && (SCTP_SB_LIMIT_SND(so) < SCTP_BASE_SYSCTL(sctp_add_more_threshold))) ||
 			    (uio->uio_resid <= max_len)) {
 				SCTP_TCB_UNLOCK(stcb);
 				sndout = 0;
 				new_tail = NULL;
 				mm = sctp_copy_resume(uio, (int)max_len, user_marks_eor, &error, &sndout, &new_tail);
 				SCTP_TCB_LOCK(stcb);
 				if ((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) ||
 				    (asoc->state & SCTP_STATE_WAS_ABORTED)) {
 					/*
 					 * We need to get out. Peer probably
 					 * aborted.
 					 */
 					sctp_m_freem(mm);
 					if (asoc->state & SCTP_STATE_WAS_ABORTED) {
 						/*
 						 * XXX: Could also be
 						 * ECONNABORTED, not enough
 						 * info.
 						 */
 						error = ECONNRESET;
 					} else {
 						error = ENOTCONN;
 					}
 					goto out;
 				}
 				if ((mm == NULL) || (error != 0)) {
 					if (mm != NULL) {
 						sctp_m_freem(mm);
 					}
 					if (sp != NULL) {
 						sp->processing = 0;
 					}
 					goto out;
 				}
 				/* Update the mbuf and count */
 				if (sp->tail_mbuf != NULL) {
 					/* Tack it to the end. */
 					SCTP_BUF_NEXT(sp->tail_mbuf) = mm;
 				} else {
 					/* A stolen mbuf. */
 					sp->data = mm;
 				}
 				sp->tail_mbuf = new_tail;
 				sctp_snd_sb_alloc(stcb, sndout);
 				atomic_add_int(&sp->length, sndout);
 				if (sinfo_flags & SCTP_SACK_IMMEDIATELY) {
 					sp->sinfo_flags |= SCTP_SACK_IMMEDIATELY;
 				}
 
 				/* Did we reach EOR? */
 				if ((uio->uio_resid == 0) &&
 				    ((user_marks_eor == 0) ||
 				    (sinfo_flags & SCTP_EOF) ||
 				    (user_marks_eor && (sinfo_flags & SCTP_EOR)))) {
 					sp->msg_is_complete = 1;
 				} else {
 					sp->msg_is_complete = 0;
 				}
 			}
 
 			KASSERT(stcb != NULL, ("stcb is NULL"));
 			SCTP_TCB_LOCK_ASSERT(stcb);
 			KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 			    ("Association about to be freed"));
 			KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 			    ("Association was aborted"));
 
 			if (uio->uio_resid == 0) {
 				/* got it all? */
 				continue;
 			}
 			/* PR-SCTP? */
 			if ((asoc->prsctp_supported) && (asoc->sent_queue_cnt_removeable > 0)) {
 				/*
 				 * This is ugly but we must assure locking
 				 * order
 				 */
 				sctp_prune_prsctp(stcb, asoc, sndrcvninfo, (int)sndlen);
 				inqueue_bytes = asoc->total_output_queue_size - (asoc->chunks_on_out_queue * SCTP_DATA_CHUNK_OVERHEAD(stcb));
 				if (SCTP_SB_LIMIT_SND(so) > inqueue_bytes)
 					max_len = SCTP_SB_LIMIT_SND(so) - inqueue_bytes;
 				else
 					max_len = 0;
 				if (max_len > 0) {
 					continue;
 				}
 			}
 			/* wait for space now */
 			if (non_blocking) {
 				/* Non-blocking io in place out */
 				if (sp != NULL) {
 					sp->processing = 0;
 				}
 				goto skip_out_eof;
 			}
 			/* What about the INIT, send it maybe */
 			if (queue_only_for_init) {
 				if (SCTP_GET_STATE(stcb) == SCTP_STATE_OPEN) {
 					/* a collision took us forward? */
 					queue_only = 0;
 				} else {
 					NET_EPOCH_ENTER(et);
 					sctp_send_initiate(inp, stcb, SCTP_SO_LOCKED);
 					NET_EPOCH_EXIT(et);
 					SCTP_SET_STATE(stcb, SCTP_STATE_COOKIE_WAIT);
 					queue_only = 1;
 				}
 			}
 			if ((net->flight_size > net->cwnd) &&
 			    (asoc->sctp_cmt_on_off == 0)) {
 				SCTP_STAT_INCR(sctps_send_cwnd_avoid);
 				queue_only = 1;
 			} else if (asoc->ifp_had_enobuf) {
 				SCTP_STAT_INCR(sctps_ifnomemqueued);
 				if (net->flight_size > (2 * net->mtu)) {
 					queue_only = 1;
 				}
 				asoc->ifp_had_enobuf = 0;
 			}
 			un_sent = asoc->total_output_queue_size - asoc->total_flight;
 			if ((sctp_is_feature_off(inp, SCTP_PCB_FLAGS_NODELAY)) &&
 			    (asoc->total_flight > 0) &&
 			    (asoc->stream_queue_cnt < SCTP_MAX_DATA_BUNDLING) &&
 			    (un_sent < (int)(asoc->smallest_mtu - SCTP_MIN_OVERHEAD))) {
 				/*-
 				 * Ok, Nagle is set on and we have data outstanding.
 				 * Don't send anything and let SACKs drive out the
 				 * data unless we have a "full" segment to send.
 				 */
 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_NAGLE_LOGGING_ENABLE) {
 					sctp_log_nagle_event(stcb, SCTP_NAGLE_APPLIED);
 				}
 				SCTP_STAT_INCR(sctps_naglequeued);
 				nagle_applies = 1;
 			} else {
 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_NAGLE_LOGGING_ENABLE) {
 					if (sctp_is_feature_off(inp, SCTP_PCB_FLAGS_NODELAY))
 						sctp_log_nagle_event(stcb, SCTP_NAGLE_SKIPPED);
 				}
 				SCTP_STAT_INCR(sctps_naglesent);
 				nagle_applies = 0;
 			}
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_BLK_LOGGING_ENABLE) {
 				sctp_misc_ints(SCTP_CWNDLOG_PRESEND, queue_only_for_init, queue_only,
 				    nagle_applies, un_sent);
 				sctp_misc_ints(SCTP_CWNDLOG_PRESEND, asoc->total_output_queue_size,
 				    asoc->total_flight,
 				    asoc->chunks_on_out_queue, asoc->total_flight_count);
 			}
 			if (queue_only_for_init) {
 				queue_only_for_init = 0;
 			}
 			if ((queue_only == 0) && (nagle_applies == 0)) {
 				/*-
 				 * need to start chunk output
 				 * before blocking.. note that if
 				 * a lock is already applied, then
 				 * the input via the net is happening
 				 * and I don't need to start output :-D
 				 */
 				NET_EPOCH_ENTER(et);
 				sctp_chunk_output(inp, stcb,
 				    SCTP_OUTPUT_FROM_USR_SEND, SCTP_SO_LOCKED);
 				NET_EPOCH_EXIT(et);
 			}
 			/*-
 			 * This is a bit strange, but I think it will
 			 * work. The total_output_queue_size is locked and
 			 * protected by the TCB_LOCK, which we just released.
 			 * There is a race that can occur between releasing it
 			 * above, and me getting the socket lock, where sacks
 			 * come in but we have not put the SB_WAIT on the
 			 * so_snd buffer to get the wakeup. After the LOCK
 			 * is applied the sack_processing will also need to
 			 * LOCK the so->so_snd to do the actual sowwakeup(). So
 			 * once we have the socket buffer lock if we recheck the
 			 * size we KNOW we will get to sleep safely with the
 			 * wakeup flag in place.
 			 */
 			inqueue_bytes = asoc->total_output_queue_size - (asoc->chunks_on_out_queue * SCTP_DATA_CHUNK_OVERHEAD(stcb));
 			SOCKBUF_LOCK(&so->so_snd);
 			if (SCTP_SB_LIMIT_SND(so) <= (inqueue_bytes +
 			    min(SCTP_BASE_SYSCTL(sctp_add_more_threshold), SCTP_SB_LIMIT_SND(so)))) {
 				if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_BLK_LOGGING_ENABLE) {
 					sctp_log_block(SCTP_BLOCK_LOG_INTO_BLK,
 					    asoc, uio->uio_resid);
 				}
 				be.error = 0;
 				stcb->block_entry = &be;
 				SCTP_TCB_UNLOCK(stcb);
 				error = sbwait(so, SO_SND);
 				if (error == 0) {
 					if (so->so_error != 0)
 						error = so->so_error;
 					if (be.error != 0) {
 						error = be.error;
 					}
 				}
 				SOCKBUF_UNLOCK(&so->so_snd);
 				SCTP_TCB_LOCK(stcb);
 				stcb->block_entry = NULL;
 				if ((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) ||
 				    (asoc->state & SCTP_STATE_WAS_ABORTED)) {
 					if (asoc->state & SCTP_STATE_WAS_ABORTED) {
 						/*
 						 * XXX: Could also be
 						 * ECONNABORTED, not enough
 						 * info.
 						 */
 						error = ECONNRESET;
 					} else {
 						error = ENOTCONN;
 					}
 					goto out_unlocked;
 				}
 				if (error != 0) {
 					if (sp != NULL) {
 						sp->processing = 0;
 					}
 					goto out_unlocked;
 				}
 			} else {
 				SOCKBUF_UNLOCK(&so->so_snd);
 			}
 			if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_BLK_LOGGING_ENABLE) {
 				sctp_log_block(SCTP_BLOCK_LOG_OUTOF_BLK,
 				    asoc, asoc->total_output_queue_size);
 			}
 		}
 
 		KASSERT(stcb != NULL, ("stcb is NULL"));
 		SCTP_TCB_LOCK_ASSERT(stcb);
 		KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 		    ("Association about to be freed"));
 		KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 		    ("Association was aborted"));
 
 		/* The out streams might be reallocated. */
 		strm = &asoc->strmout[sinfo_stream];
 		if (sp != NULL) {
 			if (sp->msg_is_complete == 0) {
 				strm->last_msg_incomplete = 1;
 				if (asoc->idata_supported == 0) {
 					asoc->stream_locked = 1;
 					asoc->stream_locked_on = sinfo_stream;
 				}
 			} else {
 				sp->sender_all_done = 1;
 				strm->last_msg_incomplete = 0;
 				asoc->stream_locked = 0;
 			}
 			sp->processing = 0;
 		} else {
 			SCTP_PRINTF("Huh no sp TSNH?\n");
 			strm->last_msg_incomplete = 0;
 			asoc->stream_locked = 0;
 		}
 		if (uio->uio_resid == 0) {
 			got_all_of_the_send = true;
 		}
 	} else {
 		error = sctp_msg_append(stcb, net, top, sndrcvninfo);
 		top = NULL;
 		if ((sinfo_flags & SCTP_EOF) != 0) {
 			got_all_of_the_send = true;
 		}
 	}
 	if (error != 0) {
 		goto out;
 	}
 
 dataless_eof:
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 	/* EOF thing ? */
 	if ((sinfo_flags & SCTP_EOF) && got_all_of_the_send) {
 		SCTP_STAT_INCR(sctps_sends_with_eof);
 		error = 0;
 		if (TAILQ_EMPTY(&asoc->send_queue) &&
 		    TAILQ_EMPTY(&asoc->sent_queue) &&
 		    sctp_is_there_unsent_data(stcb, SCTP_SO_LOCKED) == 0) {
 			if ((*asoc->ss_functions.sctp_ss_is_user_msgs_incomplete) (stcb, asoc)) {
 				goto abort_anyway;
 			}
 			/* there is nothing queued to send, so I'm done... */
 			if ((SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_SENT) &&
 			    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_RECEIVED) &&
 			    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_ACK_SENT)) {
 				struct sctp_nets *netp;
 
 				/* only send SHUTDOWN the first time through */
 				if (SCTP_GET_STATE(stcb) == SCTP_STATE_OPEN) {
 					SCTP_STAT_DECR_GAUGE32(sctps_currestab);
 				}
 				SCTP_SET_STATE(stcb, SCTP_STATE_SHUTDOWN_SENT);
 				sctp_stop_timers_for_shutdown(stcb);
 				if (asoc->alternate != NULL) {
 					netp = asoc->alternate;
 				} else {
 					netp = asoc->primary_destination;
 				}
 				sctp_send_shutdown(stcb, netp);
 				sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWN, stcb->sctp_ep, stcb,
 				    netp);
 				sctp_timer_start(SCTP_TIMER_TYPE_SHUTDOWNGUARD, stcb->sctp_ep, stcb,
 				    NULL);
 			}
 		} else {
 			/*-
 			 * we still got (or just got) data to send, so set
 			 * SHUTDOWN_PENDING
 			 */
 			/*-
 			 * XXX sockets draft says that SCTP_EOF should be
 			 * sent with no data.  currently, we will allow user
 			 * data to be sent first and move to
 			 * SHUTDOWN-PENDING
 			 */
 			if ((SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_SENT) &&
 			    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_RECEIVED) &&
 			    (SCTP_GET_STATE(stcb) != SCTP_STATE_SHUTDOWN_ACK_SENT)) {
 				if ((*asoc->ss_functions.sctp_ss_is_user_msgs_incomplete) (stcb, asoc)) {
 					SCTP_ADD_SUBSTATE(stcb, SCTP_STATE_PARTIAL_MSG_LEFT);
 				}
 				SCTP_ADD_SUBSTATE(stcb, SCTP_STATE_SHUTDOWN_PENDING);
 				if (TAILQ_EMPTY(&asoc->send_queue) &&
 				    TAILQ_EMPTY(&asoc->sent_queue) &&
 				    (asoc->state & SCTP_STATE_PARTIAL_MSG_LEFT)) {
 					struct mbuf *op_err;
 					char msg[SCTP_DIAG_INFO_LEN];
 
 			abort_anyway:
 					if (free_cnt_applied) {
 						atomic_subtract_int(&asoc->refcnt, 1);
 						free_cnt_applied = false;
 					}
 					SCTP_SNPRINTF(msg, sizeof(msg),
 					    "%s:%d at %s", __FILE__, __LINE__, __func__);
 					op_err = sctp_generate_cause(SCTP_BASE_SYSCTL(sctp_diag_info_code),
 					    msg);
 					NET_EPOCH_ENTER(et);
 					sctp_abort_an_association(stcb->sctp_ep, stcb,
 					    op_err, false, SCTP_SO_LOCKED);
 					NET_EPOCH_EXIT(et);
 					stcb = NULL;
 					error = ECONNABORTED;
 					goto out;
 				}
 				sctp_feature_off(inp, SCTP_PCB_FLAGS_NODELAY);
 			}
 		}
 	}
 
 skip_out_eof:
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 	some_on_control = !TAILQ_EMPTY(&asoc->control_send_queue);
 	if (queue_only_for_init) {
 		if (SCTP_GET_STATE(stcb) == SCTP_STATE_OPEN) {
 			/* a collision took us forward? */
 			queue_only = 0;
 		} else {
 			NET_EPOCH_ENTER(et);
 			sctp_send_initiate(inp, stcb, SCTP_SO_LOCKED);
 			NET_EPOCH_EXIT(et);
 			SCTP_SET_STATE(stcb, SCTP_STATE_COOKIE_WAIT);
 			queue_only = 1;
 		}
 	}
 
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 	if ((net->flight_size > net->cwnd) &&
 	    (asoc->sctp_cmt_on_off == 0)) {
 		SCTP_STAT_INCR(sctps_send_cwnd_avoid);
 		queue_only = 1;
 	} else if (asoc->ifp_had_enobuf) {
 		SCTP_STAT_INCR(sctps_ifnomemqueued);
 		if (net->flight_size > (2 * net->mtu)) {
 			queue_only = 1;
 		}
 		asoc->ifp_had_enobuf = 0;
 	}
 	un_sent = asoc->total_output_queue_size - asoc->total_flight;
 	if ((sctp_is_feature_off(inp, SCTP_PCB_FLAGS_NODELAY)) &&
 	    (asoc->total_flight > 0) &&
 	    (asoc->stream_queue_cnt < SCTP_MAX_DATA_BUNDLING) &&
 	    (un_sent < (int)(asoc->smallest_mtu - SCTP_MIN_OVERHEAD))) {
 		/*-
 		 * Ok, Nagle is set on and we have data outstanding.
 		 * Don't send anything and let SACKs drive out the
 		 * data unless we have a "full" segment to send.
 		 */
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_NAGLE_LOGGING_ENABLE) {
 			sctp_log_nagle_event(stcb, SCTP_NAGLE_APPLIED);
 		}
 		SCTP_STAT_INCR(sctps_naglequeued);
 		nagle_applies = 1;
 	} else {
 		if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_NAGLE_LOGGING_ENABLE) {
 			if (sctp_is_feature_off(inp, SCTP_PCB_FLAGS_NODELAY))
 				sctp_log_nagle_event(stcb, SCTP_NAGLE_SKIPPED);
 		}
 		SCTP_STAT_INCR(sctps_naglesent);
 		nagle_applies = 0;
 	}
 	if (SCTP_BASE_SYSCTL(sctp_logging_level) & SCTP_BLK_LOGGING_ENABLE) {
 		sctp_misc_ints(SCTP_CWNDLOG_PRESEND, queue_only_for_init, queue_only,
 		    nagle_applies, un_sent);
 		sctp_misc_ints(SCTP_CWNDLOG_PRESEND, asoc->total_output_queue_size,
 		    asoc->total_flight,
 		    asoc->chunks_on_out_queue, asoc->total_flight_count);
 	}
 
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 	NET_EPOCH_ENTER(et);
 	if ((queue_only == 0) && (nagle_applies == 0) && (asoc->peers_rwnd && un_sent)) {
 		sctp_chunk_output(inp, stcb, SCTP_OUTPUT_FROM_USR_SEND, SCTP_SO_LOCKED);
 	} else if ((queue_only == 0) &&
 		    (asoc->peers_rwnd == 0) &&
 	    (asoc->total_flight == 0)) {
 		/* We get to have a probe outstanding */
 		sctp_chunk_output(inp, stcb, SCTP_OUTPUT_FROM_USR_SEND, SCTP_SO_LOCKED);
 	} else if (some_on_control) {
 		int num_out, reason;
 
 		/* Here we do control only */
 		(void)sctp_med_chunk_output(inp, stcb, asoc, &num_out,
 		    &reason, 1, 1, &now, &now_filled,
 		    sctp_get_frag_point(stcb),
 		    SCTP_SO_LOCKED);
 	}
 	NET_EPOCH_EXIT(et);
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "USR Send complete qo:%d prw:%d unsent:%d tf:%d cooq:%d toqs:%d err:%d\n",
 	    queue_only, asoc->peers_rwnd, un_sent,
 	    asoc->total_flight, asoc->chunks_on_out_queue,
 	    asoc->total_output_queue_size, error);
 
 	KASSERT(stcb != NULL, ("stcb is NULL"));
 	SCTP_TCB_LOCK_ASSERT(stcb);
 	KASSERT((asoc->state & SCTP_STATE_ABOUT_TO_BE_FREED) == 0,
 	    ("Association about to be freed"));
 	KASSERT((asoc->state & SCTP_STATE_WAS_ABORTED) == 0,
 	    ("Association was aborted"));
 
 out:
 out_unlocked:
 	if (create_lock_applied) {
 		SCTP_ASOC_CREATE_UNLOCK(inp);
 	}
 	if (stcb != NULL) {
 		if (local_soresv) {
 			atomic_subtract_int(&asoc->sb_send_resv, (int)sndlen);
 		}
 		if (free_cnt_applied) {
 			atomic_subtract_int(&asoc->refcnt, 1);
 		}
 		SCTP_TCB_UNLOCK(stcb);
 	}
 	if (top != NULL) {
 		sctp_m_freem(top);
 	}
 	if (control != NULL) {
 		sctp_m_freem(control);
 	}
 	SCTP_LTRACE_ERR_RET(inp, stcb, net, SCTP_FROM_SCTP_OUTPUT, error);
 	return (error);
 }
 
 /*
  * Append an AUTH chunk to the mbuf chain 'm' when the association needs one.
  *
  * The chain is handed back unchanged if any of m_end, auth_ret, offset or
  * stcb is NULL, if the association does not support AUTH, if 'chunk' is not
  * among the peer's chunk types requiring authentication, or if no mbuf can
  * be allocated.  Otherwise *offset receives the number of bytes that were
  * already in the chain (the position at which the AUTH chunk is inserted),
  * *auth_ret points at the new chunk header, and the value returned by
  * sctp_copy_mbufchain() is passed back to the caller.
  */
 struct mbuf *
 sctp_add_auth_chunk(struct mbuf *m, struct mbuf **m_end,
     struct sctp_auth_chunk **auth_ret, uint32_t *offset,
     struct sctp_tcb *stcb, uint8_t chunk)
 {
 	struct sctp_auth_chunk *auth_hdr;
 	struct mbuf *auth_mbuf, *walk;
 	uint32_t chain_bytes;
 	int auth_len;
 
 	if (m_end == NULL || auth_ret == NULL || offset == NULL ||
 	    stcb == NULL) {
 		return (m);
 	}
 	/* AUTH must be enabled and the peer must require it for this chunk. */
 	if (stcb->asoc.auth_supported == 0 ||
 	    !sctp_auth_is_required_chunk(chunk, stcb->asoc.peer_auth_chunks)) {
 		return (m);
 	}
 	auth_mbuf = sctp_get_mbuf_for_msg(sizeof(*auth_hdr), 0, M_NOWAIT, 1,
 	    MT_HEADER);
 	if (auth_mbuf == NULL) {
 		/* no mbufs available; hand the chain back untouched */
 		return (m);
 	}
 	/* leave headroom when the AUTH chunk starts a brand new chain */
 	if (m == NULL) {
 		SCTP_BUF_RESV_UF(auth_mbuf, SCTP_MIN_OVERHEAD);
 	}
 
 	/* build the fixed part of the AUTH chunk */
 	auth_hdr = mtod(auth_mbuf, struct sctp_auth_chunk *);
 	memset(auth_hdr, 0, sizeof(*auth_hdr));
 	auth_hdr->ch.chunk_type = SCTP_AUTHENTICATION;
 	auth_hdr->ch.chunk_flags = 0;
 	auth_len = sizeof(*auth_hdr) +
 	    sctp_get_hmac_digest_len(stcb->asoc.peer_hmac_id);
 	auth_hdr->ch.chunk_length = htons(auth_len);
 	auth_hdr->hmac_id = htons(stcb->asoc.peer_hmac_id);
 	/* the key id and the HMAC digest are filled in at send time */
 
 	/* the AUTH chunk lands right after whatever the chain holds now */
 	chain_bytes = 0;
 	walk = m;
 	while (walk != NULL) {
 		chain_bytes += SCTP_BUF_LEN(walk);
 		walk = SCTP_BUF_NEXT(walk);
 	}
 	*offset = chain_bytes;
 
 	/* account for the digest space and link the chunk into the chain */
 	SCTP_BUF_LEN(auth_mbuf) = auth_len;
 	m = sctp_copy_mbufchain(auth_mbuf, m, m_end, 1, auth_len, 0);
 	/* auth_ret was verified to be non-NULL on entry */
 	*auth_ret = auth_hdr;
 
 	return (m);
 }
 
 #ifdef INET6
 /*
  * Check whether the next hop of route 'ro' is one of the routers that
  * advertised the on-link prefix covering the IPv6 source address 'src6'.
  *
  * Returns 1 if sctp_cmpaddr() reports a match between the route's gateway
  * and one of the prefix's advertising routers; returns 0 if 'ro' or its
  * next hop is missing, 'src6' is not AF_INET6, no non-detached prefix
  * covers the address, or no advertising router matches.
  *
  * The prefix list is walked under ND6_RLOCK(); every exit taken after the
  * lock is acquired releases it before returning.
  */
 int
 sctp_v6src_match_nexthop(struct sockaddr_in6 *src6, sctp_route_t *ro)
 {
 	struct nd_prefix *pfx = NULL;
 	struct nd_pfxrouter *pfxrtr = NULL;
 	struct sockaddr_in6 gw6;
 
 	if (ro == NULL || ro->ro_nh == NULL || src6->sin6_family != AF_INET6)
 		return (0);
 
 	/* get prefix entry of address */
 	ND6_RLOCK();
 	LIST_FOREACH(pfx, &MODULE_GLOBAL(nd_prefix), ndpr_entry) {
 		/* detached prefixes are not considered */
 		if (pfx->ndpr_stateflags & NDPRF_DETACHED)
 			continue;
 		/* stop at the first prefix whose masked bits equal the source's */
 		if (IN6_ARE_MASKED_ADDR_EQUAL(&pfx->ndpr_prefix.sin6_addr,
 		    &src6->sin6_addr, &pfx->ndpr_mask))
 			break;
 	}
 	/* no prefix entry in the prefix list */
 	if (pfx == NULL) {
 		ND6_RUNLOCK();
 		SCTPDBG(SCTP_DEBUG_OUTPUT2, "No prefix entry for ");
 		SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, (struct sockaddr *)src6);
 		return (0);
 	}
 
 	/* NOTE(review): the address printed here is src6, not the prefix itself */
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "v6src_match_nexthop(), Prefix entry is ");
 	SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, (struct sockaddr *)src6);
 
 	/* search installed gateway from prefix entry */
 	LIST_FOREACH(pfxrtr, &pfx->ndpr_advrtrs, pfr_entry) {
 		/* wrap the router address in a sockaddr_in6 so it can be compared */
 		memset(&gw6, 0, sizeof(struct sockaddr_in6));
 		gw6.sin6_family = AF_INET6;
 		gw6.sin6_len = sizeof(struct sockaddr_in6);
 		memcpy(&gw6.sin6_addr, &pfxrtr->router->rtaddr,
 		    sizeof(struct in6_addr));
 		SCTPDBG(SCTP_DEBUG_OUTPUT2, "prefix router is ");
 		SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, (struct sockaddr *)&gw6);
 		SCTPDBG(SCTP_DEBUG_OUTPUT2, "installed router is ");
 		SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, &ro->ro_nh->gw_sa);
 		if (sctp_cmpaddr((struct sockaddr *)&gw6, &ro->ro_nh->gw_sa)) {
 			ND6_RUNLOCK();
 			SCTPDBG(SCTP_DEBUG_OUTPUT2, "pfxrouter is installed\n");
 			return (1);
 		}
 	}
 	ND6_RUNLOCK();
 	SCTPDBG(SCTP_DEBUG_OUTPUT2, "pfxrouter is not installed\n");
 	return (0);
 }
 #endif
 
 /*
  * Check whether the IPv4 source address 'sifa' and the gateway of route
  * 'ro' fall into the same network when both are masked with the netmask
  * of the interface address behind 'sifa'.
  *
  * Returns 1 when the two masked addresses are equal.  Returns 0 when they
  * differ, when 'ro' or its next hop is NULL, when 'sifa' is not an AF_INET
  * address, or when the kernel is built without INET.
  */
 int
 sctp_v4src_match_nexthop(struct sctp_ifa *sifa, sctp_route_t *ro)
 {
 #ifdef INET
 	struct sockaddr_in *netmask, *addr;
 	struct ifaddr *ifa;
 	struct in_addr src_net, gw_net;
 
 	if (ro == NULL || ro->ro_nh == NULL) {
 		return (0);
 	}
 	if (sifa->address.sa.sa_family != AF_INET) {
 		return (0);
 	}
 
 	ifa = (struct ifaddr *)sifa->ifa;
 	netmask = (struct sockaddr_in *)(ifa->ifa_netmask);
 
 	/* network part of the source address */
 	addr = &sifa->address.sin;
 	src_net.s_addr = (addr->sin_addr.s_addr & netmask->sin_addr.s_addr);
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "match_nexthop4: src address is ");
 	SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, &sifa->address.sa);
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "network address is %x\n", src_net.s_addr);
 
 	/* network part of the gateway, using the same mask */
 	addr = &ro->ro_nh->gw4_sa;
 	gw_net.s_addr = (addr->sin_addr.s_addr & netmask->sin_addr.s_addr);
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "match_nexthop4: nexthop is ");
 	SCTPDBG_ADDR(SCTP_DEBUG_OUTPUT2, &ro->ro_nh->gw_sa);
 	SCTPDBG(SCTP_DEBUG_OUTPUT1, "network address is %x\n", gw_net.s_addr);
 
 	if (src_net.s_addr != gw_net.s_addr) {
 		return (0);
 	}
 	return (1);
 #else
 	return (0);
 #endif
 }
diff --git a/sys/netinet/tcp_ecn.c b/sys/netinet/tcp_ecn.c
index 579c0b407ae1..b0902ec31272 100644
--- a/sys/netinet/tcp_ecn.c
+++ b/sys/netinet/tcp_ecn.c
@@ -1,618 +1,618 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1994, 1995
  *      The Regents of the University of California.  All rights reserved.
  * Copyright (c) 2007-2008,2010
  *      Swinburne University of Technology, Melbourne, Australia.
  * Copyright (c) 2009-2010 Lawrence Stewart <lstewart@freebsd.org>
  * Copyright (c) 2010 The FreeBSD Foundation
  * Copyright (c) 2010-2011 Juniper Networks, Inc.
  * Copyright (c) 2019 Richard Scheffenegger <srichard@netapp.com>
  * All rights reserved.
  *
  * Portions of this software were developed at the Centre for Advanced Internet
  * Architectures, Swinburne University of Technology, by Lawrence Stewart,
  * James Healy and David Hayes, made possible in part by a grant from the Cisco
  * University Research Program Fund at Community Foundation Silicon Valley.
  *
  * Portions of this software were developed at the Centre for Advanced
  * Internet Architectures, Swinburne University of Technology, Melbourne,
  * Australia by David Hayes under sponsorship from the FreeBSD Foundation.
  *
  * Portions of this software were developed by Robert N. M. Watson under
  * contract to Juniper Networks, Inc.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  *      @(#)tcp_ecn.c 8.12 (Berkeley) 5/24/95
  */
 
 /*
  * Utility functions to deal with Explicit Congestion Notification in TCP
  * implementing the essential parts of the Accurate ECN extension
  * https://tools.ietf.org/html/draft-ietf-tcpm-accurate-ecn-09
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include "opt_inet.h"
 #include "opt_inet6.h"
 
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/kernel.h>
 #include <sys/sysctl.h>
 #include <sys/malloc.h>
 #include <sys/mbuf.h>
 #include <sys/socket.h>
 #include <sys/socketvar.h>
 
 #include <machine/cpu.h>
 
 #include <vm/uma.h>
 
 #include <net/if.h>
 #include <net/if_var.h>
 #include <net/route.h>
 #include <net/vnet.h>
 
 #include <netinet/in.h>
 #include <netinet/in_systm.h>
 #include <netinet/ip.h>
 #include <netinet/in_var.h>
 #include <netinet/in_pcb.h>
 #include <netinet/ip_var.h>
 #include <netinet/ip6.h>
 #include <netinet/icmp6.h>
 #include <netinet6/nd6.h>
 #include <netinet6/ip6_var.h>
 #include <netinet6/in6_pcb.h>
 #include <netinet/tcp.h>
 #include <netinet/tcp_fsm.h>
 #include <netinet/tcp_seq.h>
 #include <netinet/tcp_var.h>
 #include <netinet/tcp_syncache.h>
 #include <netinet/tcp_timer.h>
 #include <netinet/tcpip.h>
 #include <netinet/tcp_ecn.h>
 
 static SYSCTL_NODE(_net_inet_tcp, OID_AUTO, ecn,
     CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
     "TCP ECN");
 
 VNET_DEFINE(int, tcp_do_ecn) = 2;
 SYSCTL_INT(_net_inet_tcp_ecn, OID_AUTO, enable,
     CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(tcp_do_ecn), 0,
     "TCP ECN support");
 
 VNET_DEFINE(int, tcp_ecn_maxretries) = 1;
 SYSCTL_INT(_net_inet_tcp_ecn, OID_AUTO, maxretries,
     CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(tcp_ecn_maxretries), 0,
     "Max retries before giving up on ECN");
 
 /*
  * Process incoming SYN,ACK packet
  */
 void
 tcp_ecn_input_syn_sent(struct tcpcb *tp, uint16_t thflags, int iptos)
 {
 
 	if (V_tcp_do_ecn == 0)
 		return;
 	if ((V_tcp_do_ecn == 1) ||
 	    (V_tcp_do_ecn == 2)) {
 		/* RFC3168 ECN handling */
 		if ((thflags & (TH_CWR | TH_ECE)) == (0 | TH_ECE)) {
 			tp->t_flags2 |= TF2_ECN_PERMIT;
 			tp->t_flags2 &= ~TF2_ACE_PERMIT;
 			TCPSTAT_INC(tcps_ecn_shs);
 		}
 	} else
 	/* decoding Accurate ECN according to table in section 3.1.1 */
 	if ((V_tcp_do_ecn == 3) ||
 	    (V_tcp_do_ecn == 4)) {
 		/*
 		 * on the SYN,ACK, process the AccECN
 		 * flags indicating the state the SYN
 		 * was delivered.
 		 * Reactions to Path ECN mangling can
 		 * come here.
 		 */
 		switch (thflags & (TH_AE | TH_CWR | TH_ECE)) {
 		/* RFC3168 SYN */
 		case (0|0|TH_ECE):
 			tp->t_flags2 |= TF2_ECN_PERMIT;
 			tp->t_flags2 &= ~TF2_ACE_PERMIT;
 			TCPSTAT_INC(tcps_ecn_shs);
 			break;
 		/* non-ECT SYN */
 		case (0|TH_CWR|0):
 			tp->t_flags2 |= TF2_ACE_PERMIT;
 			tp->t_flags2 &= ~TF2_ECN_PERMIT;
 			tp->t_scep = 5;
 			TCPSTAT_INC(tcps_ecn_shs);
 			TCPSTAT_INC(tcps_ace_nect);
 			break;
 		/* ECT0 SYN */
 		case (TH_AE|0|0):
 			tp->t_flags2 |= TF2_ACE_PERMIT;
 			tp->t_flags2 &= ~TF2_ECN_PERMIT;
 			tp->t_scep = 5;
 			TCPSTAT_INC(tcps_ecn_shs);
 			TCPSTAT_INC(tcps_ace_ect0);
 			break;
 		/* ECT1 SYN */
 		case (0|TH_CWR|TH_ECE):
 			tp->t_flags2 |= TF2_ACE_PERMIT;
 			tp->t_flags2 &= ~TF2_ECN_PERMIT;
 			tp->t_scep = 5;
 			TCPSTAT_INC(tcps_ecn_shs);
 			TCPSTAT_INC(tcps_ace_ect1);
 			break;
 		/* CE SYN */
 		case (TH_AE|TH_CWR|0):
 			tp->t_flags2 |= TF2_ACE_PERMIT;
 			tp->t_flags2 &= ~TF2_ECN_PERMIT;
 			tp->t_scep = 6;
 			/*
 			 * reduce the IW to 2 MSS (to
 			 * account for delayed acks) if
 			 * the SYN,ACK was CE marked
 			 */
 			tp->snd_cwnd = 2 * tcp_maxseg(tp);
 			TCPSTAT_INC(tcps_ecn_shs);
 			TCPSTAT_INC(tcps_ace_nect);
 			break;
 		default:
 			tp->t_flags2 &= ~(TF2_ECN_PERMIT | TF2_ACE_PERMIT);
 			break;
 		}
 		/*
 		 * Set the AccECN Codepoints on
 		 * the outgoing <ACK> to the ECN
 		 * state of the <SYN,ACK>
 		 * according to table 3 in the
 		 * AccECN draft
 		 */
 		switch (iptos & IPTOS_ECN_MASK) {
 		case (IPTOS_ECN_NOTECT):
 			tp->t_rcep = 0b010;
 			break;
 		case (IPTOS_ECN_ECT0):
 			tp->t_rcep = 0b100;
 			break;
 		case (IPTOS_ECN_ECT1):
 			tp->t_rcep = 0b011;
 			break;
 		case (IPTOS_ECN_CE):
 			tp->t_rcep = 0b110;
 			break;
 		}
 	}
 }
 
 /*
  * ECN negotiation for a simultaneous open: a <SYN> without ACK arrives
  * while our own <SYN> is outstanding.
  *
  * Segments carrying TH_ACK are ignored, as is everything when
  * V_tcp_do_ecn is 0.  With V_tcp_do_ecn 1 or 2 only a classic RFC3168
  * ECN-setup SYN (CWR and ECE both set) is honoured.  With V_tcp_do_ecn
  * 3 or 4 the AE/CWR/ECE bits select between classic ECN, AccECN, or no
  * ECN at all; for AccECN, t_rcep is seeded from the IP ECN codepoint of
  * the received SYN.
  */
 void
 tcp_ecn_input_parallel_syn(struct tcpcb *tp, uint16_t thflags, int iptos)
 {
 	int syn_bits;
 
 	if ((thflags & TH_ACK) != 0 || V_tcp_do_ecn == 0)
 		return;
 
 	if (V_tcp_do_ecn == 1 || V_tcp_do_ecn == 2) {
 		/* RFC3168 ECN handling */
 		if ((thflags & (TH_CWR | TH_ECE)) == (TH_CWR | TH_ECE)) {
 			tp->t_flags2 &= ~TF2_ACE_PERMIT;
 			tp->t_flags2 |= (TF2_ECN_PERMIT | TF2_ECN_SND_ECE);
 			TCPSTAT_INC(tcps_ecn_shs);
 		}
 		return;
 	}
 	if (V_tcp_do_ecn != 3 && V_tcp_do_ecn != 4)
 		return;
 
 	/* AccECN handling */
 	syn_bits = thflags & (TH_AE | TH_CWR | TH_ECE);
 	if (syn_bits == (TH_CWR | TH_ECE)) {
 		/* peer asked for classic ECN */
 		tp->t_flags2 &= ~TF2_ACE_PERMIT;
 		tp->t_flags2 |= (TF2_ECN_PERMIT | TF2_ECN_SND_ECE);
 		TCPSTAT_INC(tcps_ecn_shs);
 	} else if (syn_bits == (TH_AE | TH_CWR | TH_ECE)) {
 		/* peer asked for AccECN */
 		tp->t_flags2 |= TF2_ACE_PERMIT;
 		tp->t_flags2 &= ~TF2_ECN_PERMIT;
 		TCPSTAT_INC(tcps_ecn_shs);
 		/*
 		 * Seed the AccECN codepoint for the outgoing
 		 * segment from the IP ECN field of the received
 		 * one, per table 3 of the AccECN draft.
 		 */
 		switch (iptos & IPTOS_ECN_MASK) {
 		case IPTOS_ECN_NOTECT:
 			tp->t_rcep = 0b010;
 			break;
 		case IPTOS_ECN_ECT0:
 			tp->t_rcep = 0b100;
 			break;
 		case IPTOS_ECN_ECT1:
 			tp->t_rcep = 0b011;
 			break;
 		case IPTOS_ECN_CE:
 			tp->t_rcep = 0b110;
 			break;
 		}
 	} else {
 		/* no flags or an unrecognised combination: no ECN at all */
 		tp->t_flags2 &= ~(TF2_ECN_PERMIT | TF2_ACE_PERMIT);
 	}
 }
 
 /*
  * TCP ECN processing for a received segment.
  *
  * tp       connection control block (t_flags, t_flags2, t_rcep, t_scep
  *          and possibly snd_cwnd are updated)
  * thflags  TCP header flags of the segment
  * tlen     not referenced in this function
  * pkts     compared against the raw ACE delta in AccECN mode to adjust
  *          the delta before it is applied
  * iptos    IP TOS/traffic class byte; only the ECN bits are used
  *
  * The received IP ECN codepoint is always counted in the TCP statistics.
  * The remaining processing, including the call to
  * cc_ecnpkt_handler_flags(), happens only when TF2_ECN_PERMIT or
  * TF2_ACE_PERMIT is set on the connection.
  *
  * Returns the CE delta computed for this segment (0 when none was
  * computed).
  */
 int
 tcp_ecn_input_segment(struct tcpcb *tp, uint16_t thflags, int tlen, int pkts, int iptos)
 {
 	int delta_cep = 0;
 
 	/* account the IP ECN codepoint regardless of negotiation state */
 	switch (iptos & IPTOS_ECN_MASK) {
 	case IPTOS_ECN_CE:
 		TCPSTAT_INC(tcps_ecn_rcvce);
 		break;
 	case IPTOS_ECN_ECT0:
 		TCPSTAT_INC(tcps_ecn_rcvect0);
 		break;
 	case IPTOS_ECN_ECT1:
 		TCPSTAT_INC(tcps_ecn_rcvect1);
 		break;
 	}
 
 	if (tp->t_flags2 & (TF2_ECN_PERMIT | TF2_ACE_PERMIT)) {
 		if (tp->t_flags2 & TF2_ACE_PERMIT) {
 			/* AccECN: count CE marks we received */
 			if ((iptos & IPTOS_ECN_MASK) == IPTOS_ECN_CE)
 				tp->t_rcep += 1;
 			/*
 			 * With TF2_ACE_PERMIT set, TF2_ECN_PERMIT is only set
 			 * at the end of the else branch below, so that branch
 			 * runs until the handshake ACK has been processed.
 			 */
 			if (tp->t_flags2 & TF2_ECN_PERMIT) {
 				/* ACE field minus our counter, modulo 8 */
 				delta_cep = (tcp_ecn_get_ace(thflags) + 8 -
 					    (tp->t_scep & 7)) & 7;
 				/*
 				 * If the 3-bit delta is smaller than pkts,
 				 * replace it with the largest value not
 				 * above pkts that is congruent to it mod 8.
 				 */
 				if (delta_cep < pkts)
 					delta_cep = pkts -
 					    ((pkts - delta_cep) & 7);
 				tp->t_scep += delta_cep;
 			} else {
 				/*
 				 * process the final ACK of the 3WHS
 				 * see table 3 in draft-ietf-tcpm-accurate-ecn
 				 */
 				switch (tcp_ecn_get_ace(thflags)) {
 				case 0b010:
 					/* nonECT SYN or SYN,ACK */
-					/* Fallthrough */
+					/* FALLTHROUGH */
 				case 0b011:
 					/* ECT1 SYN or SYN,ACK */
-					/* Fallthrough */
+					/* FALLTHROUGH */
 				case 0b100:
 					/* ECT0 SYN or SYN,ACK */
 					tp->t_scep = 5;
 					break;
 				case 0b110:
 					/* CE SYN or SYN,ACK */
 					tp->t_scep = 6;
 					/* CE-marked handshake: start with a 2 segment window */
 					tp->snd_cwnd = 2 * tcp_maxseg(tp);
 					break;
 				default:
 					/* mangled AccECN handshake */
 					tp->t_scep = 5;
 					break;
 				}
 				/* handshake ACK consumed; use the counter path from now on */
 				tp->t_flags2 |= TF2_ECN_PERMIT;
 			}
 		} else {
 			/* RFC3168 ECN handling */
 			/* ECE on a non-SYN segment counts as one CE indication */
 			if ((thflags & (TH_SYN | TH_ECE)) == TH_ECE) {
 				delta_cep = 1;
 				tp->t_scep++;
 			}
 			/* CWR from the peer: stop echoing ECE and ACK right away */
 			if (thflags & TH_CWR) {
 				tp->t_flags2 &= ~TF2_ECN_SND_ECE;
 				tp->t_flags |= TF_ACKNOW;
 			}
 			/* a CE mark on this segment (re)arms the ECE echo */
 			if ((iptos & IPTOS_ECN_MASK) == IPTOS_ECN_CE)
 				tp->t_flags2 |= TF2_ECN_SND_ECE;
 		}
 
 		/* Process a packet differently from RFC3168. */
 		cc_ecnpkt_handler_flags(tp, thflags, iptos);
 	}
 
 	return delta_cep;
 }
 
 /*
  * Pick the ECN setup flags to put on an outgoing <SYN>.
  *
  * V_tcp_do_ecn 1 requests classic RFC3168 ECN (ECE|CWR) and 3 requests
  * Accurate ECN (ECE|CWR|AE); every other setting sends no ECN flags.
  * On retransmissions (t_rxtshift >= 1) the flags are only offered while
  * t_rxtshift does not exceed V_tcp_ecn_maxretries.
  */
 uint16_t
 tcp_ecn_output_syn_sent(struct tcpcb *tp)
 {
 	uint16_t syn_flags;
 
 	switch (V_tcp_do_ecn) {
 	case 1:
 		/* RFC3168 ECN setup <SYN> */
 		syn_flags = TH_ECE|TH_CWR;
 		break;
 	case 3:
 		/* Accurate ECN setup <SYN> */
 		syn_flags = TH_ECE|TH_CWR|TH_AE;
 		break;
 	default:
 		return (0);
 	}
 
 	/* too many retransmitted SYNs: fall back to a non-ECN SYN */
 	if (tp->t_rxtshift >= 1 && tp->t_rxtshift > V_tcp_ecn_maxretries)
 		return (0);
 
 	return (syn_flags);
 }
 
 /*
  * ECN output processing for a segment on an established connection.
  *
  * tp       connection control block
  * thflags  in/out: TCP header flags of the segment being built; the ECN
  *          related bits (AE/CWR/ECE) are adjusted here
  * len      payload length of the segment
  * rxmit    true when the segment is a retransmission
  *
  * Returns the IP ECN codepoint to place in the IP header: ECT(0) or
  * ECT(1) for new data, IPTOS_ECN_NOTECT otherwise.
  */
 int
 tcp_ecn_output_established(struct tcpcb *tp, uint16_t *thflags, int len, bool rxmit)
 {
 	bool is_new_data;
 	int codepoint;
 
 	/*
 	 * Only new data is marked ECN capable: pure control
 	 * segments, retransmissions and one byte forced
 	 * window probes are left unmarked.
 	 */
 	is_new_data = (len > 0 && SEQ_GEQ(tp->snd_nxt, tp->snd_max) &&
 	    !rxmit &&
 	    ((tp->t_flags & TF_FORCEDATA) == 0 || len != 1));
 
 	if (!is_new_data) {
 		codepoint = IPTOS_ECN_NOTECT;
 	} else if (tp->t_flags2 & TF2_ECN_USE_ECT1) {
 		codepoint = IPTOS_ECN_ECT1;
 		TCPSTAT_INC(tcps_ecn_sndect1);
 	} else {
 		codepoint = IPTOS_ECN_ECT0;
 		TCPSTAT_INC(tcps_ecn_sndect0);
 	}
 
 	if ((tp->t_flags2 & TF2_ACE_PERMIT) == 0) {
 		/* classic ECN: CWR goes out once, on new data only */
 		if (is_new_data && (tp->t_flags2 & TF2_ECN_SND_CWR)) {
 			*thflags |= TH_CWR;
 			tp->t_flags2 &= ~TF2_ECN_SND_CWR;
 		}
 		/* keep echoing ECE while it is pending */
 		if (tp->t_flags2 & TF2_ECN_SND_ECE)
 			*thflags |= TH_ECE;
 		return (codepoint);
 	}
 
 	/* AccECN: the low three bits of t_rcep travel in AE/CWR/ECE */
 	*thflags &= ~(TH_AE|TH_CWR|TH_ECE);
 	if (tp->t_rcep & 0x04)
 		*thflags |= TH_AE;
 	if (tp->t_rcep & 0x02)
 		*thflags |= TH_CWR;
 	if (tp->t_rcep & 0x01)
 		*thflags |= TH_ECE;
 
 	if ((tp->t_flags2 & TF2_ECN_PERMIT) == 0) {
 		/*
 		 * This is the final ACK of the 3WHS: now that the
 		 * handshake encoding has been emitted, switch
 		 * t_rcep over to its initial counter value.
 		 */
 		tp->t_rcep = (tp->t_rcep == 0b110) ? 6 : 5;
 		tp->t_flags2 |= TF2_ECN_PERMIT;
 	}
 
 	return (codepoint);
 }
 
 /*
  * Set up the ECN related tcpcb fields from
  * a syncache entry
  *
  * tp  control block of the newly created connection
  * sc  syncache entry; only the bits of sc_flags selected by
  *     SCF_ECN_MASK are examined
  *
  * SCF_ECN enables classic ECN (TF2_ECN_PERMIT).  The SCF_ACE_* values
  * enable AccECN (TF2_ACE_PERMIT) and initialise both CE counters to 5,
  * or to 6 for SCF_ACE_CE.  Nothing is changed when no ECN bits are set
  * or the value is not one of the known codepoints.
  */
 void
 tcp_ecn_syncache_socket(struct tcpcb *tp, struct syncache *sc)
 {
 	if (sc->sc_flags & SCF_ECN_MASK) {
 		switch (sc->sc_flags & SCF_ECN_MASK) {
 		case SCF_ECN:
 			tp->t_flags2 |= TF2_ECN_PERMIT;
 			break;
 		case SCF_ACE_N:
-			/* Fallthrough */
+			/* FALLTHROUGH */
 		case SCF_ACE_0:
-			/* Fallthrough */
+			/* FALLTHROUGH */
 		case SCF_ACE_1:
 			/* the three non-CE AccECN states share the same setup */
 			tp->t_flags2 |= TF2_ACE_PERMIT;
 			tp->t_scep = 5;
 			tp->t_rcep = 5;
 			break;
 		case SCF_ACE_CE:
 			/* CE state: both counters start one higher */
 			tp->t_flags2 |= TF2_ACE_PERMIT;
 			tp->t_scep = 6;
 			tp->t_rcep = 6;
 			break;
 		/* undefined SCF codepoint */
 		default:
 			break;
 		}
 	}
 }
 
 /*
  * Derive the syncache ECN flags for a received <SYN>.
  *
  * thflags  TCP header flags of the SYN (AE/CWR/ECE are examined)
  * iptos    IP TOS/traffic class byte of the SYN (ECN bits are examined)
  *
  * The IP ECN codepoint is counted in the TCP statistics first.  The
  * return value is 0 for a SYN without ECN flags, SCF_ECN for a classic
  * ECN setup SYN, and otherwise depends on V_tcp_do_ecn: with AccECN
  * enabled (3 or 4) any other flag combination yields the SCF_ACE_*
  * value matching the IP ECN codepoint; with AccECN disabled a full
  * AE|CWR|ECE SYN is treated as classic ECN and everything else as no
  * ECN.
  */
 int
 tcp_ecn_syncache_add(uint16_t thflags, int iptos)
 {
 	int ip_ecn, syn_bits;
 
 	ip_ecn = iptos & IPTOS_ECN_MASK;
 	syn_bits = thflags & (TH_AE|TH_CWR|TH_ECE);
 
 	/* statistics on the received IP ECN codepoint */
 	if (ip_ecn == IPTOS_ECN_CE) {
 		TCPSTAT_INC(tcps_ecn_rcvce);
 	} else if (ip_ecn == IPTOS_ECN_ECT0) {
 		TCPSTAT_INC(tcps_ecn_rcvect0);
 	} else if (ip_ecn == IPTOS_ECN_ECT1) {
 		TCPSTAT_INC(tcps_ecn_rcvect1);
 	}
 
 	/* no ECN */
 	if (syn_bits == (0|0|0))
 		return (0);
 	/* legacy ECN */
 	if (syn_bits == (0|TH_CWR|TH_ECE))
 		return (SCF_ECN);
 
 	if (V_tcp_do_ecn != 3 && V_tcp_do_ecn != 4) {
 		/*
 		 * AccECN is disabled: a proper AccECN SYN is answered
 		 * as classic ECN, any other combination as no ECN.
 		 */
 		if (syn_bits == (TH_AE|TH_CWR|TH_ECE))
 			return (SCF_ECN);
 		return (0);
 	}
 
 	/*
 	 * AccECN is enabled.  Both the AccECN SYN and the default
 	 * case (section 3.1.2) record the IP ECN codepoint that
 	 * the SYN arrived with.
 	 */
 	switch (ip_ecn) {
 	case IPTOS_ECN_CE:
 		return (SCF_ACE_CE);
 	case IPTOS_ECN_ECT0:
 		return (SCF_ACE_0);
 	case IPTOS_ECN_ECT1:
 		return (SCF_ACE_1);
 	case IPTOS_ECN_NOTECT:
 		return (SCF_ACE_N);
 	default:
 		return (0);
 	}
 }
 
 /*
  * Add the ECN flags for a <SYN,ACK> built from a syncache entry.
  *
  * thflags  header flags assembled so far; returned with the ECN bits
  *          added
  * sc       syncache entry whose SCF_ECN_MASK bits select the reply
  *
  * Segments without TH_SYN and entries without any ECN state are passed
  * through unchanged.  Every recognised codepoint also bumps the
  * handshake statistics.
  */
 uint16_t
 tcp_ecn_syncache_respond(uint16_t thflags, struct syncache *sc)
 {
 	if ((thflags & TH_SYN) == 0 ||
 	    (sc->sc_flags & SCF_ECN_MASK) == 0)
 		return (thflags);
 
 	switch (sc->sc_flags & SCF_ECN_MASK) {
 	case SCF_ECN:
 		/* classic ECN: ECE only */
 		TCPSTAT_INC(tcps_ecn_shs);
 		thflags |= TH_ECE;
 		break;
 	case SCF_ACE_N:
 		/* AccECN, SYN arrived not-ECT: CWR only */
 		TCPSTAT_INC(tcps_ecn_shs);
 		TCPSTAT_INC(tcps_ace_nect);
 		thflags |= TH_CWR;
 		break;
 	case SCF_ACE_0:
 		/* AccECN, SYN arrived ECT(0): AE only */
 		TCPSTAT_INC(tcps_ecn_shs);
 		TCPSTAT_INC(tcps_ace_ect0);
 		thflags |= TH_AE;
 		break;
 	case SCF_ACE_1:
 		/* AccECN, SYN arrived ECT(1): CWR and ECE */
 		TCPSTAT_INC(tcps_ecn_shs);
 		TCPSTAT_INC(tcps_ace_ect1);
 		thflags |= (TH_ECE | TH_CWR);
 		break;
 	case SCF_ACE_CE:
 		/* AccECN, SYN arrived CE: AE and CWR */
 		TCPSTAT_INC(tcps_ecn_shs);
 		TCPSTAT_INC(tcps_ace_ce);
 		thflags |= (TH_AE | TH_CWR);
 		break;
 	default:
 		/* undefined SCF codepoint */
 		break;
 	}
 	return (thflags);
 }
 
 /*
  * Assemble the 3-bit ACE value from the TCP header flags:
  * TH_AE contributes 4, TH_CWR contributes 2 and TH_ECE contributes 1.
  */
 int
 tcp_ecn_get_ace(uint16_t thflags)
 {
 	return (((thflags & TH_AE) ? 4 : 0) |
 	    ((thflags & TH_CWR) ? 2 : 0) |
 	    ((thflags & TH_ECE) ? 1 : 0));
 }
diff --git a/sys/netinet/tcp_log_buf.c b/sys/netinet/tcp_log_buf.c
index e0334c69b46f..be15c6735fca 100644
--- a/sys/netinet/tcp_log_buf.c
+++ b/sys/netinet/tcp_log_buf.c
@@ -1,2974 +1,2974 @@
 
 /*-
  * SPDX-License-Identifier: BSD-2-Clause
  *
  * Copyright (c) 2016-2018 Netflix, Inc.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include "opt_inet.h"
 #include <sys/param.h>
 #include <sys/arb.h>
 #include <sys/hash.h>
 #include <sys/kernel.h>
 #include <sys/lock.h>
 #include <sys/malloc.h>
 #include <sys/mutex.h>
 #include <sys/qmath.h>
 #include <sys/queue.h>
 #include <sys/refcount.h>
 #include <sys/rwlock.h>
 #include <sys/socket.h>
 #include <sys/socketvar.h>
 #include <sys/sysctl.h>
 #include <sys/tree.h>
 #include <sys/stats.h> /* Must come after qmath.h and tree.h */
 #include <sys/counter.h>
 #include <dev/tcp_log/tcp_log_dev.h>
 
 #include <net/if.h>
 #include <net/if_var.h>
 #include <net/vnet.h>
 
 #include <netinet/in.h>
 #include <netinet/in_pcb.h>
 #include <netinet/in_var.h>
 #include <netinet/tcp_var.h>
 #include <netinet/tcp_log_buf.h>
 #include <netinet/tcp_seq.h>
 #include <netinet/tcp_hpts.h>
 
 /* Default expiry time */
 #define	TCP_LOG_EXPIRE_TIME	((sbintime_t)60 * SBT_1S)
 
 /* Max interval at which to run the expiry timer */
 #define	TCP_LOG_EXPIRE_INTVL	((sbintime_t)5 * SBT_1S)
 
 bool	tcp_log_verbose;
 static uma_zone_t tcp_log_id_bucket_zone, tcp_log_id_node_zone, tcp_log_zone;
 static int	tcp_log_session_limit = TCP_LOG_BUF_DEFAULT_SESSION_LIMIT;
 static uint32_t	tcp_log_version = TCP_LOG_BUF_VER;
 RB_HEAD(tcp_log_id_tree, tcp_log_id_bucket);
 static struct tcp_log_id_tree tcp_log_id_head;
 static STAILQ_HEAD(, tcp_log_id_node) tcp_log_expireq_head =
     STAILQ_HEAD_INITIALIZER(tcp_log_expireq_head);
 static struct mtx tcp_log_expireq_mtx;
 static struct callout tcp_log_expireq_callout;
 static u_long tcp_log_auto_ratio = 0;
 static volatile u_long tcp_log_auto_ratio_cur = 0;
 static uint32_t tcp_log_auto_mode = TCP_LOG_STATE_TAIL;
 static bool tcp_log_auto_all = false;
 static uint32_t tcp_disable_all_bb_logs = 0;
 
 RB_PROTOTYPE_STATIC(tcp_log_id_tree, tcp_log_id_bucket, tlb_rb, tcp_log_id_cmp)
 
 SYSCTL_NODE(_net_inet_tcp, OID_AUTO, bb, CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
     "TCP Black Box controls");
 
 SYSCTL_NODE(_net_inet_tcp_bb, OID_AUTO, tp, CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
     "TCP Black Box Trace Point controls");
 
 SYSCTL_BOOL(_net_inet_tcp_bb, OID_AUTO, log_verbose, CTLFLAG_RW, &tcp_log_verbose,
     0, "Force verbose logging for TCP traces");
 
 SYSCTL_INT(_net_inet_tcp_bb, OID_AUTO, log_session_limit,
     CTLFLAG_RW, &tcp_log_session_limit, 0,
     "Maximum number of events maintained for each TCP session");
 
 /*
  * Trace point controls, exported under the "tp" node declared above.
  *
  * NOTE(review): all three SYSCTL_U32() invocations below pass
  * TCP_LOG_STATE_HEAD_AUTO as the value argument, whereas the other
  * SYSCTL_U32() uses in this file pass 0 -- confirm this is intended.
  */
 
 /* Trace point number to activate; initialised to 0. */
 uint32_t tcp_trace_point_config = 0;
 SYSCTL_U32(_net_inet_tcp_bb_tp, OID_AUTO, number, CTLFLAG_RW,
     &tcp_trace_point_config, TCP_LOG_STATE_HEAD_AUTO,
     "What is the trace point number to activate (0=none, 0xffffffff = all)?");
 
 /* Logging mode used for trace points; initialised to TCP_LOG_STATE_CONTINUAL. */
 uint32_t tcp_trace_point_bb_mode = TCP_LOG_STATE_CONTINUAL;
 SYSCTL_U32(_net_inet_tcp_bb_tp, OID_AUTO, bbmode, CTLFLAG_RW,
     &tcp_trace_point_bb_mode, TCP_LOG_STATE_HEAD_AUTO,
     "What is BB logging mode that is activated?");
 
 /*
  * Connection budget for trace-point logging; initialised to 0.
  * NOTE(review): declared int32_t but exported through SYSCTL_U32 --
  * confirm the signed/unsigned mismatch is intended.
  */
 int32_t tcp_trace_point_count = 0;
 SYSCTL_U32(_net_inet_tcp_bb_tp, OID_AUTO, count, CTLFLAG_RW,
     &tcp_trace_point_count, TCP_LOG_STATE_HEAD_AUTO,
     "How many connections will have BB logging turned on that hit the tracepoint?");
 
 
 
 SYSCTL_UMA_MAX(_net_inet_tcp_bb, OID_AUTO, log_global_limit, CTLFLAG_RW,
     &tcp_log_zone, "Maximum number of events maintained for all TCP sessions");
 
 SYSCTL_UMA_CUR(_net_inet_tcp_bb, OID_AUTO, log_global_entries, CTLFLAG_RD,
     &tcp_log_zone, "Current number of events maintained for all TCP sessions");
 
 SYSCTL_UMA_MAX(_net_inet_tcp_bb, OID_AUTO, log_id_limit, CTLFLAG_RW,
     &tcp_log_id_bucket_zone, "Maximum number of log IDs");
 
 SYSCTL_UMA_CUR(_net_inet_tcp_bb, OID_AUTO, log_id_entries, CTLFLAG_RD,
     &tcp_log_id_bucket_zone, "Current number of log IDs");
 
 SYSCTL_UMA_MAX(_net_inet_tcp_bb, OID_AUTO, log_id_tcpcb_limit, CTLFLAG_RW,
     &tcp_log_id_node_zone, "Maximum number of tcpcbs with log IDs");
 
 SYSCTL_UMA_CUR(_net_inet_tcp_bb, OID_AUTO, log_id_tcpcb_entries, CTLFLAG_RD,
     &tcp_log_id_node_zone, "Current number of tcpcbs with log IDs");
 
 SYSCTL_U32(_net_inet_tcp_bb, OID_AUTO, log_version, CTLFLAG_RD, &tcp_log_version,
     0, "Version of log formats exported");
 
 SYSCTL_U32(_net_inet_tcp_bb, OID_AUTO, disable_all, CTLFLAG_RW,
     &tcp_disable_all_bb_logs, 0,
     "Disable all BB logging for all connections");
 
 SYSCTL_ULONG(_net_inet_tcp_bb, OID_AUTO, log_auto_ratio, CTLFLAG_RW,
     &tcp_log_auto_ratio, 0, "Do auto capturing for 1 out of N sessions");
 
 SYSCTL_U32(_net_inet_tcp_bb, OID_AUTO, log_auto_mode, CTLFLAG_RW,
     &tcp_log_auto_mode, 0,
     "Logging mode for auto-selected sessions (default is TCP_LOG_STATE_TAIL)");
 
 SYSCTL_BOOL(_net_inet_tcp_bb, OID_AUTO, log_auto_all, CTLFLAG_RW,
     &tcp_log_auto_all, 0,
     "Auto-select from all sessions (rather than just those with IDs)");
 
 #ifdef TCPLOG_DEBUG_COUNTERS
 /*
  * Optional debug counters for the log queue, each exported read-only
  * under net.inet.tcp.bb. The five "failN" counters are distinguished
  * only by their number, so each description must carry its own number.
  */
 counter_u64_t tcp_log_queued;
 counter_u64_t tcp_log_que_fail1;
 counter_u64_t tcp_log_que_fail2;
 counter_u64_t tcp_log_que_fail3;
 counter_u64_t tcp_log_que_fail4;
 counter_u64_t tcp_log_que_fail5;
 counter_u64_t tcp_log_que_copyout;
 counter_u64_t tcp_log_que_read;
 counter_u64_t tcp_log_que_freed;
 
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, queued, CTLFLAG_RD,
     &tcp_log_queued, "Number of entries queued");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, fail1, CTLFLAG_RD,
     &tcp_log_que_fail1, "Number of entries queued but fail 1");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, fail2, CTLFLAG_RD,
     &tcp_log_que_fail2, "Number of entries queued but fail 2");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, fail3, CTLFLAG_RD,
     &tcp_log_que_fail3, "Number of entries queued but fail 3");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, fail4, CTLFLAG_RD,
     &tcp_log_que_fail4, "Number of entries queued but fail 4");
 /* Description previously duplicated "fail 4". */
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, fail5, CTLFLAG_RD,
     &tcp_log_que_fail5, "Number of entries queued but fail 5");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, copyout, CTLFLAG_RD,
     &tcp_log_que_copyout, "Number of entries copied out");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, read, CTLFLAG_RD,
     &tcp_log_que_read, "Number of entries read from the queue");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, freed, CTLFLAG_RD,
     &tcp_log_que_freed, "Number of entries freed after reading");
 #endif
 
 #ifdef INVARIANTS
 #define	TCPLOG_DEBUG_RINGBUF
 #endif
 /* Number of requests needed to consider a PCB ID "active". */
 #define	ACTIVE_REQUEST_COUNT	10
 
 /* Statistics tracking for "active" PCB IDs. */
 static counter_u64_t tcp_log_pcb_ids_cur;
 static counter_u64_t tcp_log_pcb_ids_tot;
 
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, pcb_ids_cur, CTLFLAG_RD,
     &tcp_log_pcb_ids_cur, "Number of pcb IDs allocated in the system");
 SYSCTL_COUNTER_U64(_net_inet_tcp_bb, OID_AUTO, pcb_ids_tot, CTLFLAG_RD,
     &tcp_log_pcb_ids_tot, "Total number of pcb IDs that have been allocated");
 
 /*
  * One log record as held in memory: queue linkage followed by the log
  * buffer and its verbose companion. The reference count only exists when
  * TCPLOG_DEBUG_RINGBUF is defined, which this file does under INVARIANTS.
  */
 struct tcp_log_mem
 {
 	STAILQ_ENTRY(tcp_log_mem) tlm_queue;	/* Tail-queue linkage */
 	struct tcp_log_buffer	tlm_buf;
 	struct tcp_log_verbose	tlm_v;
 #ifdef TCPLOG_DEBUG_RINGBUF
 	volatile int		tlm_refcnt;	/* Debug-only reference count */
 #endif
 };
 
 /* 60 bytes for the header, + 16 bytes for padding */
 static uint8_t	zerobuf[76];
 
 /*
  * Lock order:
  * 1. TCPID_TREE
  * 2. TCPID_BUCKET
  * 3. INP
  *
  * Rules:
  * A. You need a lock on the Tree to add/remove buckets.
  * B. You need a lock on the bucket to add/remove nodes from the bucket.
  * C. To change information in a node, you need the INP lock if the tln_closed
  *    field is false. Otherwise, you need the bucket lock. (Note that the
  *    tln_closed field can change at any point, so you need to recheck the
  *    entry after acquiring the INP lock.)
  * D. To remove a node from the bucket, you must have that entry locked,
  *    according to the criteria of Rule C. Also, the node must not be on
  *    the expiry queue.
  * E. The exception to C is the expiry queue fields, which are locked by
  *    the TCPLOG_EXPIREQ lock.
  *
  * Buckets have a reference count. Each node is a reference. Further,
  * other callers may add reference counts to keep a bucket from disappearing.
  * You can add a reference as long as you own a lock sufficient to keep the
  * bucket from disappearing. For example, a common use is:
  *   a. Have a locked INP, but need to lock the TCPID_BUCKET.
  *   b. Add a refcount on the bucket. (Safe because the INP lock prevents
  *      the TCPID_BUCKET from going away.)
  *   c. Drop the INP lock.
  *   d. Acquire a lock on the TCPID_BUCKET.
  *   e. Acquire a lock on the INP.
  *   f. Drop the refcount on the bucket.
  *      (At this point, the bucket may disappear.)
  *
  * Expire queue lock:
  * You can acquire this with either the bucket or INP lock. Don't reverse it.
  * When the expire code has committed to freeing a node, it resets the expiry
  * time to SBT_MAX. That is the signal to everyone else that they should
  * leave that node alone.
  */
 static struct rwlock tcp_id_tree_lock;
 #define	TCPID_TREE_WLOCK()		rw_wlock(&tcp_id_tree_lock)
 #define	TCPID_TREE_RLOCK()		rw_rlock(&tcp_id_tree_lock)
 #define	TCPID_TREE_UPGRADE()		rw_try_upgrade(&tcp_id_tree_lock)
 #define	TCPID_TREE_WUNLOCK()		rw_wunlock(&tcp_id_tree_lock)
 #define	TCPID_TREE_RUNLOCK()		rw_runlock(&tcp_id_tree_lock)
 #define	TCPID_TREE_WLOCK_ASSERT()	rw_assert(&tcp_id_tree_lock, RA_WLOCKED)
 #define	TCPID_TREE_RLOCK_ASSERT()	rw_assert(&tcp_id_tree_lock, RA_RLOCKED)
 #define	TCPID_TREE_UNLOCK_ASSERT()	rw_assert(&tcp_id_tree_lock, RA_UNLOCKED)
 
 #define	TCPID_BUCKET_LOCK_INIT(tlb)	mtx_init(&((tlb)->tlb_mtx), "tcp log id bucket", NULL, MTX_DEF)
 #define	TCPID_BUCKET_LOCK_DESTROY(tlb)	mtx_destroy(&((tlb)->tlb_mtx))
 #define	TCPID_BUCKET_LOCK(tlb)		mtx_lock(&((tlb)->tlb_mtx))
 #define	TCPID_BUCKET_UNLOCK(tlb)	mtx_unlock(&((tlb)->tlb_mtx))
 #define	TCPID_BUCKET_LOCK_ASSERT(tlb)	mtx_assert(&((tlb)->tlb_mtx), MA_OWNED)
 #define	TCPID_BUCKET_UNLOCK_ASSERT(tlb) mtx_assert(&((tlb)->tlb_mtx), MA_NOTOWNED)
 
 #define	TCPID_BUCKET_REF(tlb)		refcount_acquire(&((tlb)->tlb_refcnt))
 #define	TCPID_BUCKET_UNREF(tlb)		refcount_release(&((tlb)->tlb_refcnt))
 
 #define	TCPLOG_EXPIREQ_LOCK()		mtx_lock(&tcp_log_expireq_mtx)
 #define	TCPLOG_EXPIREQ_UNLOCK()		mtx_unlock(&tcp_log_expireq_mtx)
 
 SLIST_HEAD(tcp_log_id_head, tcp_log_id_node);
 
 /*
  * A TCP log ID bucket: one entry in the red-black tree keyed by log ID,
  * holding the list of nodes (connections) that share that ID. Buckets are
  * reference counted; see the lock order and reference rules above.
  */
 struct tcp_log_id_bucket
 {
 	/*
 	 * tlb_id must be first. This lets us use strcmp on
 	 * (struct tcp_log_id_bucket *) and (char *) interchangeably.
 	 */
 	char				tlb_id[TCP_LOG_ID_LEN];
 	/* Tag attached to this ID; written under the bucket lock. */
 	char				tlb_tag[TCP_LOG_TAG_LEN];
 	/* Linkage in tcp_log_id_tree. */
 	RB_ENTRY(tcp_log_id_bucket)	tlb_rb;
 	/* Nodes belonging to this bucket. */
 	struct tcp_log_id_head		tlb_head;
 	/* The bucket lock (TCPID_BUCKET_LOCK and friends). */
 	struct mtx			tlb_mtx;
 	/* Reference count (TCPID_BUCKET_REF / TCPID_BUCKET_UNREF). */
 	volatile u_int			tlb_refcnt;
 	/* Request count, bumped atomically by tcp_log_increment_reqcnt(). */
 	volatile u_int			tlb_reqcnt;
 	/* Log limit copied into a TCPCB that joins the bucket, when non-zero. */
 	uint32_t			tlb_loglimit;
 	/* Log state copied into a TCPCB that joins the bucket, when enabled. */
 	int8_t				tlb_logstate;
 };
 
 /*
  * A node ties one connection to its log ID bucket. It is linked on the
  * bucket's list and, separately, may be linked on the expiry queue.
  */
 struct tcp_log_id_node
 {
 	SLIST_ENTRY(tcp_log_id_node) tln_list;	/* Linkage on the bucket's list */
 	STAILQ_ENTRY(tcp_log_id_node) tln_expireq; /* Locked by the expireq lock */
 	sbintime_t		tln_expiretime;	/* Locked by the expireq lock */
 
 	/*
 	 * If INP is NULL, that means the connection has closed. We've
 	 * saved the connection endpoint information and the log entries
 	 * in the tln_ie and tln_entries members. We've also saved a pointer
 	 * to the enclosing bucket here. If INP is not NULL, the information is
 	 * in the PCB and not here.
 	 */
 	struct inpcb		*tln_inp;
 	struct tcpcb		*tln_tp;
 	struct tcp_log_id_bucket *tln_bucket;
 	struct in_endpoints	tln_ie;
 	struct tcp_log_stailq	tln_entries;
 	int			tln_count;
 	/* Selects which lock protects the node; see Rule C above. */
 	volatile int		tln_closed;
 	uint8_t			tln_af;
 };
 
 /*
  * How the caller currently holds tcp_id_tree_lock. Functions that may
  * change the lock state take a pointer to an int holding one of these
  * values and update it as they go.
  */
 enum tree_lock_state {
 	TREE_UNLOCKED = 0,	/* Tree lock not held */
 	TREE_RLOCKED,		/* Tree lock held for reading */
 	TREE_WLOCKED,		/* Tree lock held for writing */
 };
 
 /*
  * Decide whether the session currently being set up is selected for
  * automatic logging. Returns true for one call out of every
  * tcp_log_auto_ratio calls that reach the counter, false otherwise.
  */
 static __inline bool
 tcp_log_selectauto(void)
 {
 
 	/* Auto-capturing is off when no ratio is configured. */
 	if (tcp_log_auto_ratio == 0)
 		return (false);
 
 	/* The global disable switch overrides auto-selection. */
 	if (tcp_disable_all_bb_logs != 0)
 		return (false);
 
 	/*
 	 * Advance the shared counter and select this session when the
 	 * previous counter value is a multiple of the ratio.
 	 */
 	return ((atomic_fetchadd_long(&tcp_log_auto_ratio_cur, 1) %
 	    tcp_log_auto_ratio) == 0);
 }
 
 /*
  * Ordering function for tcp_log_id_tree: compares two buckets by their
  * log ID, looking at no more than TCP_LOG_ID_LEN bytes. Returns the
  * strncmp() result (negative, zero or positive).
  */
 static __inline int
 tcp_log_id_cmp(struct tcp_log_id_bucket *a, struct tcp_log_id_bucket *b)
 {
 	int order;
 
 	KASSERT(a != NULL, ("tcp_log_id_cmp: argument a is unexpectedly NULL"));
 	KASSERT(b != NULL, ("tcp_log_id_cmp: argument b is unexpectedly NULL"));
 
 	order = strncmp(a->tlb_id, b->tlb_id, TCP_LOG_ID_LEN);
 	return order;
 }
 
 RB_GENERATE_STATIC(tcp_log_id_tree, tcp_log_id_bucket, tlb_rb, tcp_log_id_cmp)
 
 /*
  * Under INVARIANTS, assert that tcp_id_tree_lock is held the way the
  * caller's bookkeeping (an enum tree_lock_state value) claims; an
  * unrecognised value panics. Without INVARIANTS the body is empty.
  */
 static __inline void
 tcp_log_id_validate_tree_lock(int tree_locked)
 {
 
 #ifdef INVARIANTS
 	if (tree_locked == TREE_WLOCKED)
 		TCPID_TREE_WLOCK_ASSERT();
 	else if (tree_locked == TREE_RLOCKED)
 		TCPID_TREE_RLOCK_ASSERT();
 	else if (tree_locked == TREE_UNLOCKED)
 		TCPID_TREE_UNLOCK_ASSERT();
 	else
 		kassert_panic("%s:%d: unknown tree lock state", __func__,
 		    __LINE__);
 #endif
 }
 
 /*
  * Take an empty bucket out of the ID tree and free it.
  * The tree must be write-locked and the bucket must have no nodes left.
  * The bucket mutex is destroyed and the "current IDs" counter is
  * decremented before the memory goes back to its zone.
  */
 static __inline void
 tcp_log_remove_bucket(struct tcp_log_id_bucket *tlb)
 {
 	struct tcp_log_id_bucket *removed;
 
 	TCPID_TREE_WLOCK_ASSERT();
 	KASSERT(SLIST_EMPTY(&tlb->tlb_head),
 	    ("%s: Attempt to remove non-empty bucket", __func__));
 
 	removed = RB_REMOVE(tcp_log_id_tree, &tcp_log_id_head, tlb);
 #ifdef INVARIANTS
 	/* The bucket was expected to be in the tree. */
 	if (removed == NULL)
 		kassert_panic("%s:%d: error removing element from tree",
 			    __func__, __LINE__);
 #else
 	(void)removed;
 #endif
 
 	TCPID_BUCKET_LOCK_DESTROY(tlb);
 	counter_u64_add(tcp_log_pcb_ids_cur, (int64_t)-1);
 	uma_zfree(tcp_log_id_bucket_zone, tlb);
 }
 
 /*
  * Drop one reference on a bucket, removing and freeing the bucket when
  * that was the last reference.
  *
  * Call with a referenced and locked bucket.
  * Will return true if the bucket was freed; otherwise, false.
  * When true is returned the bucket (and its mutex) no longer exist, so
  * the caller must not unlock it. When false is returned the bucket is
  * still locked.
  * tlb: The bucket to unreference.
  * tree_locked: A pointer to the state of the tree lock. If the tree lock
  *    state changes, the function will update it.
  * inp: If not NULL and the function needs to drop the inp lock to relock the
  *    tree, it will do so. (The caller must ensure inp will not become invalid,
  *    probably by holding a reference to it.)
  */
 static bool
 tcp_log_unref_bucket(struct tcp_log_id_bucket *tlb, int *tree_locked,
     struct inpcb *inp)
 {
 
 	KASSERT(tlb != NULL, ("%s: called with NULL tlb", __func__));
 	KASSERT(tree_locked != NULL, ("%s: called with NULL tree_locked",
 	    __func__));
 
 	tcp_log_id_validate_tree_lock(*tree_locked);
 
 	/*
 	 * Did we hold the last reference on the tlb? If so, we may need
 	 * to free it. (Note that we can realistically only execute the
 	 * loop twice: once without a write lock and once with a write
 	 * lock.)
 	 */
 	while (TCPID_BUCKET_UNREF(tlb)) {
 		/*
 		 * We need a write lock on the tree to free this.
 		 * If we can upgrade the tree lock, this is "easy". If we
 		 * can't upgrade the tree lock, we need to do this the
 		 * "hard" way: unwind all our locks and relock everything.
 		 * In the meantime, anything could have changed. We even
 		 * need to validate that we still need to free the bucket.
 		 */
 		if (*tree_locked == TREE_RLOCKED && TCPID_TREE_UPGRADE())
 			*tree_locked = TREE_WLOCKED;
 		else if (*tree_locked != TREE_WLOCKED) {
 			/*
 			 * Take back the reference the loop condition just
 			 * released; the "continue" below re-runs that
 			 * release once everything is locked again.
 			 */
 			TCPID_BUCKET_REF(tlb);
 			if (inp != NULL)
 				INP_WUNLOCK(inp);
 			TCPID_BUCKET_UNLOCK(tlb);
 			if (*tree_locked == TREE_RLOCKED)
 				TCPID_TREE_RUNLOCK();
 			/* Relock in the documented order: tree, bucket, INP. */
 			TCPID_TREE_WLOCK();
 			*tree_locked = TREE_WLOCKED;
 			TCPID_BUCKET_LOCK(tlb);
 			if (inp != NULL)
 				INP_WLOCK(inp);
 			continue;
 		}
 
 		/*
 		 * We have an empty bucket and a write lock on the tree.
 		 * Remove the empty bucket.
 		 */
 		tcp_log_remove_bucket(tlb);
 		return (true);
 	}
 	return (false);
 }
 
 /*
  * Unlink a node from its bucket and drop the node's reference on the
  * bucket.
  *
  * Call with a locked bucket. This function will release the lock on the
  * bucket before returning.
  *
  * The caller is responsible for freeing the tp->t_lin/tln node!
  *
  * Note: one of tp or both tlb and tln must be supplied.
  *
  * inp: A pointer to the inp. If the function needs to drop the inp lock to
  *    acquire the tree write lock, it will do so. (The caller must ensure inp
  *    will not become invalid, probably by holding a reference to it.)
  * tp: A pointer to the tcpcb. (optional; if specified, tlb and tln are ignored)
  * tlb: A pointer to the bucket. (optional; ignored if tp is specified)
  * tln: A pointer to the node. (optional; ignored if tp is specified)
  * tree_locked: A pointer to the state of the tree lock. If the tree lock
  *    state changes, the function will update it.
  *
  * Will return true if the INP lock was reacquired; otherwise, false.
  * (The value is derived from whether the tree lock state changed, so it is
  * also true when the tree lock was upgraded in place without dropping the
  * INP lock. Callers should read true as "the INP lock may have been
  * dropped".)
  */
 static bool
 tcp_log_remove_id_node(struct inpcb *inp, struct tcpcb *tp,
     struct tcp_log_id_bucket *tlb, struct tcp_log_id_node *tln,
     int *tree_locked)
 {
 	int orig_tree_locked;
 
 	KASSERT(tp != NULL || (tlb != NULL && tln != NULL),
 	    ("%s: called with tp=%p, tlb=%p, tln=%p", __func__,
 	    tp, tlb, tln));
 	KASSERT(tree_locked != NULL, ("%s: called with NULL tree_locked",
 	    __func__));
 
 	/* When a tcpcb is given, its bucket and node override the arguments. */
 	if (tp != NULL) {
 		tlb = tp->t_lib;
 		tln = tp->t_lin;
 		KASSERT(tlb != NULL, ("%s: unexpectedly NULL tlb", __func__));
 		KASSERT(tln != NULL, ("%s: unexpectedly NULL tln", __func__));
 	}
 
 	tcp_log_id_validate_tree_lock(*tree_locked);
 	TCPID_BUCKET_LOCK_ASSERT(tlb);
 
 	/*
 	 * Remove the node, clear the log bucket and node from the TCPCB, and
 	 * decrement the bucket refcount. In the process, if this is the
 	 * last reference, the bucket will be freed.
 	 */
 	SLIST_REMOVE(&tlb->tlb_head, tln, tcp_log_id_node, tln_list);
 	if (tp != NULL) {
 		tp->t_lib = NULL;
 		tp->t_lin = NULL;
 	}
 	orig_tree_locked = *tree_locked;
 	/* A freed bucket took its lock with it; only unlock a surviving one. */
 	if (!tcp_log_unref_bucket(tlb, tree_locked, inp))
 		TCPID_BUCKET_UNLOCK(tlb);
 	return (*tree_locked != orig_tree_locked);
 }
 
 /*
  * Revalidate a connection after its INP lock has been reacquired.
  *
  * These macros rely on names in the enclosing function: the locals "inp",
  * "tp" and "rv", and a label "done". If INP_DROPPED is set in
  * inp->inp_flags, rv is set to ECONNRESET, the "cleanup" statement is
  * executed and control jumps to "done". Otherwise tp is reloaded from inp.
  */
 #define	RECHECK_INP_CLEAN(cleanup)	do {			\
 	if (inp->inp_flags & INP_DROPPED) {			\
 		rv = ECONNRESET;				\
 		cleanup;					\
 		goto done;					\
 	}							\
 	tp = intotcpcb(inp);					\
 } while (0)
 
 /* Same as RECHECK_INP_CLEAN() with no cleanup statement. */
 #define	RECHECK_INP()	RECHECK_INP_CLEAN(/* noop */)
 
 /*
  * Hook run when a TCPCB is added to a bucket; the INP must be
  * write-locked. When the kernel is built with STATS, per-connection
  * stats are enabled in mode 2 and the connection has no stats blob yet,
  * ask tcp_stats_sample_rollthedice() to decide about sampling, keyed by
  * the log ID. Otherwise this does nothing.
  */
 static void
 tcp_log_grow_tlb(char *tlb_id, struct tcpcb *tp)
 {
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 #ifdef STATS
 	if (V_tcp_perconn_stats_enable != 2)
 		return;
 	if (tp->t_stats != NULL)
 		return;
 	(void)tcp_stats_sample_rollthedice(tp, tlb_id, strlen(tlb_id));
 #endif
 }
 
 /*
  * Record one more request against a bucket by atomically adding one to
  * its request counter. The previous counter value is not needed.
  */
 static void
 tcp_log_increment_reqcnt(struct tcp_log_id_bucket *tlb)
 {
 
 	(void)atomic_fetchadd_int(&tlb->tlb_reqcnt, 1);
 }
 
 /*
  * Apply a log ratio to the log ID bucket of a connection.
  * Called with INPCB locked. Returns with it unlocked.
  *
  * A non-zero ratio is turned into a hash threshold of
  * max(1, UINT32_MAX / ratio); a zero ratio gives a threshold of 0. If the
  * hash of the bucket's ID is above the threshold and logging is currently
  * off for both the connection and the bucket, the bucket is marked
  * TCP_LOG_STATE_RATIO_OFF and the connection's log state is set to
  * TCP_LOG_STATE_OFF.
  *
  * Returns 0 on success, EOPNOTSUPP if the connection has no TCP log ID, or
  * ECONNRESET if INP_DROPPED is found set after the INPCB is relocked.
  */
 int
 tcp_log_apply_ratio(struct tcpcb *tp, int ratio)
 {
 	struct tcp_log_id_bucket *tlb;
 	struct inpcb *inp = tptoinpcb(tp);
 	uint32_t hash, ratio_hash_thresh;
 	int rv, tree_locked;
 
 	rv = 0;
 	tree_locked = TREE_UNLOCKED;
 	tlb = tp->t_lib;
 
 	INP_WLOCK_ASSERT(inp);
 	if (tlb == NULL) {
 		INP_WUNLOCK(inp);
 		return (EOPNOTSUPP);
 	}
 	if (ratio)
 		ratio_hash_thresh = max(1, UINT32_MAX / ratio);
 	else
 		ratio_hash_thresh = 0;
 	/*
 	 * Hold a bucket reference across the INP unlock so the bucket can
 	 * be locked afterwards (bucket lock comes before INP in the lock
 	 * order).
 	 */
 	TCPID_BUCKET_REF(tlb);
 	INP_WUNLOCK(inp);
 	TCPID_BUCKET_LOCK(tlb);
 
 	hash = hash32_buf(tlb->tlb_id, strlen(tlb->tlb_id), 0);
 	/*
 	 * NOTE(review): tp->_t_logstate is read below after the INP lock
 	 * was dropped above -- confirm this unlocked read is intended.
 	 */
 	if (hash > ratio_hash_thresh && tp->_t_logstate == TCP_LOG_STATE_OFF &&
 	    tlb->tlb_logstate == TCP_LOG_STATE_OFF) {
 		/*
 		 * Ratio decision not to log this log ID (and this connection by
 		 * way of association). We only apply a log ratio log disable
 		 * decision if it would not interfere with a log enable decision
 		 * made elsewhere e.g. tcp_log_selectauto() or setsockopt().
 		 */
 		tlb->tlb_logstate = TCP_LOG_STATE_RATIO_OFF;
 		INP_WLOCK(inp);
 		RECHECK_INP();
 		(void)tcp_log_state_change(tp, TCP_LOG_STATE_OFF);
 		/* RECHECK_INP() jumps here, INP still locked, on a dropped INP. */
 done:
 		INP_WUNLOCK(inp);
 	}
 
 	INP_UNLOCK_ASSERT(inp);
 	/* Drop our temporary reference; a freed bucket needs no unlock. */
 	if (!tcp_log_unref_bucket(tlb, &tree_locked, NULL))
 		TCPID_BUCKET_UNLOCK(tlb);
 
 	/* Release the tree lock if dropping the reference acquired it. */
 	if (tree_locked == TREE_WLOCKED) {
 		TCPID_TREE_WLOCK_ASSERT();
 		TCPID_TREE_WUNLOCK();
 	} else if (tree_locked == TREE_RLOCKED) {
 		TCPID_TREE_RLOCK_ASSERT();
 		TCPID_TREE_RUNLOCK();
 	} else
 		TCPID_TREE_UNLOCK_ASSERT();
 
 	return (rv);
 }
 
 /*
  * Attach a tag to the TCP log ID that a connection belongs to.
  * Called with INPCB locked. Returns with it unlocked.
  * The tag is copied into the bucket (truncated to fit TCP_LOG_TAG_LEN)
  * while the bucket lock is held.
  * Returns 0 on success or EOPNOTSUPP if the connection has no TCP log ID.
  */
 int
 tcp_log_set_tag(struct tcpcb *tp, char *tag)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 	struct tcp_log_id_bucket *bucket;
 	int tree_locked = TREE_UNLOCKED;
 
 	INP_WLOCK_ASSERT(inp);
 
 	bucket = tp->t_lib;
 	if (bucket == NULL) {
 		INP_WUNLOCK(inp);
 		return (EOPNOTSUPP);
 	}
 
 	/*
 	 * Pin the bucket with a reference, then swap the INP lock for the
 	 * bucket lock to respect the lock order.
 	 */
 	TCPID_BUCKET_REF(bucket);
 	INP_WUNLOCK(inp);
 	TCPID_BUCKET_LOCK(bucket);
 
 	strlcpy(bucket->tlb_tag, tag, TCP_LOG_TAG_LEN);
 
 	/* Drop the pin; if that freed the bucket there is nothing to unlock. */
 	if (!tcp_log_unref_bucket(bucket, &tree_locked, NULL))
 		TCPID_BUCKET_UNLOCK(bucket);
 
 	/* Release the tree lock if dropping the pin had to take it. */
 	switch (tree_locked) {
 	case TREE_WLOCKED:
 		TCPID_TREE_WLOCK_ASSERT();
 		TCPID_TREE_WUNLOCK();
 		break;
 	case TREE_RLOCKED:
 		TCPID_TREE_RLOCK_ASSERT();
 		TCPID_TREE_RUNLOCK();
 		break;
 	default:
 		TCPID_TREE_UNLOCK_ASSERT();
 		break;
 	}
 
 	return (0);
 }
 
 /*
  * Set the TCP log ID for a TCPCB.
  * Called with INPCB locked. Returns with it unlocked.
  *
  * If the ID is unchanged, only the bucket's request count is bumped and
  * the bucket's log state/limit are cloned into the TCPCB (unless the
  * TCPCB's t_log_state_set is non-zero). Otherwise the TCPCB is removed
  * from its current bucket, if any, and, when 'id' is not empty, added to
  * the bucket for 'id', creating that bucket if necessary. An empty 'id'
  * therefore just clears the TCPCB's log ID.
  *
  * Returns 0 on success, ECONNRESET if INP_DROPPED is found set after the
  * INPCB is relocked, or ENOBUFS if a node or bucket cannot be allocated.
  */
 int
 tcp_log_set_id(struct tcpcb *tp, char *id)
 {
 	struct tcp_log_id_bucket *tlb, *tmp_tlb;
 	struct tcp_log_id_node *tln;
 	struct inpcb *inp = tptoinpcb(tp);
 	int tree_locked, rv;
 	bool bucket_locked, same;
 
 	tlb = NULL;
 	tln = NULL;
 	tree_locked = TREE_UNLOCKED;
 	bucket_locked = false;
 
 restart:
 	INP_WLOCK_ASSERT(inp);
 	/* See if the ID is unchanged. */
 	same = ((tp->t_lib != NULL && !strcmp(tp->t_lib->tlb_id, id)) ||
 		(tp->t_lib == NULL && *id == 0));
 	if (tp->_t_logstate && STAILQ_FIRST(&tp->t_logs) && !same) {
 		/*
 		 * Logging is on, there are log entries queued and the ID
 		 * is about to change, so dump what we can under the old
 		 * ID first.
 		 */
 		switch(tp->_t_logstate) {
 		case TCP_LOG_STATE_HEAD_AUTO:
 			(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from head at id switch",
 						     M_NOWAIT, false);
 			break;
 		case TCP_LOG_STATE_TAIL_AUTO:
 			(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from tail at id switch",
 						     M_NOWAIT, false);
 			break;
 		case TCP_LOG_STATE_CONTINUAL:
 			(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from continual at id switch",
 						     M_NOWAIT, false);
 			break;
 		case TCP_LOG_VIA_BBPOINTS:
 			(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from bbpoints at id switch",
 						     M_NOWAIT, false);
 			break;
 		}
 	}
 	if (same) {
 		if (tp->t_lib != NULL) {
 			tcp_log_increment_reqcnt(tp->t_lib);
 			if ((tp->t_lib->tlb_logstate > TCP_LOG_STATE_OFF) &&
 			    (tp->t_log_state_set == 0)) {
 				/* Clone in any logging */
 
 				tp->_t_logstate = tp->t_lib->tlb_logstate;
 			}
 			if ((tp->t_lib->tlb_loglimit) &&
 			    (tp->t_log_state_set == 0)) {
 				/* We also have a limit set */
 
 				tp->t_loglimit = tp->t_lib->tlb_loglimit;
 			}
 		}
 		rv = 0;
 		goto done;
 	}
 
 	/*
 	 * If the TCPCB had a previous ID, we need to extricate it from
 	 * the previous list.
 	 *
 	 * Drop the TCPCB lock and lock the tree and the bucket.
 	 * Because this is called in the socket context, we (theoretically)
 	 * don't need to worry about the INPCB completely going away
 	 * while we are gone.
 	 */
 	if (tp->t_lib != NULL) {
 		tlb = tp->t_lib;
 		/* Keep the bucket alive while the INP lock is dropped. */
 		TCPID_BUCKET_REF(tlb);
 		INP_WUNLOCK(inp);
 
 		if (tree_locked == TREE_UNLOCKED) {
 			TCPID_TREE_RLOCK();
 			tree_locked = TREE_RLOCKED;
 		}
 		TCPID_BUCKET_LOCK(tlb);
 		bucket_locked = true;
 		INP_WLOCK(inp);
 
 		/*
 		 * Unreference the bucket. If our bucket went away, it is no
 		 * longer locked or valid.
 		 */
 		if (tcp_log_unref_bucket(tlb, &tree_locked, inp)) {
 			bucket_locked = false;
 			tlb = NULL;
 		}
 
 		/* Validate the INP. */
 		RECHECK_INP();
 
 		/*
 		 * Evaluate whether the bucket changed while we were unlocked.
 		 *
 		 * Possible scenarios here:
 		 * 1. Bucket is unchanged and the same one we started with.
 		 * 2. The TCPCB no longer has a bucket and our bucket was
 		 *    freed.
 		 * 3. The TCPCB has a new bucket, whether ours was freed.
 		 * 4. The TCPCB no longer has a bucket and our bucket was
 		 *    not freed.
 		 *
 		 * In cases 2-4, we will start over. In case 1, we will
 		 * proceed here to remove the bucket.
 		 */
 		if (tlb == NULL || tp->t_lib != tlb) {
 			KASSERT(bucket_locked || tlb == NULL,
 			    ("%s: bucket_locked (%d) and tlb (%p) are "
 			    "inconsistent", __func__, bucket_locked, tlb));
 
 			if (bucket_locked) {
 				TCPID_BUCKET_UNLOCK(tlb);
 				bucket_locked = false;
 				tlb = NULL;
 			}
 			goto restart;
 		}
 
 		/*
 		 * Store the (struct tcp_log_id_node) for reuse. Then, remove
 		 * it from the bucket. In the process, we may end up relocking.
 		 * If so, we need to validate that the INP is still valid, and
 		 * the TCPCB entries match what we expect.
 		 *
 		 * We will clear tlb and change the bucket_locked state just
 		 * before calling tcp_log_remove_id_node(), since that function
 		 * will unlock the bucket.
 		 */
 		if (tln != NULL)
 			uma_zfree(tcp_log_id_node_zone, tln);
 		tln = tp->t_lin;
 		tlb = NULL;
 		bucket_locked = false;
 		if (tcp_log_remove_id_node(inp, tp, NULL, NULL, &tree_locked)) {
 			RECHECK_INP();
 
 			/*
 			 * If the TCPCB moved to a new bucket while we had
 			 * dropped the lock, restart.
 			 */
 			if (tp->t_lib != NULL || tp->t_lin != NULL)
 				goto restart;
 		}
 
 		/*
 		 * Yay! We successfully removed the TCPCB from its old
 		 * bucket. Phew!
 		 *
 		 * On to bigger and better things...
 		 */
 	}
 
 	/* At this point, the TCPCB should not be in any bucket. */
 	KASSERT(tp->t_lib == NULL, ("%s: tp->t_lib is not NULL", __func__));
 
 	/*
 	 * If the new ID is not empty, we need to now assign this TCPCB to a
 	 * new bucket.
 	 */
 	if (*id) {
 		/* Get a new tln, if we don't already have one to reuse. */
 		if (tln == NULL) {
 			tln = uma_zalloc(tcp_log_id_node_zone,
 				M_NOWAIT | M_ZERO);
 			if (tln == NULL) {
 				rv = ENOBUFS;
 				goto done;
 			}
 			tln->tln_inp = inp;
 			tln->tln_tp = tp;
 		}
 
 		/*
 		 * Drop the INP lock for a bit. We don't need it, and dropping
 		 * it prevents lock order reversals.
 		 */
 		INP_WUNLOCK(inp);
 
 		/* Make sure we have at least a read lock on the tree. */
 		tcp_log_id_validate_tree_lock(tree_locked);
 		if (tree_locked == TREE_UNLOCKED) {
 			TCPID_TREE_RLOCK();
 			tree_locked = TREE_RLOCKED;
 		}
 
 refind:
 		/*
 		 * Remember that we constructed (struct tcp_log_id_bucket)
 		 * with tlb_id as its first member, so we can safely cast the
 		 * id to it for the purposes of finding.
 		 */
 		KASSERT(tlb == NULL, ("%s:%d tlb unexpectedly non-NULL",
 		    __func__, __LINE__));
 		tmp_tlb = RB_FIND(tcp_log_id_tree, &tcp_log_id_head,
 		    (struct tcp_log_id_bucket *) id);
 
 		/*
 		 * If we didn't find a matching bucket, we need to add a new
 		 * one. This requires a write lock. But, of course, we will
 		 * need to recheck some things when we re-acquire the lock.
 		 */
 		if (tmp_tlb == NULL && tree_locked != TREE_WLOCKED) {
 			tree_locked = TREE_WLOCKED;
 			if (!TCPID_TREE_UPGRADE()) {
 				TCPID_TREE_RUNLOCK();
 				TCPID_TREE_WLOCK();
 
 				/*
 				 * The tree may have changed while we were
 				 * unlocked.
 				 */
 				goto refind;
 			}
 		}
 
 		/* If we need to add a new bucket, do it now. */
 		if (tmp_tlb == NULL) {
 			/* Allocate new bucket. */
 			tlb = uma_zalloc(tcp_log_id_bucket_zone, M_NOWAIT);
 			if (tlb == NULL) {
 				rv = ENOBUFS;
 				/* The INP lock is not held on this path. */
 				goto done_noinp;
 			}
 			counter_u64_add(tcp_log_pcb_ids_cur, 1);
 			counter_u64_add(tcp_log_pcb_ids_tot, 1);
 
 			if ((tcp_log_auto_all == false) &&
 			    tcp_log_auto_mode &&
 			    tcp_log_selectauto()) {
 				/* Save off the log state */
 				tlb->tlb_logstate = tcp_log_auto_mode;
 			} else
 				tlb->tlb_logstate = TCP_LOG_STATE_OFF;
 			tlb->tlb_loglimit = 0;
 			tlb->tlb_tag[0] = '\0'; /* Default to an empty tag. */
 
 			/*
 			 * Copy the ID to the bucket.
 			 * NB: Don't use strlcpy() unless you are sure
 			 * we've always validated NULL termination.
 			 *
 			 * TODO: When I'm done writing this, see if we
 			 * have correctly validated NULL termination and
 			 * can use strlcpy(). :-)
 			 */
 			strncpy(tlb->tlb_id, id, TCP_LOG_ID_LEN - 1);
 			tlb->tlb_id[TCP_LOG_ID_LEN - 1] = '\0';
 
 			/*
 			 * Take the refcount for the first node and go ahead
 			 * and lock this. Note that we zero the tlb_mtx
 			 * structure, since 0xdeadc0de flips the right bits
 			 * for the code to think that this mutex has already
 			 * been initialized. :-(
 			 */
 			SLIST_INIT(&tlb->tlb_head);
 			refcount_init(&tlb->tlb_refcnt, 1);
 			tlb->tlb_reqcnt = 1;
 			memset(&tlb->tlb_mtx, 0, sizeof(struct mtx));
 			TCPID_BUCKET_LOCK_INIT(tlb);
 			TCPID_BUCKET_LOCK(tlb);
 			bucket_locked = true;
 
 			/*
 			 * Undo the allocation of a bucket that never made it
 			 * into the tree: destroy its lock, free it, back out
 			 * both ID counters and reset the local bookkeeping.
 			 */
 #define	FREE_NEW_TLB()	do {				\
 	TCPID_BUCKET_LOCK_DESTROY(tlb);			\
 	uma_zfree(tcp_log_id_bucket_zone, tlb);		\
 	counter_u64_add(tcp_log_pcb_ids_cur, (int64_t)-1);	\
 	counter_u64_add(tcp_log_pcb_ids_tot, (int64_t)-1);	\
 	bucket_locked = false;				\
 	tlb = NULL;					\
 } while (0)
 			/*
 			 * Relock the INP and make sure we are still
 			 * unassigned.
 			 */
 			INP_WLOCK(inp);
 			RECHECK_INP_CLEAN(FREE_NEW_TLB());
 			if (tp->t_lib != NULL) {
 				FREE_NEW_TLB();
 				goto restart;
 			}
 
 			/* Add the new bucket to the tree. */
 			tmp_tlb = RB_INSERT(tcp_log_id_tree, &tcp_log_id_head,
 			    tlb);
 			KASSERT(tmp_tlb == NULL,
 			    ("%s: Unexpected conflicting bucket (%p) while "
 			    "adding new bucket (%p)", __func__, tmp_tlb, tlb));
 
 			/*
 			 * If we found a conflicting bucket, free the new
 			 * one we made and fall through to use the existing
 			 * bucket.
 			 */
 			if (tmp_tlb != NULL) {
 				FREE_NEW_TLB();
 				INP_WUNLOCK(inp);
 			}
 #undef	FREE_NEW_TLB
 		}
 
 		/* If we found an existing bucket, use it. */
 		if (tmp_tlb != NULL) {
 			tlb = tmp_tlb;
 			TCPID_BUCKET_LOCK(tlb);
 			bucket_locked = true;
 
 			/*
 			 * Relock the INP and make sure we are still
 			 * unassigned.
 			 */
 			INP_UNLOCK_ASSERT(inp);
 			INP_WLOCK(inp);
 			RECHECK_INP();
 			if (tp->t_lib != NULL) {
 				TCPID_BUCKET_UNLOCK(tlb);
 				bucket_locked = false;
 				tlb = NULL;
 				goto restart;
 			}
 
 			/* Take a reference on the bucket. */
 			TCPID_BUCKET_REF(tlb);
 
 			/* Record the request. */
 			tcp_log_increment_reqcnt(tlb);
 		}
 
 		tcp_log_grow_tlb(tlb->tlb_id, tp);
 
 		/* Add the new node to the list. */
 		SLIST_INSERT_HEAD(&tlb->tlb_head, tln, tln_list);
 		tp->t_lib = tlb;
 		tp->t_lin = tln;
 		if (tp->t_lib->tlb_logstate > TCP_LOG_STATE_OFF) {
 			/* Clone in any logging */
 
 			tp->_t_logstate = tp->t_lib->tlb_logstate;
 		}
 		if (tp->t_lib->tlb_loglimit) {
 			/* The loglimit too */
 
 			tp->t_loglimit = tp->t_lib->tlb_loglimit;
 		}
 		/* The node now belongs to the bucket; don't free it below. */
 		tln = NULL;
 	}
 
 	rv = 0;
 
 done:
 	/* Unlock things, as needed, and return. */
 	INP_WUNLOCK(inp);
 done_noinp:
 	INP_UNLOCK_ASSERT(inp);
 	if (bucket_locked) {
 		TCPID_BUCKET_LOCK_ASSERT(tlb);
 		TCPID_BUCKET_UNLOCK(tlb);
 	} else if (tlb != NULL)
 		TCPID_BUCKET_UNLOCK_ASSERT(tlb);
 	if (tree_locked == TREE_WLOCKED) {
 		TCPID_TREE_WLOCK_ASSERT();
 		TCPID_TREE_WUNLOCK();
 	} else if (tree_locked == TREE_RLOCKED) {
 		TCPID_TREE_RLOCK_ASSERT();
 		TCPID_TREE_RUNLOCK();
 	} else
 		TCPID_TREE_UNLOCK_ASSERT();
 	/* Free a node that was detached or allocated but never (re)inserted. */
 	if (tln != NULL)
 		uma_zfree(tcp_log_id_node_zone, tln);
 	return (rv);
 }
 
 /*
  * Copy the log ID associated with a TCPCB into 'buf'.
  *
  * The caller must hold the INPCB lock and must supply a buffer of at least
  * TCP_LOG_ID_LEN bytes. When the TCPCB has no ID bucket, 'buf' receives the
  * empty string.
  *
  * Returns the length strlcpy() reports for the ID, or 0 when there is none.
  */
 size_t
 tcp_log_get_id(struct tcpcb *tp, char *buf)
 {
 	size_t copied;
 
 	INP_LOCK_ASSERT(tptoinpcb(tp));
 
 	/* No bucket means no ID: hand back an empty string. */
 	if (tp->t_lib == NULL) {
 		buf[0] = '\0';
 		return (0);
 	}
 
 	copied = strlcpy(buf, tp->t_lib->tlb_id, TCP_LOG_ID_LEN);
 	KASSERT(copied < TCP_LOG_ID_LEN,
 	    ("%s:%d: tp->t_lib->tlb_id too long (%zu)",
 	    __func__, __LINE__, copied));
 	return (copied);
 }
 
 /*
  * Copy the tag of the TCPCB's log ID bucket into 'buf'.
  *
  * Entered with the INPCB write-locked; the lock is always dropped before
  * returning. 'buf' must have room for at least TCP_LOG_TAG_LEN bytes.
  *
  * Returns the length strlcpy() reports for the tag, or 0 (with an empty
  * string stored in 'buf') when the TCPCB has no bucket.
  */
 size_t
 tcp_log_get_tag(struct tcpcb *tp, char *buf)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 	struct tcp_log_id_bucket *bucket;
 	size_t copied;
 	int tree_locked = TREE_UNLOCKED;
 
 	INP_WLOCK_ASSERT(inp);
 
 	bucket = tp->t_lib;
 	if (bucket == NULL) {
 		/* Nothing to report; just release the INP. */
 		INP_WUNLOCK(inp);
 		buf[0] = '\0';
 		return (0);
 	}
 
 	/*
 	 * Take a bucket reference before letting go of the INP lock, then
 	 * read the tag under the bucket lock.
 	 */
 	TCPID_BUCKET_REF(bucket);
 	INP_WUNLOCK(inp);
 	TCPID_BUCKET_LOCK(bucket);
 	copied = strlcpy(buf, bucket->tlb_tag, TCP_LOG_TAG_LEN);
 	KASSERT(copied < TCP_LOG_TAG_LEN,
 	    ("%s:%d: tp->t_lib->tlb_tag too long (%zu)",
 	    __func__, __LINE__, copied));
 
 	/*
 	 * Drop our reference. We only unlock the bucket ourselves when
 	 * tcp_log_unref_bucket() returns false.
 	 * NOTE(review): presumably a true return means the bucket was
 	 * freed -- confirm against tcp_log_unref_bucket().
 	 */
 	if (!tcp_log_unref_bucket(bucket, &tree_locked, NULL))
 		TCPID_BUCKET_UNLOCK(bucket);
 
 	/* Release whatever tree lock state the unref reported back. */
 	if (tree_locked == TREE_WLOCKED) {
 		TCPID_TREE_WLOCK_ASSERT();
 		TCPID_TREE_WUNLOCK();
 	} else if (tree_locked == TREE_RLOCKED) {
 		TCPID_TREE_RLOCK_ASSERT();
 		TCPID_TREE_RUNLOCK();
 	} else
 		TCPID_TREE_UNLOCK_ASSERT();
 
 	return (copied);
 }
 
 /*
  * Report how many connections share the TCPCB's log ID.
  * The value is the tlb_refcnt of the TCPCB's ID bucket, or 0 when the TCPCB
  * has no bucket.
  * Called with the INPCB write-locked.
  */
 u_int
 tcp_log_get_id_cnt(struct tcpcb *tp)
 {
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	if (tp->t_lib == NULL)
 		return (0);
 	return (tp->t_lib->tlb_refcnt);
 }
 
 #ifdef TCPLOG_DEBUG_RINGBUF
 /*
  * Debug-only bookkeeping for log entries. Each entry carries a counter
  * that is bumped when the entry is added to a list and dropped when it is
  * removed; any other transition (double-add, double-remove/double-free)
  * panics with the caller's function name and line.
  */
 static inline void
 _tcp_log_entry_refcnt_add(struct tcp_log_mem *log_entry, const char *func,
     int line)
 {
 	int before;
 
 	/* The value fetched is compared against the expected prior count. */
 	before = atomic_fetchadd_int(&log_entry->tlm_refcnt, 1);
 	if (before == 0)
 		return;
 	panic("%s:%d: log_entry(%p)->tlm_refcnt is %d (expected 0)",
 	    func, line, log_entry, before);
 }
 #define	tcp_log_entry_refcnt_add(l)	\
     _tcp_log_entry_refcnt_add((l), __func__, __LINE__)
 
 static inline void
 _tcp_log_entry_refcnt_rem(struct tcp_log_mem *log_entry, const char *func,
     int line)
 {
 	int before;
 
 	/* An entry being removed must have been counted exactly once. */
 	before = atomic_fetchadd_int(&log_entry->tlm_refcnt, -1);
 	if (before == 1)
 		return;
 	panic("%s:%d: log_entry(%p)->tlm_refcnt is %d (expected 1)",
 	    func, line, log_entry, before);
 }
 #define	tcp_log_entry_refcnt_rem(l)	\
     _tcp_log_entry_refcnt_rem((l), __func__, __LINE__)
 
 #else /* !TCPLOG_DEBUG_RINGBUF */
 
 /* Without ring-buffer debugging the bookkeeping compiles away. */
 #define	tcp_log_entry_refcnt_add(l)
 #define	tcp_log_entry_refcnt_rem(l)
 
 #endif
 
 /*
  * Return a log entry to its zone. When built with INVARIANTS, also
  * decrement the caller's entry count and verify it did not go negative;
  * otherwise 'count' is not touched.
  */
 static inline void
 tcp_log_free_log_common(struct tcp_log_mem *log_entry, int *count __unused)
 {
 
 	uma_zfree(tcp_log_zone, log_entry);
 #ifdef INVARIANTS
 	*count -= 1;
 	KASSERT(*count >= 0,
 	    ("%s: count unexpectedly negative", __func__));
 #endif
 }
 
 /*
  * Empty a list of log entries, releasing each one in turn. 'count' is
  * passed through to tcp_log_free_log_common() for every entry freed.
  */
 static void
 tcp_log_free_entries(struct tcp_log_stailq *head, int *count)
 {
 	struct tcp_log_mem *entry;
 
 	/* Keep popping the first element until the list is empty. */
 	for (;;) {
 		entry = STAILQ_FIRST(head);
 		if (entry == NULL)
 			break;
 		STAILQ_REMOVE_HEAD(head, tlm_queue);
 		tcp_log_entry_refcnt_rem(entry);
 		tcp_log_free_log_common(entry, count);
 	}
 }
 
 /*
  * Finish removing a log entry that has already been unlinked from the
  * TCPCB's list: account for it in tp->t_lognum and free its memory.
  */
 static inline void
 tcp_log_remove_log_cleanup(struct tcpcb *tp, struct tcp_log_mem *log_entry)
 {
 	tp->t_lognum -= 1;
 	uma_zfree(tcp_log_zone, log_entry);
 	KASSERT(tp->t_lognum >= 0,
 	    ("%s: tp->t_lognum unexpectedly negative", __func__));
 }
 
 /*
  * Unlink and free the first log entry of a TCPCB. 'log_entry' must be the
  * current head of tp->t_logs (asserted under INVARIANTS).
  */
 static inline void
 tcp_log_remove_log_head(struct tcpcb *tp, struct tcp_log_mem *log_entry)
 {
 	struct tcp_log_stailq *logq = &tp->t_logs;
 
 	KASSERT(log_entry == STAILQ_FIRST(logq),
 	    ("%s: attempt to remove non-HEAD log entry", __func__));
 	STAILQ_REMOVE_HEAD(logq, tlm_queue);
 	tcp_log_entry_refcnt_rem(log_entry);
 	tcp_log_remove_log_cleanup(tp, log_entry);
 }
 
 #ifdef TCPLOG_DEBUG_RINGBUF
 /*
  * Zone init hook: start the entry's reference count at zero. The count is
  * meant to persist across allocations, so it is set here rather than in
  * the constructor.
  */
 static int
 tcp_log_zone_init(void *mem, int size, int flags __unused)
 {
 	struct tcp_log_mem *tlm = mem;
 
 	KASSERT(size >= sizeof(struct tcp_log_mem),
 	    ("%s: unexpectedly short (%d) allocation", __func__, size));
 	tlm->tlm_refcnt = 0;
 	return (0);
 }
 
 /*
  * Zone constructor: an entry being handed out must not be counted as
  * belonging to any list. Panic otherwise.
  */
 static int
 tcp_log_zone_ctor(void *mem, int size, void *args __unused, int flags __unused)
 {
 	struct tcp_log_mem *tlm = mem;
 
 	KASSERT(size >= sizeof(struct tcp_log_mem),
 	    ("%s: unexpectedly short (%d) allocation", __func__, size));
 	if (tlm->tlm_refcnt == 0)
 		return (0);
 	panic("%s:%d: tlm(%p)->tlm_refcnt is %d (expected 0)",
 	    __func__, __LINE__, tlm, tlm->tlm_refcnt);
 	return (0);
 }
 
 /*
  * Zone destructor: an entry being freed must already have been taken off
  * its list. Panic otherwise.
  */
 static void
 tcp_log_zone_dtor(void *mem, int size, void *args __unused)
 {
 	struct tcp_log_mem *tlm = mem;
 
 	KASSERT(size >= sizeof(struct tcp_log_mem),
 	    ("%s: unexpectedly short (%d) allocation", __func__, size));
 	if (tlm->tlm_refcnt == 0)
 		return;
 	panic("%s:%d: tlm(%p)->tlm_refcnt is %d (expected 0)",
 	    __func__, __LINE__, tlm, tlm->tlm_refcnt);
 }
 #endif /* TCPLOG_DEBUG_RINGBUF */
 
 /*
  * Do global initialization.
  *
  * Creates the UMA zones for log entries, ID buckets and ID nodes, allocates
  * the statistics counters, and initializes the ID tree lock, the expiry
  * queue mutex and the expiry callout.
  */
 void
 tcp_log_init(void)
 {
 
 	/*
 	 * The log entry zone only gets ctor/dtor/init hooks when ring-buffer
 	 * debugging is compiled in.
 	 */
 	tcp_log_zone = uma_zcreate("tcp_log", sizeof(struct tcp_log_mem),
 #ifdef TCPLOG_DEBUG_RINGBUF
 	    tcp_log_zone_ctor, tcp_log_zone_dtor, tcp_log_zone_init,
 #else
 	    NULL, NULL, NULL,
 #endif
 	    NULL, UMA_ALIGN_PTR, 0);
 	/* Apply the default global limit to the log entry zone. */
 	(void)uma_zone_set_max(tcp_log_zone, TCP_LOG_BUF_DEFAULT_GLOBAL_LIMIT);
 	tcp_log_id_bucket_zone = uma_zcreate("tcp_log_id_bucket",
 	    sizeof(struct tcp_log_id_bucket), NULL, NULL, NULL, NULL,
 	    UMA_ALIGN_PTR, 0);
 	tcp_log_id_node_zone = uma_zcreate("tcp_log_id_node",
 	    sizeof(struct tcp_log_id_node), NULL, NULL, NULL, NULL,
 	    UMA_ALIGN_PTR, 0);
 #ifdef TCPLOG_DEBUG_COUNTERS
 	/* Debug-only queue statistics. */
 	tcp_log_queued = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_fail1 = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_fail2 = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_fail3 = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_fail4 = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_fail5 = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_copyout = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_read = counter_u64_alloc(M_WAITOK);
 	tcp_log_que_freed = counter_u64_alloc(M_WAITOK);
 #endif
 	tcp_log_pcb_ids_cur = counter_u64_alloc(M_WAITOK);
 	tcp_log_pcb_ids_tot = counter_u64_alloc(M_WAITOK);
 
 	/* Locks and the callout used by the ID tree and the expiry queue. */
 	rw_init_flags(&tcp_id_tree_lock, "TCP ID tree", RW_NEW);
 	mtx_init(&tcp_log_expireq_mtx, "TCP log expireq", NULL, MTX_DEF);
 	callout_init(&tcp_log_expireq_callout, 1);
 }
 
 /*
  * Do per-TCPCB initialization: start with an empty log list and the
  * default per-session limit, then decide whether this session is picked
  * for automatic capture.
  */
 void
 tcp_log_tcpcbinit(struct tcpcb *tp)
 {
 
 	/* A new TCPCB should start out zero-initialized. */
 	STAILQ_INIT(&tp->t_logs);
 	tp->t_loglimit = tcp_log_session_limit;
 
 	/*
 	 * Auto-capture applies only when it is enabled for all sessions, a
 	 * mode is configured, and the selector picks this session.
 	 */
 	if (tcp_log_auto_all != true || !tcp_log_auto_mode)
 		return;
 	if (!tcp_log_selectauto())
 		return;
 
 	tp->_t_logstate = tcp_log_auto_mode;
 	tp->t_flags2 |= TF2_LOG_AUTO;
 }
 
 /*
  * Expiry callout handler: remove and free ID nodes whose expiry time has
  * been reached (looking up to one second ahead), then reschedule the
  * callout if nodes remain on the expiry queue.
  *
  * The expiry queue lock is dropped while each node is torn down and
  * re-taken before the next queue inspection.
  */
 static void
 tcp_log_expire(void *unused __unused)
 {
 	struct tcp_log_id_bucket *tlb;
 	struct tcp_log_id_node *tln;
 	sbintime_t expiry_limit;
 	int tree_locked;
 
 	TCPLOG_EXPIREQ_LOCK();
 	if (callout_pending(&tcp_log_expireq_callout)) {
 		/* Callout was reset. */
 		TCPLOG_EXPIREQ_UNLOCK();
 		return;
 	}
 
 	/*
 	 * Process entries until we reach one that expires too far in the
 	 * future. Look one second in the future.
 	 */
 	expiry_limit = getsbinuptime() + SBT_1S;
 	tree_locked = TREE_UNLOCKED;
 
 	while ((tln = STAILQ_FIRST(&tcp_log_expireq_head)) != NULL &&
 	    tln->tln_expiretime <= expiry_limit) {
 		if (!callout_active(&tcp_log_expireq_callout)) {
 			/*
 			 * Callout was stopped. I guess we should
 			 * just quit at this point.
 			 */
 			TCPLOG_EXPIREQ_UNLOCK();
 			return;
 		}
 
 		/*
 		 * Remove the node from the head of the list and unlock
 		 * the list. Change the expiry time to SBT_MAX as a signal
 		 * to other threads that we now own this.
 		 */
 		STAILQ_REMOVE_HEAD(&tcp_log_expireq_head, tln_expireq);
 		tln->tln_expiretime = SBT_MAX;
 		TCPLOG_EXPIREQ_UNLOCK();
 
 		/*
 		 * Remove the node from the bucket. A true return means we
 		 * are left holding a tree lock (read or write, as recorded
 		 * in tree_locked) that has to be dropped here.
 		 */
 		tlb = tln->tln_bucket;
 		TCPID_BUCKET_LOCK(tlb);
 		if (tcp_log_remove_id_node(NULL, NULL, tlb, tln, &tree_locked)) {
 			tcp_log_id_validate_tree_lock(tree_locked);
 			if (tree_locked == TREE_WLOCKED)
 				TCPID_TREE_WUNLOCK();
 			else
 				TCPID_TREE_RUNLOCK();
 			tree_locked = TREE_UNLOCKED;
 		}
 
 		/*
 		 * Drop the INP reference. Unlock the INP ourselves only
 		 * when in_pcbrele_wlocked() returns false.
 		 */
 		INP_WLOCK(tln->tln_inp);
 		if (!in_pcbrele_wlocked(tln->tln_inp))
 			INP_WUNLOCK(tln->tln_inp);
 
 		/* Free the log records. */
 		tcp_log_free_entries(&tln->tln_entries, &tln->tln_count);
 
 		/* Free the node. */
 		uma_zfree(tcp_log_id_node_zone, tln);
 
 		/* Relock the expiry queue. */
 		TCPLOG_EXPIREQ_LOCK();
 	}
 
 	/*
 	 * We've expired all the entries we can. Do we need to reschedule
 	 * ourselves?
 	 */
 	callout_deactivate(&tcp_log_expireq_callout);
 	if (tln != NULL) {
 		/*
 		 * Get max(now + TCP_LOG_EXPIRE_INTVL, tln->tln_expiretime) and
 		 * set the next callout to that. (This helps ensure we generally
 		 * run the callout no more often than desired.)
 		 */
 		expiry_limit = getsbinuptime() + TCP_LOG_EXPIRE_INTVL;
 		if (expiry_limit < tln->tln_expiretime)
 			expiry_limit = tln->tln_expiretime;
 		callout_reset_sbt(&tcp_log_expireq_callout, expiry_limit,
 		    SBT_1S, tcp_log_expire, NULL, C_ABSOLUTE);
 	}
 
 	/* We're done. */
 	TCPLOG_EXPIREQ_UNLOCK();
 	return;
 }
 
 /*
  * Hand the TCPCB's log data over to an ID node. The node receives the
  * connection's endpoint information, address family, log entry list,
  * entry count and bucket pointer; the TCPCB is left with an empty list
  * and a zero count. Other TCPCB fields (e.g. t_lin, t_lib) are not
  * modified.
  *
  * NOTE: Must hold a write lock on the INP.
  */
 static void
 tcp_log_move_tp_to_node(struct tcpcb *tp, struct tcp_log_id_node *tln)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 
 	INP_WLOCK_ASSERT(inp);
 
 	/* Identify the connection the logs came from. */
 	tln->tln_ie = inp->inp_inc.inc_ie;
 	tln->tln_af = (inp->inp_inc.inc_flags & INC_ISIPV6) ?
 	    AF_INET6 : AF_INET;
 
 	/* Transfer the log list and its bookkeeping. */
 	tln->tln_bucket = tp->t_lib;
 	tln->tln_count = tp->t_lognum;
 	tln->tln_entries = tp->t_logs;
 
 	/* The TCPCB no longer owns any entries. */
 	tp->t_lognum = 0;
 	STAILQ_INIT(&tp->t_logs);
 }
 
 /*
  * Do per-TCPCB cleanup.
  *
  * If logging is active, a final TCP_LOG_CONNEND event is recorded
  * (preceded by accounting events when TCP_ACCOUNTING is compiled in and
  * enabled for the connection), and the auto-dump states attempt a dump.
  * Remaining log entries are then either handed to the TCPCB's ID node,
  * which is queued for expiry, or freed. Logging is switched off on return.
  *
  * Called with the INPCB write-locked.
  */
 void
 tcp_log_tcpcbfini(struct tcpcb *tp)
 {
 	struct tcp_log_id_node *tln, *tln_first;
 	struct tcp_log_mem *log_entry;
 	sbintime_t callouttime;
 
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	if (tp->_t_logstate) {
 		union tcp_log_stackspecific log;
 		struct timeval tv;
 #ifdef TCP_ACCOUNTING
 		struct tcp_log_buffer *lgb;
 		int i;
 #endif
 
 		/*
 		 * Always start from a zeroed record. tcp_log_event() copies
 		 * the whole union into the log entry, so anything left
 		 * unset here would otherwise carry stale stack contents.
 		 */
 		memset(&log, 0, sizeof(log));
 #ifdef TCP_ACCOUNTING
 		if (tp->t_flags2 & TF2_TCP_ACCOUNTING) {
 			/*
 			 * The accounting events below pass &tv as their
 			 * timestamp, so make sure it holds a real time
 			 * before its first use.
 			 */
 			(void)tcp_get_usecs(&tv);
 			for (i = 0; i < TCP_NUM_CNT_COUNTERS; i++) {
 				log.u_raw.u64_flex[i] = tp->tcp_cnt_counters[i];
 			}
 			lgb = tcp_log_event(tp, NULL,
 				  NULL,
 				  NULL,
 				  TCP_LOG_ACCOUNTING, 0,
 				  0, &log, false, NULL, NULL, 0, &tv);
 			if (lgb != NULL) {
 				lgb->tlb_flex1 = TCP_NUM_CNT_COUNTERS;
 				lgb->tlb_flex2 = 1;
 			} else
 				goto skip_out;
 			for (i = 0; i<TCP_NUM_CNT_COUNTERS; i++) {
 				log.u_raw.u64_flex[i] = tp->tcp_proc_time[i];
 			}
 			lgb = tcp_log_event(tp, NULL,
 				 NULL,
 				 NULL,
 				 TCP_LOG_ACCOUNTING, 0,
 				 0, &log, false, NULL, NULL, 0, &tv);
 			if (lgb != NULL) {
 				lgb->tlb_flex1 = TCP_NUM_CNT_COUNTERS;
 				lgb->tlb_flex2 = 2;
 			}
 		}
 skip_out:
 #endif
 		log.u_bbr.timeStamp = tcp_get_usecs(&tv);
 		log.u_bbr.cur_del_rate = tp->t_end_info;
 		(void)tcp_log_event(tp, NULL,
 	                 NULL,
 			 NULL,
 		         TCP_LOG_CONNEND, 0,
 		         0, &log, false, NULL, NULL, 0,  &tv);
 	}
 	/*
 	 * If we were gathering packets to be automatically dumped, try to do
 	 * it now. If this succeeds, the log information in the TCPCB will be
 	 * cleared. Otherwise, we'll handle the log information as we do
 	 * for other states.
 	 */
 	switch(tp->_t_logstate) {
 	case TCP_LOG_STATE_HEAD_AUTO:
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from head",
 		    M_NOWAIT, false);
 		break;
 	case TCP_LOG_STATE_TAIL_AUTO:
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from tail",
 		    M_NOWAIT, false);
 		break;
 	case TCP_LOG_VIA_BBPOINTS:
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from bbpoints",
 		    M_NOWAIT, false);
 		break;
 	case TCP_LOG_STATE_CONTINUAL:
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from continual",
 		    M_NOWAIT, false);
 		break;
 	}
 
 	/*
 	 * There are two ways we could keep logs: per-socket or per-ID. If
 	 * we are tracking logs with an ID, then the logs survive the
 	 * destruction of the TCPCB.
 	 *
 	 * If the TCPCB is associated with an ID node, move the logs from the
 	 * TCPCB to the ID node. In theory, this is safe, for reasons which I
 	 * will now explain for my own benefit when I next need to figure out
 	 * this code. :-)
 	 *
 	 * We own the INP lock. Therefore, no one else can change the contents
 	 * of this node (Rule C). Further, no one can remove this node from
 	 * the bucket while we hold the lock (Rule D). Basically, no one can
 	 * mess with this node. That leaves two states in which we could be:
 	 *
 	 * 1. Another thread is currently waiting to acquire the INP lock, with
 	 *    plans to do something with this node. When we drop the INP lock,
 	 *    they will have a chance to do that. They will recheck the
 	 *    tln_closed field (see note to Rule C) and then acquire the
 	 *    bucket lock before proceeding further.
 	 *
 	 * 2. Another thread will try to acquire a lock at some point in the
 	 *    future. If they try to acquire a lock before we set the
 	 *    tln_closed field, they will follow state #1. If they try to
 	 *    acquire a lock after we set the tln_closed field, they will be
 	 *    able to make changes to the node, at will, following Rule C.
 	 *
 	 * Therefore, we currently own this node and can make any changes
 	 * we want. But, as soon as we set the tln_closed field to true, we
 	 * have effectively dropped our lock on the node. (For this reason, we
 	 * also need to make sure our writes are ordered correctly. An atomic
 	 * operation with "release" semantics should be sufficient.)
 	 */
 
 	if (tp->t_lin != NULL) {
 		struct inpcb *inp = tptoinpcb(tp);
 
 		/* Copy the relevant information to the log entry. */
 		tln = tp->t_lin;
 		KASSERT(tln->tln_inp == inp,
 		    ("%s: Mismatched inp (tln->tln_inp=%p, tp inpcb=%p)",
 		    __func__, tln->tln_inp, inp));
 		tcp_log_move_tp_to_node(tp, tln);
 
 		/* Clear information from the PCB. */
 		tp->t_lin = NULL;
 		tp->t_lib = NULL;
 
 		/*
 		 * Take a reference on the INP. This ensures that the INP
 		 * remains valid while the node is on the expiry queue. This
 		 * ensures the INP is valid for other threads that may be
 		 * racing to lock this node when we move it to the expire
 		 * queue.
 		 */
 		in_pcbref(inp);
 
 		/*
 		 * Store the entry on the expiry list. The exact behavior
 		 * depends on whether we have entries to keep. If so, we
 		 * put the entry at the tail of the list and expire in
 		 * TCP_LOG_EXPIRE_TIME. Otherwise, we expire "now" and put
 		 * the entry at the head of the list. (Handling the cleanup
 		 * via the expiry timer lets us avoid locking messy-ness here.)
 		 */
 		tln->tln_expiretime = getsbinuptime();
 		TCPLOG_EXPIREQ_LOCK();
 		if (tln->tln_count) {
 			tln->tln_expiretime += TCP_LOG_EXPIRE_TIME;
 			if (STAILQ_EMPTY(&tcp_log_expireq_head) &&
 			    !callout_active(&tcp_log_expireq_callout)) {
 				/*
 				 * We are adding the first entry and a callout
 				 * is not currently scheduled; therefore, we
 				 * need to schedule one.
 				 */
 				callout_reset_sbt(&tcp_log_expireq_callout,
 				    tln->tln_expiretime, SBT_1S, tcp_log_expire,
 				    NULL, C_ABSOLUTE);
 			}
 			STAILQ_INSERT_TAIL(&tcp_log_expireq_head, tln,
 			    tln_expireq);
 		} else {
 			callouttime = tln->tln_expiretime +
 			    TCP_LOG_EXPIRE_INTVL;
 			tln_first = STAILQ_FIRST(&tcp_log_expireq_head);
 
 			if ((tln_first == NULL ||
 			    callouttime < tln_first->tln_expiretime) &&
 			    (callout_pending(&tcp_log_expireq_callout) ||
 			    !callout_active(&tcp_log_expireq_callout))) {
 				/*
 				 * The list is empty, or we want to run the
 				 * expire code before the first entry's timer
 				 * fires. Also, we are in a case where a callout
 				 * is not actively running. We want to reset
 				 * the callout to occur sooner.
 				 */
 				callout_reset_sbt(&tcp_log_expireq_callout,
 				    callouttime, SBT_1S, tcp_log_expire, NULL,
 				    C_ABSOLUTE);
 			}
 
 			/*
 			 * Insert to the head, or just after the head, as
 			 * appropriate. (This might result in small
 			 * mis-orderings as a bunch of "expire now" entries
 			 * gather at the start of the list, but that should
 			 * not produce big problems, since the expire timer
 			 * will walk through all of them.)
 			 */
 			if (tln_first == NULL ||
 			    tln->tln_expiretime < tln_first->tln_expiretime)
 				STAILQ_INSERT_HEAD(&tcp_log_expireq_head, tln,
 				    tln_expireq);
 			else
 				STAILQ_INSERT_AFTER(&tcp_log_expireq_head,
 				    tln_first, tln, tln_expireq);
 		}
 		TCPLOG_EXPIREQ_UNLOCK();
 
 		/*
 		 * We are done messing with the tln. After this point, we
 		 * can't touch it. (Note that the "release" semantics should
 		 * be included with the TCPLOG_EXPIREQ_UNLOCK() call above.
 		 * Therefore, they should be unnecessary here. However, it
 		 * seems like a good idea to include them anyway, since we
 		 * really are releasing a lock here.)
 		 */
 		atomic_store_rel_int(&tln->tln_closed, 1);
 	} else {
 		/* Remove log entries. */
 		while ((log_entry = STAILQ_FIRST(&tp->t_logs)) != NULL)
 			tcp_log_remove_log_head(tp, log_entry);
 		KASSERT(tp->t_lognum == 0,
 		    ("%s: After freeing entries, tp->t_lognum=%d (expected 0)",
 			__func__, tp->t_lognum));
 	}
 
 	/*
 	 * Change the log state to off (just in case anything tries to sneak
 	 * in a last-minute log).
 	 */
 	tp->_t_logstate = TCP_LOG_STATE_OFF;
 }
 
 /*
  * Throw away every log entry held by the TCPCB and turn logging off.
  * Does nothing at all (the log state included) when the TCPCB holds no
  * entries. Called with the INPCB write-locked.
  */
 static void
 tcp_log_purge_tp_logbuf(struct tcpcb *tp)
 {
 	struct tcp_log_mem *entry;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	if (tp->t_lognum == 0)
 		return;
 
 	/* Pop entries off the front until the list is empty. */
 	for (entry = STAILQ_FIRST(&tp->t_logs); entry != NULL;
 	    entry = STAILQ_FIRST(&tp->t_logs))
 		tcp_log_remove_log_head(tp, entry);
 	KASSERT(tp->t_lognum == 0,
 		("%s: After freeing entries, tp->t_lognum=%d (expected 0)",
 		 __func__, tp->t_lognum));
 	tp->_t_logstate = TCP_LOG_STATE_OFF;
 }
 
 /*
  * This logs an event for a TCP socket. Normally, this is called via
  * TCP_LOG_EVENT or TCP_LOG_EVENT_VERBOSE. See the documentation for
  * TCP_LOG_EVENT().
  *
  * A log entry is allocated while the TCPCB is below its entry limit;
  * otherwise, depending on the log state, the buffers are dumped, logging
  * is switched off, or the oldest entry is reused. The entry is filled
  * from 'tp' and the optional arguments and appended to tp->t_logs.
  *
  * 'func' and 'line' must be given together (verbose logging) or not at all.
  * 'itv', when non-NULL, supplies the timestamp; otherwise the current
  * uptime is used.
  *
  * Called with the INPCB write-locked. Returns the filled-in log buffer, or
  * NULL when no entry was recorded.
  */
 
 struct tcp_log_buffer *
 tcp_log_event(struct tcpcb *tp, struct tcphdr *th, struct sockbuf *rxbuf,
     struct sockbuf *txbuf, uint8_t eventid, int errornum, uint32_t len,
     union tcp_log_stackspecific *stackinfo, int th_hostorder,
     const char *output_caller, const char *func, int line, const struct timeval *itv)
 {
 	struct tcp_log_mem *log_entry;
 	struct tcp_log_buffer *log_buf;
 	int attempt_count = 0;
 	struct tcp_log_verbose *log_verbose;
 	uint32_t logsn;
 
 	KASSERT((func == NULL && line == 0) || (func != NULL && line > 0),
 	    ("%s called with inconsistent func (%p) and line (%d) arguments",
 		__func__, func, line));
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	if (tcp_disable_all_bb_logs) {
 		/*
 		 * The global logging shutdown switch has been thrown.
 		 * Call the purge function, which frees the logs and
 		 * turns off logging.
 		 */
 		tcp_log_purge_tp_logbuf(tp);
 		return (NULL);
 	}
 	KASSERT(tp->_t_logstate == TCP_LOG_STATE_HEAD ||
 	    tp->_t_logstate == TCP_LOG_STATE_TAIL ||
 	    tp->_t_logstate == TCP_LOG_STATE_CONTINUAL ||
 	    tp->_t_logstate == TCP_LOG_STATE_HEAD_AUTO ||
 	    tp->_t_logstate == TCP_LOG_VIA_BBPOINTS ||
 	    tp->_t_logstate == TCP_LOG_STATE_TAIL_AUTO,
 	    ("%s called with unexpected tp->_t_logstate (%d)", __func__,
 		tp->_t_logstate));
 
 	/*
 	 * Get the serial number. We do this early so it will
 	 * increment even if we end up skipping the log entry for some
 	 * reason.
 	 */
 	logsn = tp->t_logsn++;
 
 	/*
 	 * Can we get a new log entry? If so, increment the lognum counter
 	 * here.
 	 */
 retry:
 	if (tp->t_lognum < tp->t_loglimit) {
 		if ((log_entry = uma_zalloc(tcp_log_zone, M_NOWAIT)) != NULL)
 			tp->t_lognum++;
 	} else
 		log_entry = NULL;
 
 	/* Do we need to try to reuse? */
 	if (log_entry == NULL) {
 		/*
 		 * Sacrifice auto-logged sessions without a log ID if
 		 * tcp_log_auto_all is false. (If they don't have a log
 		 * ID by now, it is probable that either they won't get one
 		 * or we are resource-constrained.)
 		 */
 		if (tp->t_lib == NULL && (tp->t_flags2 & TF2_LOG_AUTO) &&
 		    !tcp_log_auto_all) {
 			if (tcp_log_state_change(tp, TCP_LOG_STATE_CLEAR)) {
 #ifdef INVARIANTS
 				panic("%s:%d: tcp_log_state_change() failed "
 				    "to set tp %p to TCP_LOG_STATE_CLEAR",
 				    __func__, __LINE__, tp);
 #endif
 				tp->_t_logstate = TCP_LOG_STATE_OFF;
 			}
 			return (NULL);
 		}
 		/*
 		 * If we are in TCP_LOG_STATE_HEAD_AUTO state, try to dump
 		 * the buffers. If successful, deactivate tracing. Otherwise,
 		 * leave it active so we will retry.
 		 */
 		if (tp->_t_logstate == TCP_LOG_STATE_HEAD_AUTO &&
 		    !tcp_log_dump_tp_logbuf(tp, "auto-dumped from head",
 		    M_NOWAIT, false)) {
 			tp->_t_logstate = TCP_LOG_STATE_OFF;
 			return(NULL);
 		} else if ((tp->_t_logstate == TCP_LOG_STATE_CONTINUAL) &&
 		    !tcp_log_dump_tp_logbuf(tp, "auto-dumped from continual",
 		    M_NOWAIT, false)) {
 			/* The dump worked; try once more for a fresh entry. */
 			if (attempt_count == 0) {
 				attempt_count++;
 				goto retry;
 			}
 #ifdef TCPLOG_DEBUG_COUNTERS
 			counter_u64_add(tcp_log_que_fail4, 1);
 #endif
 			return(NULL);
 
 		} else if ((tp->_t_logstate == TCP_LOG_VIA_BBPOINTS) &&
 		    !tcp_log_dump_tp_logbuf(tp, "auto-dumped from bbpoints",
 		    M_NOWAIT, false)) {
 			/* The dump worked; try once more for a fresh entry. */
 			if (attempt_count == 0) {
 				attempt_count++;
 				goto retry;
 			}
 #ifdef TCPLOG_DEBUG_COUNTERS
 			counter_u64_add(tcp_log_que_fail4, 1);
 #endif
 			return(NULL);
 		} else if (tp->_t_logstate == TCP_LOG_STATE_HEAD_AUTO)
 			return(NULL);
 
 		/* If in HEAD state, just deactivate the tracing and return. */
 		if (tp->_t_logstate == TCP_LOG_STATE_HEAD) {
 			tp->_t_logstate = TCP_LOG_STATE_OFF;
 			return(NULL);
 		}
 		/*
 		 * Get a buffer to reuse. If that fails, just give up.
 		 * (We can't log anything without a buffer in which to
 		 * put it.)
 		 *
 		 * Note that we don't change the t_lognum counter
 		 * here. Because we are re-using the buffer, the total
 		 * number won't change.
 		 */
 		if ((log_entry = STAILQ_FIRST(&tp->t_logs)) == NULL)
 			return(NULL);
 		STAILQ_REMOVE_HEAD(&tp->t_logs, tlm_queue);
 		tcp_log_entry_refcnt_rem(log_entry);
 	}
 
 	KASSERT(log_entry != NULL,
 	    ("%s: log_entry unexpectedly NULL", __func__));
 
 	/* Extract the log buffer and verbose buffer pointers. */
 	log_buf = &log_entry->tlm_buf;
 	log_verbose = &log_entry->tlm_v;
 
 	/* Basic entries. */
 	if (itv == NULL)
 		microuptime(&log_buf->tlb_tv);
 	else
 		memcpy(&log_buf->tlb_tv, itv, sizeof(struct timeval));
 	log_buf->tlb_ticks = ticks;
 	log_buf->tlb_sn = logsn;
 	log_buf->tlb_stackid = tp->t_fb->tfb_id;
 	log_buf->tlb_eventid = eventid;
 	log_buf->tlb_eventflags = 0;
 	log_buf->tlb_errno = errornum;
 
 	/*
 	 * Socket buffers. The entry is not zeroed on allocation and may be
 	 * a reused one, so every field (including the spare) is written in
 	 * both branches to keep stale bytes out of the record.
 	 */
 	if (rxbuf != NULL) {
 		log_buf->tlb_eventflags |= TLB_FLAG_RXBUF;
 		log_buf->tlb_rxbuf.tls_sb_acc = rxbuf->sb_acc;
 		log_buf->tlb_rxbuf.tls_sb_ccc = rxbuf->sb_ccc;
 		log_buf->tlb_rxbuf.tls_sb_spare = 0;
 	} else {
 		log_buf->tlb_rxbuf.tls_sb_acc = 0;
 		log_buf->tlb_rxbuf.tls_sb_ccc = 0;
 		log_buf->tlb_rxbuf.tls_sb_spare = 0;
 	}
 	if (txbuf != NULL) {
 		log_buf->tlb_eventflags |= TLB_FLAG_TXBUF;
 		log_buf->tlb_txbuf.tls_sb_acc = txbuf->sb_acc;
 		log_buf->tlb_txbuf.tls_sb_ccc = txbuf->sb_ccc;
 		log_buf->tlb_txbuf.tls_sb_spare = 0;
 	} else {
 		log_buf->tlb_txbuf.tls_sb_acc = 0;
 		log_buf->tlb_txbuf.tls_sb_ccc = 0;
 		log_buf->tlb_txbuf.tls_sb_spare = 0;
 	}
 	/* Copy values from tp to the log entry. */
 #define	COPY_STAT(f)	log_buf->tlb_ ## f = tp->f
 #define	COPY_STAT_T(f)	log_buf->tlb_ ## f = tp->t_ ## f
 	COPY_STAT_T(state);
 	COPY_STAT_T(starttime);
 	COPY_STAT(iss);
 	COPY_STAT_T(flags);
 	COPY_STAT(snd_una);
 	COPY_STAT(snd_max);
 	COPY_STAT(snd_cwnd);
 	COPY_STAT(snd_nxt);
 	COPY_STAT(snd_recover);
 	COPY_STAT(snd_wnd);
 	COPY_STAT(snd_ssthresh);
 	COPY_STAT_T(srtt);
 	COPY_STAT_T(rttvar);
 	COPY_STAT(rcv_up);
 	COPY_STAT(rcv_adv);
 	COPY_STAT(rcv_nxt);
 	COPY_STAT(rcv_wnd);
 	COPY_STAT_T(dupacks);
 	COPY_STAT_T(segqlen);
 	COPY_STAT(snd_numholes);
 	COPY_STAT(snd_scale);
 	COPY_STAT(rcv_scale);
 	COPY_STAT_T(flags2);
 	COPY_STAT_T(fbyte_in);
 	COPY_STAT_T(fbyte_out);
 #undef COPY_STAT
 #undef COPY_STAT_T
 	/*
 	 * Copy stack-specific info.
 	 * NOTE(review): when stackinfo is NULL the previous contents of
 	 * tlb_stackinfo stay in place (only the flag says they are not
 	 * valid) -- confirm whether that area should be zeroed too.
 	 */
 	if (stackinfo != NULL) {
 		memcpy(&log_buf->tlb_stackinfo, stackinfo,
 		    sizeof(log_buf->tlb_stackinfo));
 		log_buf->tlb_eventflags |= TLB_FLAG_STACKINFO;
 	}
 
 	/* The packet */
 	log_buf->tlb_len = len;
 	if (th) {
 		int optlen;
 
 		log_buf->tlb_eventflags |= TLB_FLAG_HDR;
 		log_buf->tlb_th = *th;
 		if (th_hostorder)
 			tcp_fields_to_net(&log_buf->tlb_th);
 		/* th_off counts 32-bit words; anything past the header is options. */
 		optlen = (th->th_off << 2) - sizeof (struct tcphdr);
 		if (optlen > 0)
 			memcpy(log_buf->tlb_opts, th + 1, optlen);
 	} else {
 		memset(&log_buf->tlb_th, 0, sizeof(*th));
 	}
 
 	/* Verbose information */
 	if (func != NULL) {
 		log_buf->tlb_eventflags |= TLB_FLAG_VERBOSE;
 		if (output_caller != NULL)
 			strlcpy(log_verbose->tlv_snd_frm, output_caller,
 			    TCP_FUNC_LEN);
 		else
 			*log_verbose->tlv_snd_frm = 0;
 		strlcpy(log_verbose->tlv_trace_func, func, TCP_FUNC_LEN);
 		log_verbose->tlv_trace_line = line;
 	}
 
 	/* Insert the new log at the tail. */
 	STAILQ_INSERT_TAIL(&tp->t_logs, log_entry, tlm_queue);
 	tcp_log_entry_refcnt_add(log_entry);
 	return (log_buf);
 }
 
 /*
  * Change the logging state for a TCPCB. Returns 0 on success or an
  * error code on failure:
  *   EINVAL    - 'state' is not a recognized logging state (the TCPCB is
  *               left untouched).
  *   ECANCELED - the TCPCB's ID bucket is in TCP_LOG_STATE_RATIO_OFF, so
  *               logging was turned off instead of being enabled.
  *   EBUSY     - logging is globally disabled; the state was forced off.
  *
  * Any recognized state also clears the TF2_LOG_AUTO flag.
  * Called with the INPCB write-locked.
  */
 int
 tcp_log_state_change(struct tcpcb *tp, int state)
 {
 	struct tcp_log_mem *log_entry;
 	int rv;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	rv = 0;
 	switch(state) {
 	case TCP_LOG_STATE_CLEAR:
 		/* CLEAR frees all queued entries, then behaves like OFF. */
 		while ((log_entry = STAILQ_FIRST(&tp->t_logs)) != NULL)
 			tcp_log_remove_log_head(tp, log_entry);
-		/* Fall through */
+		/* FALLTHROUGH */
 
 	case TCP_LOG_STATE_OFF:
 		tp->_t_logstate = TCP_LOG_STATE_OFF;
 		break;
 
 	case TCP_LOG_STATE_TAIL:
 	case TCP_LOG_STATE_HEAD:
 	case TCP_LOG_STATE_CONTINUAL:
 	case TCP_LOG_VIA_BBPOINTS:
 	case TCP_LOG_STATE_HEAD_AUTO:
 	case TCP_LOG_STATE_TAIL_AUTO:
 		/*
 		 * When the RATIO_OFF state is set for the bucket, the log ID
 		 * this tp is associated with has been probabilistically opted
 		 * out of logging per tcp_log_apply_ratio().
 		 */
 		if (tp->t_lib == NULL ||
 		    tp->t_lib->tlb_logstate != TCP_LOG_STATE_RATIO_OFF) {
 			tp->_t_logstate = state;
 		} else {
 			rv = ECANCELED;
 			tp->_t_logstate = TCP_LOG_STATE_OFF;
 		}
 		break;
 
 	default:
 		return (EINVAL);
 	}
 	/* The global kill switch overrides whatever was selected above. */
 	if (tcp_disable_all_bb_logs) {
 		/* We are prohibited from doing any logs */
 		tp->_t_logstate = TCP_LOG_STATE_OFF;
 		rv = EBUSY;
 	}
 	tp->t_flags2 &= ~(TF2_LOG_AUTO);
 
 	return (rv);
 }
 
 /*
  * If tcp_drain() is called, flush half the log entries.
  *
  * In TCP_LOG_STATE_HEAD the newest half (the tail of the list) is freed;
  * in the auto-dump, bbpoints and continual states the buffer is dumped
  * instead; in every other state the oldest half (the head of the list) is
  * freed. Nothing happens when fewer than two entries are held.
  *
  * Called with the INPCB write-locked.
  */
 void
 tcp_log_drain(struct tcpcb *tp)
 {
 	struct tcp_log_mem *log_entry, *next;
 	int target, skip;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	if ((target = tp->t_lognum / 2) == 0)
 		return;
 
 	/*
 	 * XXXRRS: At this point I don't think it is wise that
 	 * we do this. All that a drain call means is that
 	 * we are hitting one of the system mbuf limits. BB
 	 * logging, or freeing of them, will not create any
 	 * more mbufs and really has nothing to do with
 	 * the system running out of mbufs. For now I
 	 * am changing this to free any "AUTO" by dumping
 	 * them out. But this should either be changed
 	 * so that it gets called when we hit the BB limit
 	 * or it should just not get called (one of the two)
 	 * since I don't think the mbuf <-> BB log cleanup
 	 * is the right thing to do here.
 	 */
 	/*
 	 * If we are logging the "head" packets, we want to discard
 	 * from the tail of the queue. Otherwise, we want to discard
 	 * from the head.
 	 */
 	if (tp->_t_logstate == TCP_LOG_STATE_HEAD) {
 		/* Walk to the last entry we intend to keep. */
 		skip = tp->t_lognum - target;
 		STAILQ_FOREACH(log_entry, &tp->t_logs, tlm_queue)
 			if (!--skip)
 				break;
 		KASSERT(log_entry != NULL,
 		    ("%s: skipped through all entries!", __func__));
 		if (log_entry == NULL)
 			return;
 		/* Free everything queued after it. */
 		while ((next = STAILQ_NEXT(log_entry, tlm_queue)) != NULL) {
 			STAILQ_REMOVE_AFTER(&tp->t_logs, log_entry, tlm_queue);
 			tcp_log_entry_refcnt_rem(next);
 			tcp_log_remove_log_cleanup(tp, next);
 #ifdef INVARIANTS
 			target--;
 #endif
 		}
 		KASSERT(target == 0,
 		    ("%s: After removing from tail, target was %d", __func__,
 			target));
 	} else if (tp->_t_logstate == TCP_LOG_STATE_HEAD_AUTO) {
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from head at drain",
 		    M_NOWAIT, false);
 	} else if (tp->_t_logstate == TCP_LOG_STATE_TAIL_AUTO) {
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from tail at drain",
 		    M_NOWAIT, false);
 	} else if (tp->_t_logstate == TCP_LOG_VIA_BBPOINTS) {
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from bbpoints",
 		    M_NOWAIT, false);
 	} else if (tp->_t_logstate == TCP_LOG_STATE_CONTINUAL) {
 		(void)tcp_log_dump_tp_logbuf(tp, "auto-dumped from continual",
 		    M_NOWAIT, false);
 	} else {
 		/* Free 'target' entries from the front of the list. */
 		while ((log_entry = STAILQ_FIRST(&tp->t_logs)) != NULL &&
 		    target--)
 			tcp_log_remove_log_head(tp, log_entry);
 		KASSERT(target <= 0,
 		    ("%s: After removing from head, target was %d", __func__,
 			target));
 		/* Report the value actually being checked (t_lognum). */
 		KASSERT(tp->t_lognum > 0,
 		    ("%s: After removing from head, tp->t_lognum was %d",
 			__func__, tp->t_lognum));
 		KASSERT(log_entry != NULL,
 		    ("%s: After removing from head, the tailq was empty",
 			__func__));
 	}
 }
 
 /*
  * Copy 'len' bytes from 'src' to the sockopt destination 'dst'.
  * When the sockopt has an associated thread (sopt_td != NULL) the copy is
  * done with copyout() and its result is returned; otherwise a plain
  * bcopy() is used and 0 is returned.
  */
 static inline int
 tcp_log_copyout(struct sockopt *sopt, void *src, void *dst, size_t len)
 {
 
 	if (sopt->sopt_td == NULL) {
 		bcopy(src, dst, len);
 		return (0);
 	}
 	return (copyout(src, dst, len));
 }
 
 /*
  * Copy the log entries on 'log_tailqp' to the output buffer described by
  * 'sopt' (starting at sopt->sopt_val), one after another.
  *
  * Each output record is a struct tcp_log_buffer; when the entry carries no
  * TCP header the tail of the record (from tlb_th on) is written as zeros.
  * Entries flagged verbose are followed by a struct tcp_log_verbose.
  *
  * 'count' is the number of entries the caller expects on the list (checked
  * under INVARIANTS). On return '*end' points just past the last record
  * written, or at the record being written when a copy failed.
  *
  * Returns 0 on success or the error from the failing copy.
  */
 static int
 tcp_log_logs_to_buf(struct sockopt *sopt, struct tcp_log_stailq *log_tailqp,
     struct tcp_log_buffer **end, int count)
 {
 	struct tcp_log_buffer *out_entry;
 	struct tcp_log_mem *log_entry;
 	size_t entrysize;
 	int error;
 #ifdef INVARIANTS
 	int orig_count = count;
 #endif
 
 	/* Copy the data out. */
 	error = 0;
 	out_entry = (struct tcp_log_buffer *) sopt->sopt_val;
 	STAILQ_FOREACH(log_entry, log_tailqp, tlm_queue) {
 		count--;
 		KASSERT(count >= 0,
 		    ("%s:%d: Exceeded expected count (%d) processing list %p",
 		    __func__, __LINE__, orig_count, log_tailqp));
 
 #ifdef TCPLOG_DEBUG_COUNTERS
 		counter_u64_add(tcp_log_que_copyout, 1);
 #endif
 
 		/*
 		 * Skip copying out the header if it isn't present.
 		 * Instead, copy out zeros (to ensure we don't leak info).
 		 * TODO: Make sure we truly do zero everything we don't
 		 * explicitly set.
 		 */
 		if (log_entry->tlm_buf.tlb_eventflags & TLB_FLAG_HDR)
 			entrysize = sizeof(struct tcp_log_buffer);
 		else
 			entrysize = offsetof(struct tcp_log_buffer, tlb_th);
 		error = tcp_log_copyout(sopt, &log_entry->tlm_buf, out_entry,
 		    entrysize);
 		if (error)
 			break;
 		if (!(log_entry->tlm_buf.tlb_eventflags & TLB_FLAG_HDR)) {
 			error = tcp_log_copyout(sopt, zerobuf,
 			    ((uint8_t *)out_entry) + entrysize,
 			    sizeof(struct tcp_log_buffer) - entrysize);
 			/*
 			 * Stop on failure here as well; otherwise the
 			 * error would be overwritten by the next copy
 			 * and the caller would see success.
 			 */
 			if (error)
 				break;
 		}
 
 		/*
 		 * Copy out the verbose bit, if needed. Either way,
 		 * increment the output pointer the correct amount.
 		 */
 		if (log_entry->tlm_buf.tlb_eventflags & TLB_FLAG_VERBOSE) {
 			error = tcp_log_copyout(sopt, &log_entry->tlm_v,
 			    out_entry->tlb_verbose,
 			    sizeof(struct tcp_log_verbose));
 			if (error)
 				break;
 			out_entry = (struct tcp_log_buffer *)
 			    (((uint8_t *) (out_entry + 1)) +
 			    sizeof(struct tcp_log_verbose));
 		} else
 			out_entry++;
 	}
 	*end = out_entry;
 	KASSERT(error || count == 0,
 	    ("%s:%d: Less than expected count (%d) processing list %p"
 	    " (%d remain)", __func__, __LINE__, orig_count,
 	    log_tailqp, count));
 
 	return (error);
 }
 
 /*
  * Copy out the buffer. Note that we do incremental copying, so
  * sooptcopyout() won't work. However, the goal is to produce the same
  * end result as if we copied in the entire user buffer, updated it,
  * and then used sooptcopyout() to copy it out.
  *
  * As many leading log entries as fit in sopt->sopt_valsize are detached
  * from tp->t_logs, copied out with the PCB lock dropped, and then freed.
  * On success sopt->sopt_valsize is updated to the number of bytes written.
  * If sopt->sopt_val is NULL nothing is copied or removed; sopt_valsize is
  * instead lowered to an approximate size needed for the entries.
  *
  * If the copyout fails, the detached entries are put back at the head of
  * tp->t_logs, unless the connection was dropped in the meantime, in which
  * case they are freed.
  *
  * NOTE: This should be called with a write lock on the PCB; however,
  * the function will drop it after it extracts the data from the TCPCB.
  *
  * Returns 0 on success or the error from the copyout.
  */
 int
 tcp_log_getlogbuf(struct sockopt *sopt, struct tcpcb *tp)
 {
 	struct tcp_log_stailq log_tailq;
 	struct tcp_log_mem *log_entry, *log_next;
 	struct tcp_log_buffer *out_entry;
 	struct inpcb *inp = tptoinpcb(tp);
 	size_t outsize, entrysize;
 	int error, outnum;
 
 	INP_WLOCK_ASSERT(inp);
 
 	/*
 	 * Determine which log entries will fit in the buffer. As an
 	 * optimization, skip this if all the entries will clearly fit
 	 * in the buffer. (However, get an exact size if we are using
 	 * INVARIANTS.)
 	 */
 #ifndef INVARIANTS
 	if (sopt->sopt_valsize / (sizeof(struct tcp_log_buffer) +
 	    sizeof(struct tcp_log_verbose)) >= tp->t_lognum) {
 		log_entry = STAILQ_LAST(&tp->t_logs, tcp_log_mem, tlm_queue);
 		log_next = NULL;
 		outsize = 0;
 		outnum = tp->t_lognum;
 	} else {
 #endif
 		outsize = outnum = 0;
 		log_entry = NULL;
 		STAILQ_FOREACH(log_next, &tp->t_logs, tlm_queue) {
 			entrysize = sizeof(struct tcp_log_buffer);
 			if (log_next->tlm_buf.tlb_eventflags &
 			    TLB_FLAG_VERBOSE)
 				entrysize += sizeof(struct tcp_log_verbose);
 			if ((sopt->sopt_valsize - outsize) < entrysize)
 				break;
 			outsize += entrysize;
 			outnum++;
 			log_entry = log_next;
 		}
 		KASSERT(outsize <= sopt->sopt_valsize,
 		    ("%s: calculated output size (%zu) greater than available"
 			"space (%zu)", __func__, outsize, sopt->sopt_valsize));
 #ifndef INVARIANTS
 	}
 #endif
 
 	/*
 	 * Copy traditional sooptcopyout() behavior: if sopt->sopt_val
 	 * is NULL, silently skip the copy. However, in this case, we
 	 * will leave the list alone and return. Functionally, this
 	 * gives userspace a way to poll for an approximate buffer
 	 * size they will need to get the log entries.
 	 */
 	if (sopt->sopt_val == NULL) {
 		INP_WUNLOCK(inp);
 		if (outsize == 0) {
 			outsize = outnum * (sizeof(struct tcp_log_buffer) +
 			    sizeof(struct tcp_log_verbose));
 		}
 		if (sopt->sopt_valsize > outsize)
 			sopt->sopt_valsize = outsize;
 		return (0);
 	}
 
 	/*
 	 * Break apart the list. We'll save the ones we want to copy
 	 * out locally and remove them from the TCPCB list. We can
 	 * then drop the INPCB lock while we do the copyout.
 	 *
 	 * There are roughly three cases:
 	 * 1. There was nothing to copy out. That's easy: drop the
 	 * lock and return.
 	 * 2. We are copying out the entire list. Again, that's easy:
 	 * move the whole list.
 	 * 3. We are copying out a partial list. That's harder. We
 	 * need to update the list book-keeping entries.
 	 */
 	if (log_entry != NULL && log_next == NULL) {
 		/* Move entire list. */
 		KASSERT(outnum == tp->t_lognum,
 		    ("%s:%d: outnum (%d) should match tp->t_lognum (%d)",
 			__func__, __LINE__, outnum, tp->t_lognum));
 		log_tailq = tp->t_logs;
 		tp->t_lognum = 0;
 		STAILQ_INIT(&tp->t_logs);
 	} else if (log_entry != NULL) {
 		/* Move partial list. */
 		KASSERT(outnum < tp->t_lognum,
 		    ("%s:%d: outnum (%d) not less than tp->t_lognum (%d)",
 			__func__, __LINE__, outnum, tp->t_lognum));
 		STAILQ_FIRST(&log_tailq) = STAILQ_FIRST(&tp->t_logs);
 		STAILQ_FIRST(&tp->t_logs) = STAILQ_NEXT(log_entry, tlm_queue);
 		KASSERT(STAILQ_NEXT(log_entry, tlm_queue) != NULL,
 		    ("%s:%d: tp->t_logs is unexpectedly shorter than expected"
 		    "(tp: %p, log_tailq: %p, outnum: %d, tp->t_lognum: %d)",
 		    __func__, __LINE__, tp, &log_tailq, outnum, tp->t_lognum));
 		STAILQ_NEXT(log_entry, tlm_queue) = NULL;
 		log_tailq.stqh_last = &STAILQ_NEXT(log_entry, tlm_queue);
 		tp->t_lognum -= outnum;
 	} else
 		STAILQ_INIT(&log_tailq);
 
 	/* Drop the PCB lock. */
 	INP_WUNLOCK(inp);
 
 	/* Copy the data out. */
 	error = tcp_log_logs_to_buf(sopt, &log_tailq, &out_entry, outnum);
 
 	if (error) {
 		/* Restore list */
 		INP_WLOCK(inp);
 		if ((inp->inp_flags & INP_DROPPED) == 0) {
 			tp = intotcpcb(inp);
 
 			/* Merge the two lists. */
 			STAILQ_CONCAT(&log_tailq, &tp->t_logs);
 			tp->t_logs = log_tailq;
 			tp->t_lognum += outnum;
 			INP_WUNLOCK(inp);
 		} else {
 			INP_WUNLOCK(inp);
 
 			/*
 			 * The connection was dropped while we were copying,
 			 * so the entries are not put back on the TCPCB.
 			 * We are their only owner now; free them here so
 			 * they are not leaked.
 			 */
 			STAILQ_FOREACH_SAFE(log_entry, &log_tailq, tlm_queue,
 			    log_next) {
 				tcp_log_entry_refcnt_rem(log_entry);
 				uma_zfree(tcp_log_zone, log_entry);
 			}
 		}
 	} else {
 		/* Sanity check entries */
 		KASSERT(((caddr_t)out_entry - (caddr_t)sopt->sopt_val)  ==
 		    outsize, ("%s: Actual output size (%zu) != "
 			"calculated output size (%zu)", __func__,
 			(size_t)((caddr_t)out_entry - (caddr_t)sopt->sopt_val),
 			outsize));
 
 		/* Free the entries we just copied out. */
 		STAILQ_FOREACH_SAFE(log_entry, &log_tailq, tlm_queue, log_next) {
 			tcp_log_entry_refcnt_rem(log_entry);
 			uma_zfree(tcp_log_zone, log_entry);
 		}
 	}
 
 	/* Report how many bytes were actually written. */
 	sopt->sopt_valsize = (size_t)((caddr_t)out_entry -
 	    (caddr_t)sopt->sopt_val);
 	return (error);
 }
 
 /*
  * Release a queue entry: free its log entries, then its buffer (if one
  * is attached), then the entry itself. A NULL param trips the assertion
  * and is otherwise ignored.
  */
 static void
 tcp_log_free_queue(struct tcp_log_dev_queue *param)
 {
 	struct tcp_log_dev_log_queue *ldq;
 
 	KASSERT(param != NULL, ("%s: called with NULL param", __func__));
 	if (param != NULL) {
 		ldq = (struct tcp_log_dev_log_queue *)param;
 
 		/* Log entries first. */
 		tcp_log_free_entries(&ldq->tldl_entries, &ldq->tldl_count);
 
 		/* Then the buffer, when one has been allocated. */
 		if (ldq->tldl_common.tldq_buf != NULL)
 			free(ldq->tldl_common.tldq_buf, M_TCPLOGDEV);
 
 		/* Finally the queue entry itself. */
 		free(ldq, M_TCPLOGDEV);
 	}
 }
 
 static struct tcp_log_common_header *
 tcp_log_expandlogbuf(struct tcp_log_dev_queue *param)
 {
 	struct tcp_log_dev_log_queue *entry;
 	struct tcp_log_header *hdr;
 	uint8_t *end;
 	struct sockopt sopt;
 	int error;
 
 	entry = (struct tcp_log_dev_log_queue *)param;
 
 	/* Take a worst-case guess at space needs. */
 	sopt.sopt_valsize = sizeof(struct tcp_log_header) +
 	    entry->tldl_count * (sizeof(struct tcp_log_buffer) +
 	    sizeof(struct tcp_log_verbose));
 	hdr = malloc(sopt.sopt_valsize, M_TCPLOGDEV, M_NOWAIT);
 	if (hdr == NULL) {
 #ifdef TCPLOG_DEBUG_COUNTERS
 		counter_u64_add(tcp_log_que_fail5, entry->tldl_count);
 #endif
 		return (NULL);
 	}
 	sopt.sopt_val = hdr + 1;
 	sopt.sopt_valsize -= sizeof(struct tcp_log_header);
 	sopt.sopt_td = NULL;
 
 	error = tcp_log_logs_to_buf(&sopt, &entry->tldl_entries,
 	    (struct tcp_log_buffer **)&end, entry->tldl_count);
 	if (error) {
 		free(hdr, M_TCPLOGDEV);
 		return (NULL);
 	}
 
 	/* Free the entries. */
 	tcp_log_free_entries(&entry->tldl_entries, &entry->tldl_count);
 	entry->tldl_count = 0;
 
 	memset(hdr, 0, sizeof(struct tcp_log_header));
 	hdr->tlh_version = TCP_LOG_BUF_VER;
 	hdr->tlh_type = TCP_LOG_DEV_TYPE_BBR;
 	hdr->tlh_length = end - (uint8_t *)hdr;
 	hdr->tlh_ie = entry->tldl_ie;
 	hdr->tlh_af = entry->tldl_af;
 	getboottime(&hdr->tlh_offset);
 	strlcpy(hdr->tlh_id, entry->tldl_id, TCP_LOG_ID_LEN);
 	strlcpy(hdr->tlh_tag, entry->tldl_tag, TCP_LOG_TAG_LEN);
 	strlcpy(hdr->tlh_reason, entry->tldl_reason, TCP_LOG_REASON_LEN);
 	return ((struct tcp_log_common_header *)hdr);
 }
 
 /*
  * Queue the tcpcb's log buffer for transmission via the log buffer facility.
  *
  * NOTE: This should be called with a write lock on the PCB.
  *
  * how should be M_WAITOK or M_NOWAIT. If M_WAITOK, the function will drop
  * and reacquire the INP lock if it needs to do so.
  *
  * If force is false, this will only dump auto-logged sessions if
  * tcp_log_auto_all is true or if there is a log ID defined for the session.
  *
  * reason is copied into the queue entry; when it is NULL, "UNKNOWN" is
  * recorded instead.
  *
  * Returns 0 on success (including when there was nothing to dump or the
  * entries were discarded), ENOBUFS if the queue entry could not be
  * allocated with M_NOWAIT, or ECONNRESET if the connection was dropped
  * while the lock was released for an M_WAITOK allocation.
  */
 int
 tcp_log_dump_tp_logbuf(struct tcpcb *tp, char *reason, int how, bool force)
 {
 	struct tcp_log_dev_log_queue *entry;
 	struct inpcb *inp = tptoinpcb(tp);
 #ifdef TCPLOG_DEBUG_COUNTERS
 	int num_entries;
 #endif
 
 	INP_WLOCK_ASSERT(inp);
 
 	/* If there are no log entries, there is nothing to do. */
 	if (tp->t_lognum == 0)
 		return (0);
 
 	/* Check for a log ID. */
 	if (tp->t_lib == NULL && (tp->t_flags2 & TF2_LOG_AUTO) &&
 	    !tcp_log_auto_all && !force) {
 		struct tcp_log_mem *log_entry;
 
 		/*
 		 * We needed a log ID and none was found. Free the log entries
 		 * and return success. Also, cancel further logging. If the
 		 * session doesn't have a log ID by now, we'll assume it isn't
 		 * going to get one.
 		 */
 		while ((log_entry = STAILQ_FIRST(&tp->t_logs)) != NULL)
 			tcp_log_remove_log_head(tp, log_entry);
 		KASSERT(tp->t_lognum == 0,
 		    ("%s: After freeing entries, tp->t_lognum=%d (expected 0)",
 			__func__, tp->t_lognum));
 		tp->_t_logstate = TCP_LOG_STATE_OFF;
 		return (0);
 	}
 
 	/*
 	 * Allocate memory. If we must wait, we'll need to drop the locks
 	 * and reacquire them (and do all the related business that goes
 	 * along with that).
 	 */
 	entry = malloc(sizeof(struct tcp_log_dev_log_queue), M_TCPLOGDEV,
 	    M_NOWAIT);
 	if (entry == NULL && (how & M_NOWAIT)) {
 #ifdef TCPLOG_DEBUG_COUNTERS
 		counter_u64_add(tcp_log_que_fail3, 1);
 #endif
 		return (ENOBUFS);
 	}
 	if (entry == NULL) {
 		INP_WUNLOCK(inp);
 		entry = malloc(sizeof(struct tcp_log_dev_log_queue),
 		    M_TCPLOGDEV, M_WAITOK);
 		INP_WLOCK(inp);
 		/*
 		 * Note that this check is slightly overly-restrictive in
 		 * that the TCB can survive either of these events.
 		 * However, there is currently not a good way to ensure
 		 * that is the case. So, if we hit this M_WAIT path, we
 		 * may end up dropping some entries. That seems like a
 		 * small price to pay for safety.
 		 */
 		if (inp->inp_flags & INP_DROPPED) {
 			free(entry, M_TCPLOGDEV);
 #ifdef TCPLOG_DEBUG_COUNTERS
 			counter_u64_add(tcp_log_que_fail2, 1);
 #endif
 			return (ECONNRESET);
 		}
 		tp = intotcpcb(inp);
 		/* The log may have been emptied while we were unlocked. */
 		if (tp->t_lognum == 0) {
 			free(entry, M_TCPLOGDEV);
 			return (0);
 		}
 	}
 
 	/* Fill in the unique parts of the queue entry. */
 	if (tp->t_lib != NULL) {
 		strlcpy(entry->tldl_id, tp->t_lib->tlb_id, TCP_LOG_ID_LEN);
 		strlcpy(entry->tldl_tag, tp->t_lib->tlb_tag, TCP_LOG_TAG_LEN);
 	} else {
 		strlcpy(entry->tldl_id, "UNKNOWN", TCP_LOG_ID_LEN);
 		strlcpy(entry->tldl_tag, "UNKNOWN", TCP_LOG_TAG_LEN);
 	}
 	/* Bound both copies by the size used for tldl_reason above. */
 	if (reason != NULL)
 		strlcpy(entry->tldl_reason, reason, TCP_LOG_REASON_LEN);
 	else
 		strlcpy(entry->tldl_reason, "UNKNOWN", TCP_LOG_REASON_LEN);
 	entry->tldl_ie = inp->inp_inc.inc_ie;
 	if (inp->inp_inc.inc_flags & INC_ISIPV6)
 		entry->tldl_af = AF_INET6;
 	else
 		entry->tldl_af = AF_INET;
 	entry->tldl_entries = tp->t_logs;
 	entry->tldl_count = tp->t_lognum;
 
 	/* Fill in the common parts of the queue entry. */
 	entry->tldl_common.tldq_buf = NULL;
 	entry->tldl_common.tldq_xform = tcp_log_expandlogbuf;
 	entry->tldl_common.tldq_dtor = tcp_log_free_queue;
 
 	/* Clear the log data from the TCPCB. */
 #ifdef TCPLOG_DEBUG_COUNTERS
 	num_entries = tp->t_lognum;
 #endif
 	tp->t_lognum = 0;
 	STAILQ_INIT(&tp->t_logs);
 
 	/* Add the entry. If no one is listening, free the entry. */
 	if (tcp_log_dev_add_log((struct tcp_log_dev_queue *)entry)) {
 		tcp_log_free_queue((struct tcp_log_dev_queue *)entry);
 #ifdef TCPLOG_DEBUG_COUNTERS
 		counter_u64_add(tcp_log_que_fail1, num_entries);
 	} else {
 		counter_u64_add(tcp_log_queued, num_entries);
 #endif
 	}
 	return (0);
 }
 
 /*
  * Queue the log_id_node's log buffers for transmission via the log buffer
  * facility.
  *
  * NOTE: This should be called with the bucket locked and referenced.
  *
  * how should be M_WAITOK or M_NOWAIT. If M_WAITOK, the function will drop
  * and reacquire the bucket lock if it needs to do so. (The caller must
  * ensure that the tln is no longer on any lists so no one else will mess
  * with this while the lock is dropped!)
  *
  * reason is copied into the queue entry; when it is NULL, "UNKNOWN" is
  * recorded instead.
  *
  * Returns 0 when the node had no entries or when its entries were handed
  * to a queue entry (which is freed again if no one is listening). Returns
  * ENOBUFS, leaving the node's entries untouched, if the queue entry could
  * not be allocated with M_NOWAIT. The node's own list head and count are
  * not reset by this function.
  */
 static int
 tcp_log_dump_node_logbuf(struct tcp_log_id_node *tln, char *reason, int how)
 {
 	struct tcp_log_dev_log_queue *entry;
 	struct tcp_log_id_bucket *tlb;
 
 	tlb = tln->tln_bucket;
 	TCPID_BUCKET_LOCK_ASSERT(tlb);
 	KASSERT(tlb->tlb_refcnt > 0,
 	    ("%s:%d: Called with unreferenced bucket (tln=%p, tlb=%p)",
 	    __func__, __LINE__, tln, tlb));
 	KASSERT(tln->tln_closed,
 	    ("%s:%d: Called for node with tln_closed==false (tln=%p)",
 	    __func__, __LINE__, tln));
 
 	/* If there are no log entries, there is nothing to do. */
 	if (tln->tln_count == 0)
 		return (0);
 
 	/*
 	 * Allocate memory. If we must wait, we'll need to drop the locks
 	 * and reacquire them (and do all the related business that goes
 	 * along with that).
 	 */
 	entry = malloc(sizeof(struct tcp_log_dev_log_queue), M_TCPLOGDEV,
 	    M_NOWAIT);
 	if (entry == NULL && (how & M_NOWAIT))
 		return (ENOBUFS);
 	if (entry == NULL) {
 		TCPID_BUCKET_UNLOCK(tlb);
 		entry = malloc(sizeof(struct tcp_log_dev_log_queue),
 		    M_TCPLOGDEV, M_WAITOK);
 		TCPID_BUCKET_LOCK(tlb);
 	}
 
 	/* Fill in the common parts of the queue entry. */
 	entry->tldl_common.tldq_buf = NULL;
 	entry->tldl_common.tldq_xform = tcp_log_expandlogbuf;
 	entry->tldl_common.tldq_dtor = tcp_log_free_queue;
 
 	/* Fill in the unique parts of the queue entry. */
 	strlcpy(entry->tldl_id, tlb->tlb_id, TCP_LOG_ID_LEN);
 	strlcpy(entry->tldl_tag, tlb->tlb_tag, TCP_LOG_TAG_LEN);
 	/* Bound both copies by the size used for tldl_reason. */
 	if (reason != NULL)
 		strlcpy(entry->tldl_reason, reason, TCP_LOG_REASON_LEN);
 	else
 		strlcpy(entry->tldl_reason, "UNKNOWN", TCP_LOG_REASON_LEN);
 	entry->tldl_ie = tln->tln_ie;
 	entry->tldl_entries = tln->tln_entries;
 	entry->tldl_count = tln->tln_count;
 	entry->tldl_af = tln->tln_af;
 
 	/* Add the entry. If no one is listening, free the entry. */
 	if (tcp_log_dev_add_log((struct tcp_log_dev_queue *)entry))
 		tcp_log_free_queue((struct tcp_log_dev_queue *)entry);
 
 	return (0);
 }
 
 /*
  * Queue the log buffers for all sessions in a bucket for transmission via
  * the log buffer facility.
  *
  * Nodes that are already closed are removed from the expire queue and
  * from the bucket, dumped with tcp_log_dump_node_logbuf(), and freed.
  * Nodes still attached to a TCPCB are dumped with tcp_log_dump_tp_logbuf()
  * and left on the bucket list. Dumps that fail under M_NOWAIT are saved in
  * a small on-stack array (up to LOCAL_SAVE nodes) and retried with
  * M_WAITOK once the list walk is finished.
  *
  * NOTE: This should be called with a locked bucket; however, the function
  * will drop the lock.
  */
 #define	LOCAL_SAVE	10
 static void
 tcp_log_dumpbucketlogs(struct tcp_log_id_bucket *tlb, char *reason)
 {
 	struct tcp_log_id_node local_entries[LOCAL_SAVE];
 	struct inpcb *inp;
 	struct tcpcb *tp;
 	struct tcp_log_id_node *cur_tln, *prev_tln, *tmp_tln;
 	int i, num_local_entries, tree_locked;
 	bool expireq_locked;
 
 	TCPID_BUCKET_LOCK_ASSERT(tlb);
 
 	/*
 	 * Take a reference on the bucket to keep it from disappearing until
 	 * we are done.
 	 */
 	TCPID_BUCKET_REF(tlb);
 
 	/*
 	 * We'll try to create these without dropping locks. However, we
 	 * might very well need to drop locks to get memory. If that's the
 	 * case, we'll save up to LOCAL_SAVE on the stack, and sacrifice the
 	 * rest. (Otherwise, we need to worry about finding our place again
 	 * in a potentially changed list. It just doesn't seem worth the
 	 * trouble to do that.)
 	 */
 	expireq_locked = false;
 	num_local_entries = 0;
 	prev_tln = NULL;
 	tree_locked = TREE_UNLOCKED;
 	SLIST_FOREACH_SAFE(cur_tln, &tlb->tlb_head, tln_list, tmp_tln) {
 		/*
 		 * If this isn't associated with a TCPCB, we can pull it off
 		 * the list now. We need to be careful that the expire timer
 		 * hasn't already taken ownership (tln_expiretime == SBT_MAX).
 		 * If so, we let the expire timer code free the data.
 		 */
 		if (cur_tln->tln_closed) {
 			/*
 			 * This label is also the target of a goto from
 			 * further down in the loop body, taken when a node
 			 * turns out to be closed after its INP is locked.
 			 */
 no_inp:
 			/*
 			 * Get the expireq lock so we can get a consistent
 			 * read of tln_expiretime and so we can remove this
 			 * from the expireq.
 			 */
 			if (!expireq_locked) {
 				TCPLOG_EXPIREQ_LOCK();
 				expireq_locked = true;
 			}
 
 			/*
 			 * We ignore entries with tln_expiretime == SBT_MAX.
 			 * The expire timer code already owns those.
 			 */
 			KASSERT(cur_tln->tln_expiretime > (sbintime_t) 0,
 			    ("%s:%d: node on the expire queue without positive "
 			    "expire time", __func__, __LINE__));
 			if (cur_tln->tln_expiretime == SBT_MAX) {
 				/* Node stays on the bucket list. */
 				prev_tln = cur_tln;
 				continue;
 			}
 
 			/* Remove the entry from the expireq. */
 			STAILQ_REMOVE(&tcp_log_expireq_head, cur_tln,
 			    tcp_log_id_node, tln_expireq);
 
 			/* Remove the entry from the bucket. */
 			if (prev_tln != NULL)
 				SLIST_REMOVE_AFTER(prev_tln, tln_list);
 			else
 				SLIST_REMOVE_HEAD(&tlb->tlb_head, tln_list);
 
 			/*
 			 * Drop the INP and bucket reference counts. Due to
 			 * lock-ordering rules, we need to drop the expire
 			 * queue lock.
 			 */
 			TCPLOG_EXPIREQ_UNLOCK();
 			expireq_locked = false;
 
 			/* Drop the INP reference. */
 			INP_WLOCK(cur_tln->tln_inp);
 			if (!in_pcbrele_wlocked(cur_tln->tln_inp))
 				INP_WUNLOCK(cur_tln->tln_inp);
 
 			/*
 			 * Drop the bucket reference this node held. A true
 			 * return is not expected here, since this function
 			 * took its own reference on entry.
 			 */
 			if (tcp_log_unref_bucket(tlb, &tree_locked, NULL)) {
 #ifdef INVARIANTS
 				panic("%s: Bucket refcount unexpectedly 0.",
 				    __func__);
 #endif
 				/*
 				 * Recover as best we can: free the entry we
 				 * own.
 				 */
 				tcp_log_free_entries(&cur_tln->tln_entries,
 				    &cur_tln->tln_count);
 				uma_zfree(tcp_log_id_node_zone, cur_tln);
 				goto done;
 			}
 
 			if (tcp_log_dump_node_logbuf(cur_tln, reason,
 			    M_NOWAIT)) {
 				/*
 				 * If we have space, save the entries locally.
 				 * Otherwise, free them.
 				 */
 				if (num_local_entries < LOCAL_SAVE) {
 					/* Struct copy onto our stack. */
 					local_entries[num_local_entries] =
 					    *cur_tln;
 					num_local_entries++;
 				} else {
 					tcp_log_free_entries(
 					    &cur_tln->tln_entries,
 					    &cur_tln->tln_count);
 				}
 			}
 
 			/* No matter what, we are done with the node now. */
 			uma_zfree(tcp_log_id_node_zone, cur_tln);
 
 			/*
 			 * Because we removed this entry from the list, prev_tln
 			 * (which tracks the previous entry still on the tlb
 			 * list) remains unchanged.
 			 */
 			continue;
 		}
 
 		/*
 		 * If we get to this point, the session data is still held in
 		 * the TCPCB. So, we need to pull the data out of that.
 		 *
 		 * We will need to drop the expireq lock so we can lock the INP.
 		 * We can then try to extract the data the "easy" way. If that
 		 * fails, we'll save the log entries for later.
 		 */
 		if (expireq_locked) {
 			TCPLOG_EXPIREQ_UNLOCK();
 			expireq_locked = false;
 		}
 
 		/* Lock the INP and then re-check the state. */
 		inp = cur_tln->tln_inp;
 		INP_WLOCK(inp);
 		/*
 		 * If we caught this while it was transitioning, the data
 		 * might have moved from the TCPCB to the tln (signified by
 		 * setting tln_closed to true). If so, treat this like an
 		 * inactive connection.
 		 */
 		if (cur_tln->tln_closed) {
 			/*
 			 * It looks like we may have caught this connection
 			 * while it was transitioning from active to inactive.
 			 * Treat this like an inactive connection.
 			 */
 			INP_WUNLOCK(inp);
 			goto no_inp;
 		}
 
 		/*
 		 * Try to dump the data from the tp without dropping the lock.
 		 * If this fails, try to save off the data locally.
 		 */
 		tp = cur_tln->tln_tp;
 		if (tcp_log_dump_tp_logbuf(tp, reason, M_NOWAIT, true) &&
 		    num_local_entries < LOCAL_SAVE) {
 			tcp_log_move_tp_to_node(tp,
 			    &local_entries[num_local_entries]);
 			/*
 			 * Mark the local copy closed; the retry below uses
 			 * tcp_log_dump_node_logbuf(), which asserts this.
 			 */
 			local_entries[num_local_entries].tln_closed = 1;
 			KASSERT(local_entries[num_local_entries].tln_bucket ==
 			    tlb, ("%s: %d: bucket mismatch for node %p",
 			    __func__, __LINE__, cur_tln));
 			num_local_entries++;
 		}
 
 		INP_WUNLOCK(inp);
 
 		/*
 		 * We are going to leave the current tln on the list. It will
 		 * become the previous tln.
 		 */
 		prev_tln = cur_tln;
 	}
 
 	/* Drop our locks, if any. */
 	KASSERT(tree_locked == TREE_UNLOCKED,
 	    ("%s: %d: tree unexpectedly locked", __func__, __LINE__));
 	switch (tree_locked) {
 	case TREE_WLOCKED:
 		TCPID_TREE_WUNLOCK();
 		tree_locked = TREE_UNLOCKED;
 		break;
 	case TREE_RLOCKED:
 		TCPID_TREE_RUNLOCK();
 		tree_locked = TREE_UNLOCKED;
 		break;
 	}
 	if (expireq_locked) {
 		TCPLOG_EXPIREQ_UNLOCK();
 		expireq_locked = false;
 	}
 
 	/*
 	 * Try again for any saved entries, this time allowing the
 	 * allocation to sleep (M_WAITOK). Since the nodes themselves are on
 	 * our stack, we don't need to free them.
 	 */
 	for (i = 0; i < num_local_entries; i++)
 		tcp_log_dump_node_logbuf(&local_entries[i], reason, M_WAITOK);
 
 	/*
 	 * Drop our reference. The bucket is only unlocked here when
 	 * tcp_log_unref_bucket() returns false.
 	 */
 	if (!tcp_log_unref_bucket(tlb, &tree_locked, NULL))
 		TCPID_BUCKET_UNLOCK(tlb);
 
 done:
 	/* Drop our locks, if any. */
 	switch (tree_locked) {
 	case TREE_WLOCKED:
 		TCPID_TREE_WUNLOCK();
 		break;
 	case TREE_RLOCKED:
 		TCPID_TREE_RUNLOCK();
 		break;
 	}
 	if (expireq_locked)
 		TCPLOG_EXPIREQ_UNLOCK();
 }
 #undef	LOCAL_SAVE
 
 /*
  * Queue the log buffers of every session sharing this connection's log ID
  * bucket for transmission via the log buffer facility. When the
  * connection has no bucket, only its own log buffer is queued.
  *
  * NOTE: This should be called with a locked INP; however, the function
  * will drop the lock.
  */
 void
 tcp_log_dump_tp_bucket_logbufs(struct tcpcb *tp, char *reason)
 {
 	struct tcp_log_id_bucket *bucket;
 	struct inpcb *inp;
 	int tree_state;
 
 	inp = tptoinpcb(tp);
 	INP_WLOCK_ASSERT(inp);
 
 	bucket = tp->t_lib;
 	if (bucket != NULL) {
 		/*
 		 * Hold a temporary reference across the switch from the
 		 * INP lock to the bucket lock.
 		 */
 		TCPID_BUCKET_REF(bucket);
 		INP_WUNLOCK(inp);
 		TCPID_BUCKET_LOCK(bucket);
 
 		tree_state = TREE_UNLOCKED;
 		if (!tcp_log_unref_bucket(bucket, &tree_state, NULL)) {
 			/* Others still reference it: dump the whole bucket. */
 			tcp_log_dumpbucketlogs(bucket, reason);
 		} else if (tree_state == TREE_WLOCKED) {
 			/* We were the last reference; just release the tree. */
 			TCPID_TREE_WUNLOCK();
 		} else if (tree_state == TREE_RLOCKED) {
 			TCPID_TREE_RUNLOCK();
 		}
 		return;
 	}
 
 	/* No bucket: dump just this session's traces. */
 	(void)tcp_log_dump_tp_logbuf(tp, reason, M_WAITOK, true);
 	INP_WUNLOCK(inp);
 }
 
 /*
  * Emit a TCP_LOG_FLOWEND event for the connection, provided logging is
  * not switched off for it. A stack can add stack-specific info to this
  * trace event by overriding this function (see bbr_log_flowend() for
  * example).
  */
 void
 tcp_log_flowend(struct tcpcb *tp)
 {
 	struct socket *sock;
 
 	/* Nothing to record when logging is off. */
 	if (tp->_t_logstate == TCP_LOG_STATE_OFF)
 		return;
 
 	sock = tptosocket(tp);
 	TCP_LOG_EVENT(tp, NULL, &sock->so_rcv, &sock->so_snd,
 	    TCP_LOG_FLOWEND, 0, 0, NULL, false);
 }
 
 /*
  * Record a TCP_LOG_SENDFILE event (offset, length and flags) for the
  * connection behind so, if logging is enabled for it. When the kernel is
  * built with TCP_REQUEST_TRK, also update the connection's request
  * tracking entries that match the given file offset.
  *
  * The INP write lock is taken and released inside this function. Nothing
  * is done if the connection has been dropped or if its log state is off
  * at the initial unlocked check.
  */
 void
 tcp_log_sendfile(struct socket *so, off_t offset, size_t nbytes, int flags)
 {
 	struct inpcb *inp;
 	struct tcpcb *tp;
 #ifdef TCP_REQUEST_TRK
 	struct tcp_sendfile_track *ent;
 	int i, fnd;
 #endif
 
 	inp = sotoinpcb(so);
 	KASSERT(inp != NULL, ("tcp_log_sendfile: inp == NULL"));
 
 	/* quick check to see if logging is enabled for this connection */
 	tp = intotcpcb(inp);
 	if ((inp->inp_flags & INP_DROPPED) ||
 	    (tp->_t_logstate == TCP_LOG_STATE_OFF)) {
 		return;
 	}
 
 	INP_WLOCK(inp);
 	/* double check log state now that we have the lock */
 	if (inp->inp_flags & INP_DROPPED)
 		goto done;
 	if (tp->_t_logstate != TCP_LOG_STATE_OFF) {
 		struct timeval tv;
 		tcp_log_eventspecific_t log;
 
 		microuptime(&tv);
 		log.u_sf.offset = offset;
 		log.u_sf.length = nbytes;
 		log.u_sf.flags = flags;
 
 		TCP_LOG_EVENTP(tp, NULL,
 		    &tptosocket(tp)->so_rcv,
 		    &tptosocket(tp)->so_snd,
 		    TCP_LOG_SENDFILE, 0, 0, &log, false, &tv);
 	}
 #ifdef TCP_REQUEST_TRK
 	if (tp->t_tcpreq_req == 0) {
 		/* No http requests to track */
 		goto done;
 	}
 	fnd = 0;
 	if (tp->t_tcpreq_closed == 0) {
 		/* No closed end req to track */
 		goto skip_closed_req;
 	}
 	/* First pass: closed-end requests that are not yet complete. */
 	for(i = 0; i < MAX_TCP_TRK_REQ; i++) {
 		/* Lets see if this one can be found */
 		ent = &tp->t_tcpreq_info[i];
 		if (ent->flags == TCP_TRK_TRACK_FLG_EMPTY) {
 			/* Not used */
 			continue;
 		}
 		if (ent->flags & TCP_TRK_TRACK_FLG_OPEN) {
 			/* This pass does not consider open requests */
 			continue;
 		}
 		if (ent->flags & TCP_TRK_TRACK_FLG_COMP) {
 			/* Don't look at what we have completed */
 			continue;
 		}
 		/* If we reach here it is an allocated closed-end request */
 		if ((ent->start == offset) ||
 		    ((offset > ent->start) && (offset < ent->end))){
 			/* The offset falls within this request. */
 			fnd = 1;
 		}
 		if (fnd) {
 			/*
 			 * This sendfile call belongs to this request; mark
 			 * its sequence information as valid.
 			 */
 			ent->flags |= TCP_TRK_TRACK_FLG_SEQV;
 			/*
 			 * When an entry completes we can take (snd_una + sb_ccc) and know where
 			 * the end of the range really is. Note that this works since two
 			 * requests must be sequential and sendfile now is complete for *this* request.
 			 * We must use sb_ccc since the data may still be in-flight in TLS.
 			 *
 			 * We always cautiously move the end_seq only if our calculations
 			 * show it happened (just in case sf has the call to here at the wrong
 			 * place). When we go COMP we will stop coming here and hopefully be
 			 * left with the correct end_seq.
 			 */
 			if (SEQ_GT((tp->snd_una + so->so_snd.sb_ccc), ent->end_seq))
 				ent->end_seq = tp->snd_una + so->so_snd.sb_ccc;
 			/* At or past the end of the request: it is complete. */
 			if ((offset + nbytes) >= ent->end) {
 				ent->flags |= TCP_TRK_TRACK_FLG_COMP;
 				tcp_req_log_req_info(tp, ent, i, TCP_TRK_REQ_LOG_COMPLETE, offset, nbytes);
 			} else {
 				tcp_req_log_req_info(tp, ent, i, TCP_TRK_REQ_LOG_MOREYET, offset, nbytes);
 			}
 			/* We assume that sendfile never sends overlapping requests */
 			goto done;
 		}
 	}
 skip_closed_req:
 	/*
 	 * A match in the first pass jumps straight to done, so fnd is
 	 * still 0 whenever this point is reached.
 	 */
 	if (!fnd) {
 		/* Ok now lets look for open requests */
 		for(i = 0; i < MAX_TCP_TRK_REQ; i++) {
 			ent = &tp->t_tcpreq_info[i];
 			if (ent->flags == TCP_TRK_TRACK_FLG_EMPTY) {
 				/* Not used */
 				continue;
 			}
 			if ((ent->flags & TCP_TRK_TRACK_FLG_OPEN) == 0)
 				continue;
 			/* If we reach here it is an allocated open request */
 			if (ent->start == offset) {
 				/* It begins this request */
 				ent->start_seq = tp->snd_una +
 				    tptosocket(tp)->so_snd.sb_ccc;
 				ent->flags |= TCP_TRK_TRACK_FLG_SEQV;
 				break;
 			} else if (offset > ent->start) {
 				/* Past the start: only mark the entry. */
 				ent->flags |= TCP_TRK_TRACK_FLG_SEQV;
 				break;
 			}
 		}
 	}
 #endif
 done:
 	INP_WUNLOCK(inp);
 }
diff --git a/sys/netinet/tcp_stacks/bbr.c b/sys/netinet/tcp_stacks/bbr.c
index 1e8053afc45c..d9952ba6bd14 100644
--- a/sys/netinet/tcp_stacks/bbr.c
+++ b/sys/netinet/tcp_stacks/bbr.c
@@ -1,14798 +1,14798 @@
 /*-
  * Copyright (c) 2016-2020 Netflix, Inc.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  */
 /**
  * Author: Randall Stewart <rrs@netflix.com>
  * This work is based on the ACM Queue paper
  * BBR - Congestion Based Congestion Control
  * and also numerous discussions with Neal, Yuchung and Van.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include "opt_inet.h"
 #include "opt_inet6.h"
 #include "opt_ipsec.h"
 #include "opt_ratelimit.h"
 #include <sys/param.h>
 #include <sys/arb.h>
 #include <sys/module.h>
 #include <sys/kernel.h>
 #include <sys/libkern.h>
 #ifdef TCP_HHOOK
 #include <sys/hhook.h>
 #endif
 #include <sys/malloc.h>
 #include <sys/mbuf.h>
 #include <sys/proc.h>
 #include <sys/socket.h>
 #include <sys/socketvar.h>
 #include <sys/sysctl.h>
 #include <sys/systm.h>
 #ifdef STATS
 #include <sys/qmath.h>
 #include <sys/tree.h>
 #include <sys/stats.h> /* Must come after qmath.h and tree.h */
 #endif
 #include <sys/refcount.h>
 #include <sys/queue.h>
 #include <sys/eventhandler.h>
 #include <sys/smp.h>
 #include <sys/kthread.h>
 #include <sys/lock.h>
 #include <sys/mutex.h>
 #include <sys/tim_filter.h>
 #include <sys/time.h>
 #include <sys/protosw.h>
 #include <vm/uma.h>
 #include <sys/kern_prefetch.h>
 
 #include <net/route.h>
 #include <net/route/nhop.h>
 #include <net/vnet.h>
 
 #define TCPSTATES		/* for logging */
 
 #include <netinet/in.h>
 #include <netinet/in_kdtrace.h>
 #include <netinet/in_pcb.h>
 #include <netinet/ip.h>
 #include <netinet/ip_icmp.h>	/* required for icmp_var.h */
 #include <netinet/icmp_var.h>	/* for ICMP_BANDLIM */
 #include <netinet/ip_var.h>
 #include <netinet/ip6.h>
 #include <netinet6/in6_pcb.h>
 #include <netinet6/ip6_var.h>
 #define	TCPOUTFLAGS
 #include <netinet/tcp.h>
 #include <netinet/tcp_fsm.h>
 #include <netinet/tcp_seq.h>
 #include <netinet/tcp_timer.h>
 #include <netinet/tcp_var.h>
 #include <netinet/tcpip.h>
 #include <netinet/tcp_hpts.h>
 #include <netinet/cc/cc.h>
 #include <netinet/tcp_log_buf.h>
 #include <netinet/tcp_ratelimit.h>
 #include <netinet/tcp_lro.h>
 #ifdef TCP_OFFLOAD
 #include <netinet/tcp_offload.h>
 #endif
 #ifdef INET6
 #include <netinet6/tcp6_var.h>
 #endif
 #include <netinet/tcp_fastopen.h>
 
 #include <netipsec/ipsec_support.h>
 #include <net/if.h>
 #include <net/if_var.h>
 #include <net/ethernet.h>
 
 #if defined(IPSEC) || defined(IPSEC_SUPPORT)
 #include <netipsec/ipsec.h>
 #include <netipsec/ipsec6.h>
 #endif				/* IPSEC */
 
 #include <netinet/udp.h>
 #include <netinet/udp_var.h>
 #include <machine/in_cksum.h>
 
 #ifdef MAC
 #include <security/mac/mac_framework.h>
 #endif
 
 #include "sack_filter.h"
 #include "tcp_bbr.h"
 #include "rack_bbr_common.h"
 uma_zone_t bbr_zone;
 uma_zone_t bbr_pcb_zone;
 
 struct sysctl_ctx_list bbr_sysctl_ctx;
 struct sysctl_oid *bbr_sysctl_root;
 
 /*
  * Store (value) into (tv) and then clamp (tv) to the closed range
  * [tvmin, tvmax]. Both range comparisons are made after casting the
  * operands to u_long. (value) is expanded once, but (tv), (tvmin) and
  * (tvmax) are expanded more than once, so callers should pass
  * expressions without side effects.
  */
 #define	TCPT_RANGESET_NOSLOP(tv, value, tvmin, tvmax) do { \
 	(tv) = (value); \
 	if ((u_long)(tv) < (u_long)(tvmin)) \
 		(tv) = (tvmin); \
 	if ((u_long)(tv) > (u_long)(tvmax)) \
 		(tv) = (tvmax); \
 } while(0)
 
 /*#define BBR_INVARIANT 1*/
 
 /*
  * initial window
  */
 static uint32_t bbr_def_init_win = 10;
 static int32_t bbr_persist_min = 250000;	/* 250ms */
 static int32_t bbr_persist_max = 1000000;	/* 1 Second */
 static int32_t bbr_cwnd_may_shrink = 0;
 static int32_t bbr_cwndtarget_rtt_touse = BBR_RTT_PROP;
 static int32_t bbr_num_pktepo_for_del_limit = BBR_NUM_RTTS_FOR_DEL_LIMIT;
 static int32_t bbr_hardware_pacing_limit = 8000;
 static int32_t bbr_quanta = 3;	/* How much extra quanta do we get? */
 static int32_t bbr_no_retran = 0;
 
 static int32_t bbr_error_base_paceout = 10000; /* usec to pace */
 static int32_t bbr_max_net_error_cnt = 10;
 /* Should the following be dynamic too -- loss wise */
 static int32_t bbr_rtt_gain_thresh = 0;
 /* Measurement controls */
 static int32_t bbr_use_google_algo = 1;
 static int32_t bbr_ts_limiting = 1;
 static int32_t bbr_ts_can_raise = 0;
 static int32_t bbr_do_red = 600;
 static int32_t bbr_red_scale = 20000;
 static int32_t bbr_red_mul = 1;
 static int32_t bbr_red_div = 2;
 static int32_t bbr_red_growth_restrict = 1;
 static int32_t  bbr_target_is_bbunit = 0;
 static int32_t bbr_drop_limit = 0;
 /*
  * How much gain do we need to see to
  * stay in startup?
  */
 static int32_t bbr_marks_rxt_sack_passed = 0;
 static int32_t bbr_start_exit = 25;
 static int32_t bbr_low_start_exit = 25;	/* When we are in reduced gain */
 static int32_t bbr_startup_loss_thresh = 2000;	/* 20.00% loss */
 static int32_t bbr_hptsi_max_mul = 1;	/* These two mul/div assure a min pacing */
 static int32_t bbr_hptsi_max_div = 2;	/* time, 0 means turned off. We need this
 					 * if we go back ever to where the pacer
 					 * has priority over timers.
 					 */
 static int32_t bbr_policer_call_from_rack_to = 0;
 static int32_t bbr_policer_detection_enabled = 1;
 static int32_t bbr_min_measurements_req = 1;	/* We need at least 2
 						 * measurements before we are
 						 * "good" note that 2 == 1.
 						 * This is because we use a >
 						 * comparison. This means if
 						 * min_measure was 0, it takes
 						 * num-measures > min(0) and
 						 * you get 1 measurement and
 						 * you are good. Set to 1, you
 						 * have to have two
 						 * measurements (this is done
 						 * to prevent it from being ok
 						 * to have no measurements). */
 static int32_t bbr_no_pacing_until = 4;
 
 static int32_t bbr_min_usec_delta = 20000;	/* 20,000 usecs */
 static int32_t bbr_min_peer_delta = 20;		/* 20 units */
 static int32_t bbr_delta_percent = 150;		/* 15.0 % */
 
 static int32_t bbr_target_cwnd_mult_limit = 8;
 /*
  * bbr_cwnd_min_val is the number of
  * segments we hold to in the RTT probe
  * state typically 4.
  */
 static int32_t bbr_cwnd_min_val = BBR_PROBERTT_NUM_MSS;
 
 static int32_t bbr_cwnd_min_val_hs = BBR_HIGHSPEED_NUM_MSS;
 
 static int32_t bbr_gain_to_target = 1;
 static int32_t bbr_gain_gets_extra_too = 1;
 /*
  * bbr_high_gain is the 2/ln(2) value we need
  * to double the sending rate in startup. This
  * is used for both cwnd and hptsi gain's.
  */
 static int32_t bbr_high_gain = BBR_UNIT * 2885 / 1000 + 1;
 static int32_t bbr_startup_lower = BBR_UNIT * 1500 / 1000 + 1;
 static int32_t bbr_use_lower_gain_in_startup = 1;
 
 /* thresholds for reduction on drain in sub-states/drain */
 static int32_t bbr_drain_rtt = BBR_SRTT;
 static int32_t bbr_drain_floor = 88;
 static int32_t google_allow_early_out = 1;
 static int32_t google_consider_lost = 1;
 static int32_t bbr_drain_drop_mul = 4;
 static int32_t bbr_drain_drop_div = 5;
 static int32_t bbr_rand_ot = 50;
 static int32_t bbr_can_force_probertt = 0;
 static int32_t bbr_can_adjust_probertt = 1;
 static int32_t bbr_probertt_sets_rtt = 0;
 static int32_t bbr_can_use_ts_for_rtt = 1;
 static int32_t bbr_is_ratio = 0;
 static int32_t bbr_sub_drain_app_limit = 1;
 static int32_t bbr_prtt_slam_cwnd = 1;
 static int32_t bbr_sub_drain_slam_cwnd = 1;
 static int32_t bbr_slam_cwnd_in_main_drain = 1;
 static int32_t bbr_filter_len_sec = 6;	/* How long does the rttProp filter
 					 * hold */
 static uint32_t bbr_rtt_probe_limit = (USECS_IN_SECOND * 4);
 /*
  * bbr_drain_gain is the reverse of the high_gain
  * designed to drain back out the standing queue
  * that is formed in startup by causing a larger
  * hptsi gain and thus draining the packets
  * in flight.
  */
 static int32_t bbr_drain_gain = BBR_UNIT * 1000 / 2885;
 static int32_t bbr_rttprobe_gain = 192;
 
 /*
  * The cwnd_gain is the default cwnd gain applied when
  * calculating a target cwnd. Note that the cwnd is
  * a secondary factor in the way BBR works (see the
  * paper and think about it, it will take some time).
  * Basically the hptsi_gain spreads the packets out
  * so you never get more than BDP to the peer even
  * if the cwnd is high. In our implementation that
  * means in non-recovery/retransmission scenarios
  * cwnd will never be reached by the flight-size.
  */
 static int32_t bbr_cwnd_gain = BBR_UNIT * 2;
 static int32_t bbr_tlp_type_to_use = BBR_SRTT;
 static int32_t bbr_delack_time = 100000;	/* 100ms in useconds */
 static int32_t bbr_sack_not_required = 0;	/* set to one to allow non-sack to use bbr */
 static int32_t bbr_initial_bw_bps = 62500;	/* 500kbps in bytes ps */
 static int32_t bbr_ignore_data_after_close = 1;
 /*
  * Table of pacing (hptsi) gains, each expressed as a fraction of
  * BBR_UNIT: one entry at 5/4, one at 3/4 and then six entries at unity.
  * The table holds eight entries, matching BBR_HPTSI_GAIN_MAX below.
  * NOTE(review): presumably indexed by the probe-bw sub-state; confirm
  * against the code that reads it.
  */
 static int16_t bbr_hptsi_gain[] = {
 	(BBR_UNIT *5 / 4),
 	(BBR_UNIT * 3 / 4),
 	BBR_UNIT,
 	BBR_UNIT,
 	BBR_UNIT,
 	BBR_UNIT,
 	BBR_UNIT,
 	BBR_UNIT
 };
 int32_t bbr_use_rack_resend_cheat = 1;
 int32_t bbr_sends_full_iwnd = 1;
 
 #define BBR_HPTSI_GAIN_MAX 8
 /*
  * The BBR module incorporates a number of
  * TCP ideas that have been put out into the IETF
  * over the last few years:
  * - Yuchung Cheng's RACK TCP (for which it's named) that
  *    will stop us using the number of dup acks and instead
  *    use time as the gauge of when we retransmit.
  * - Reorder Detection of RFC4737 and the Tail-Loss probe draft
  *    of Dukkipati et.al.
  * - Van Jacobson's et.al BBR.
  *
  * RACK depends on SACK, so if an endpoint arrives that
  * cannot do SACK the state machine below will shuttle the
  * connection back to using the "default" TCP stack that is
  * in FreeBSD.
  *
  * To implement BBR and RACK the original TCP stack was first decomposed
  * into a functional state machine with individual states
  * for each of the possible TCP connection states. The do_segment
  * functions role in life is to mandate the connection supports SACK
  * initially and then assure that the RACK state matches the conenction
  * state before calling the states do_segment function. Data processing
  * of inbound segments also now happens in the hpts_do_segment in general
  * with only one exception. This is so we can keep the connection on
  * a single CPU.
  *
  * Each state is simplified due to the fact that the original do_segment
  * has been decomposed and we *know* what state we are in (no
  * switches on the state) and all tests for SACK are gone. This
  * greatly simplifies what each state does.
  *
  * TCP output is also over-written with a new version since it
  * must maintain the new rack scoreboard and has had hptsi
  * integrated as a requirement. Still todo is to eliminate the
  * use of the callout_() system and use the hpts for all
  * timers as well.
  */
 static uint32_t bbr_rtt_probe_time = 200000;	/* 200ms in micro seconds */
 static uint32_t bbr_rtt_probe_cwndtarg = 4;	/* How many mss's outstanding */
 static const int32_t bbr_min_req_free = 2;	/* The min we must have on the
 						 * free list */
 static int32_t bbr_tlp_thresh = 1;
 static int32_t bbr_reorder_thresh = 2;
 static int32_t bbr_reorder_fade = 60000000;	/* 0 - never fade, def
 						 * 60,000,000 - 60 seconds */
 static int32_t bbr_pkt_delay = 1000;
 static int32_t bbr_min_to = 1000;	/* Number of usec's minimum timeout */
 static int32_t bbr_incr_timers = 1;
 
 static int32_t bbr_tlp_min = 10000;	/* 10ms in usecs */
 static int32_t bbr_delayed_ack_time = 200000;	/* 200ms in usecs */
 static int32_t bbr_exit_startup_at_loss = 1;
 
 /*
  * bbr_lt_bw_ratio is 1/8th
  * bbr_lt_bw_diff is  < 4 Kbit/sec
  */
 static uint64_t bbr_lt_bw_diff = 4000 / 8;	/* In bytes per second */
 static uint64_t bbr_lt_bw_ratio = 8;	/* For 1/8th */
 static uint32_t bbr_lt_bw_max_rtts = 48;	/* How many rtt's do we use
 						 * the lt_bw for */
 static uint32_t bbr_lt_intvl_min_rtts = 4;	/* Min num of RTT's to measure
 						 * lt_bw */
 static int32_t bbr_lt_intvl_fp = 0;		/* False positive epoch diff */
 static int32_t bbr_lt_loss_thresh = 196;	/* Lost vs delivered % */
 static int32_t bbr_lt_fd_thresh = 100;		/* false detection % */
 
 static int32_t bbr_verbose_logging = 0;
 /*
  * Currently regular tcp has a rto_min of 30ms
  * the backoff goes 12 times so that ends up
  * being a total of 122.850 seconds before a
  * connection is killed.
  */
 static int32_t bbr_rto_min_ms = 30;	/* 30ms same as main freebsd */
 static int32_t bbr_rto_max_sec = 4;	/* 4 seconds */
 
 /****************************************************/
 /* DEFAULT TSO SIZING  (cpu performance impacting)  */
 /****************************************************/
 /* What amount is our formula using to get TSO size */
 static int32_t bbr_hptsi_per_second = 1000;
 
 /*
  * For hptsi under bbr_cross_over connections what is delay
  * target 7ms (in usec) combined with a seg_max of 2
  * gets us close to identical google behavior in
  * TSO size selection (possibly more 1MSS sends).
  */
 static int32_t bbr_hptsi_segments_delay_tar = 7000;
 
 /* Does pacing delay include overhead's in its time calculations? */
 static int32_t bbr_include_enet_oh = 0;
 static int32_t bbr_include_ip_oh = 1;
 static int32_t bbr_include_tcp_oh = 1;
 static int32_t bbr_google_discount = 10;
 
 /* Do we use (nf mode) pkt-epoch to drive us or rttProp? */
 static int32_t bbr_state_is_pkt_epoch = 0;
 static int32_t bbr_state_drain_2_tar = 1;
 /* What is the max the 0 - bbr_cross_over MBPS TSO target
  * can reach using our delay target. Note that this
  * value becomes the floor for the cross over
  * algorithm.
  */
 static int32_t bbr_hptsi_segments_max = 2;
 static int32_t bbr_hptsi_segments_floor = 1;
 static int32_t bbr_hptsi_utter_max = 0;
 
 /* What is the min the 0 - bbr_cross-over MBPS  TSO target can be */
 static int32_t bbr_hptsi_bytes_min = 1460;
 static int32_t bbr_all_get_min = 0;
 
 /* Cross over point from algo-a to algo-b */
 static uint32_t bbr_cross_over = TWENTY_THREE_MBPS;
 
 /* Do we deal with our restart state? */
 static int32_t bbr_uses_idle_restart = 0;
 static int32_t bbr_idle_restart_threshold = 100000;	/* 100ms in useconds */
 
 /* Do we allow hardware pacing? */
 static int32_t bbr_allow_hdwr_pacing = 0;
 static int32_t bbr_hdwr_pace_adjust = 2;	/* multiplier when we calc the tso size */
 static int32_t bbr_hdwr_pace_floor = 1;
 static int32_t bbr_hdwr_pacing_delay_cnt = 10;
 
 /****************************************************/
 static int32_t bbr_resends_use_tso = 0;
 static int32_t bbr_tlp_max_resend = 2;
 static int32_t bbr_sack_block_limit = 128;
 
 #define  BBR_MAX_STAT 19
 counter_u64_t bbr_state_time[BBR_MAX_STAT];
 counter_u64_t bbr_state_lost[BBR_MAX_STAT];
 counter_u64_t bbr_state_resend[BBR_MAX_STAT];
 counter_u64_t bbr_stat_arry[BBR_STAT_SIZE];
 counter_u64_t bbr_opts_arry[BBR_OPTS_SIZE];
 counter_u64_t bbr_out_size[TCP_MSS_ACCT_SIZE];
 counter_u64_t bbr_flows_whdwr_pacing;
 counter_u64_t bbr_flows_nohdwr_pacing;
 
 counter_u64_t bbr_nohdwr_pacing_enobuf;
 counter_u64_t bbr_hdwr_pacing_enobuf;
 
 static inline uint64_t bbr_get_bw(struct tcp_bbr *bbr);
 
 /*
  * Forward declarations of static functions that are used before they are defined.
  */
 static uint32_t
 bbr_get_pacing_length(struct tcp_bbr *bbr, uint16_t gain,
 		      uint32_t useconds_time, uint64_t bw);
 static uint32_t
 bbr_get_a_state_target(struct tcp_bbr *bbr, uint32_t gain);
 static void
 bbr_set_state(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t win);
 static void
 bbr_set_probebw_gains(struct tcp_bbr *bbr,  uint32_t cts, uint32_t losses);
 static void
 bbr_substate_change(struct tcp_bbr *bbr, uint32_t cts, int line,
 		    int dolog);
 static uint32_t
 bbr_get_target_cwnd(struct tcp_bbr *bbr, uint64_t bw, uint32_t gain);
 static void
 bbr_state_change(struct tcp_bbr *bbr, uint32_t cts, int32_t epoch,
 		 int32_t pkt_epoch, uint32_t losses);
 static uint32_t
 bbr_calc_thresh_rack(struct tcp_bbr *bbr, uint32_t srtt, uint32_t cts,
 		     struct bbr_sendmap *rsm);
 static uint32_t
 bbr_initial_cwnd(struct tcp_bbr *bbr, struct tcpcb *tp);
 static uint32_t
 bbr_calc_thresh_tlp(struct tcpcb *tp, struct tcp_bbr *bbr,
 		    struct bbr_sendmap *rsm, uint32_t srtt, uint32_t cts);
 static void
 bbr_exit_persist(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts,
 		 int32_t line);
 static void
 bbr_set_state_target(struct tcp_bbr *bbr, int line);
 static void
 bbr_enter_probe_rtt(struct tcp_bbr *bbr, uint32_t cts, int32_t line);
 static void
 bbr_log_progress_event(struct tcp_bbr *bbr, struct tcpcb *tp, uint32_t tick,
 		       int event, int line);
 static void
 tcp_bbr_tso_size_check(struct tcp_bbr *bbr, uint32_t cts);
 static void
 bbr_setup_red_bw(struct tcp_bbr *bbr, uint32_t cts);
 static void
 bbr_log_rtt_shrinks(struct tcp_bbr *bbr, uint32_t cts, uint32_t applied,
 		    uint32_t rtt, uint32_t line, uint8_t is_start,
 		    uint16_t set);
 static struct bbr_sendmap *
 bbr_find_lowest_rsm(struct tcp_bbr *bbr);
 static __inline uint32_t
 bbr_get_rtt(struct tcp_bbr *bbr, int32_t rtt_type);
 static void
 bbr_log_to_start(struct tcp_bbr *bbr, uint32_t cts, uint32_t to, int32_t slot,
 		 uint8_t which);
 static void
 bbr_log_timer_var(struct tcp_bbr *bbr, int mode, uint32_t cts,
 		  uint32_t time_since_sent, uint32_t srtt,
 		  uint32_t thresh, uint32_t to);
 static void
 bbr_log_hpts_diag(struct tcp_bbr *bbr, uint32_t cts, struct hpts_diag *diag);
 static void
 bbr_log_type_bbrsnd(struct tcp_bbr *bbr, uint32_t len, uint32_t slot,
 		    uint32_t del_by, uint32_t cts, uint32_t sloton,
 		    uint32_t prev_delay);
 static void
 bbr_enter_persist(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts,
 		  int32_t line);
 static void
 bbr_stop_all_timers(struct tcpcb *tp, struct tcp_bbr *bbr);
 static void
 bbr_exit_probe_rtt(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts);
 static void
 bbr_check_probe_rtt_limits(struct tcp_bbr *bbr, uint32_t cts);
 static void
 bbr_timer_cancel(struct tcp_bbr *bbr, int32_t line, uint32_t cts);
 static void
 bbr_log_pacing_delay_calc(struct tcp_bbr *bbr, uint16_t gain, uint32_t len,
 			  uint32_t cts, uint32_t usecs, uint64_t bw,
 			  uint32_t override, int mod);
 static int bbr_ctloutput(struct tcpcb *tp, struct sockopt *sopt);
 
 /*
  * Accessor for the connection's current BBR sub-state, narrowed to the
  * uint8_t this helper returns.
  */
 static inline uint8_t
 bbr_state_val(struct tcp_bbr *bbr)
 {
 	uint8_t substate;

 	substate = bbr->rc_bbr_substate;
 	return (substate);
 }
 
 /*
  * Compute the minimum congestion window for this connection.
  *
  * The per-segment size is the smaller of (t_maxseg - rc_last_options)
  * and rc_pace_max_segs. That size is multiplied by bbr_cwnd_min_val_hs
  * when the BBR_RTT_PROP rtt is below BBR_HIGH_SPEED, otherwise by
  * bbr_cwnd_min_val.
  */
 static inline uint32_t
 get_min_cwnd(struct tcp_bbr *bbr)
 {
 	int seg_size, num_segs;

 	seg_size = min((bbr->rc_tp->t_maxseg - bbr->rc_last_options),
 	    bbr->r_ctl.rc_pace_max_segs);
 	num_segs = (bbr_get_rtt(bbr, BBR_RTT_PROP) < BBR_HIGH_SPEED) ?
 	    bbr_cwnd_min_val_hs : bbr_cwnd_min_val;
 	return (num_segs * seg_size);
 }
 
 static uint32_t
 bbr_get_persists_timer_val(struct tcpcb *tp, struct tcp_bbr *bbr)
 {
 	uint64_t srtt, var;
 	uint64_t ret_val;
 
 	bbr->r_ctl.rc_hpts_flags |= PACE_TMR_PERSIT;
 	if (tp->t_srtt == 0) {
 		srtt = (uint64_t)BBR_INITIAL_RTO;
 		var = 0;
 	} else {
 		srtt = ((uint64_t)TICKS_2_USEC(tp->t_srtt) >> TCP_RTT_SHIFT);
 		var = ((uint64_t)TICKS_2_USEC(tp->t_rttvar) >> TCP_RTT_SHIFT);
 	}
 	TCPT_RANGESET_NOSLOP(ret_val, ((srtt + var) * tcp_backoff[tp->t_rxtshift]),
 	    bbr_persist_min, bbr_persist_max);
 	return ((uint32_t)ret_val);
 }
 
 /*
  * Decide which retransmission-class timer (persist, RXT, RACK or TLP)
  * should run for this connection and compute its timeout.
  *
  * tp  - the TCP control block.
  * bbr - the BBR state attached to tp.
  * cts - the current timestamp, on the same clock as the
  *       r_tim_lastsent[] entries it is compared against.
  *
  * The selected timer is recorded by or-ing the matching PACE_TMR_* bit
  * into bbr->r_ctl.rc_hpts_flags. The return value is the timeout (the
  * bounds applied here are built from MS_IN_USEC / USECS_IN_SECOND, i.e.
  * microseconds), or 0 when no timer is to be run.
  */
 static uint32_t
 bbr_timer_start(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	/*
 	 * Start the FR timer, we do this based on getting the first one in
 	 * the rc_tmap. Note that if its NULL we must stop the timer. in all
 	 * events we need to stop the running timer (if its running) before
 	 * starting the new one.
 	 */
 	uint32_t thresh, exp, to, time_since_sent, tstmp_touse;
 	/*
 	 * srtt is logged on the RXT path, which can be reached before any
 	 * rtt has been fetched; start it at 0 so the log never reads an
 	 * indeterminate value.
 	 */
 	uint32_t srtt = 0;
 	int32_t idx;
 	int32_t is_tlp_timer = 0;
 	struct bbr_sendmap *rsm;

 	if (bbr->rc_all_timers_stopped) {
 		/* All timers have been stopped none are to run */
 		return (0);
 	}
 	if (bbr->rc_in_persist) {
 		/* We can't start any timer in persists */
 		return (bbr_get_persists_timer_val(tp, bbr));
 	}
 	rsm = TAILQ_FIRST(&bbr->r_ctl.rc_tmap);
 	if ((rsm == NULL) ||
 	    ((tp->t_flags & TF_SACK_PERMIT) == 0) ||
 	    (tp->t_state < TCPS_ESTABLISHED)) {
 		/* Nothing on the send map */
 activate_rxt:
 		if (SEQ_LT(tp->snd_una, tp->snd_max) ||
 		    sbavail(&tptosocket(tp)->so_snd)) {
 			uint64_t tov;

 			time_since_sent = 0;
 			rsm = TAILQ_FIRST(&bbr->r_ctl.rc_tmap);
 			if (rsm) {
 				/*
 				 * Measure from the later of the last send of
 				 * this entry and the last TLP/RXT time.
 				 */
 				idx = rsm->r_rtr_cnt - 1;
 				if (TSTMP_GEQ(rsm->r_tim_lastsent[idx], bbr->r_ctl.rc_tlp_rxt_last_time))
 					tstmp_touse = rsm->r_tim_lastsent[idx];
 				else
 					tstmp_touse = bbr->r_ctl.rc_tlp_rxt_last_time;
 				/*
 				 * Time has only elapsed when cts is later
 				 * than the reference stamp; otherwise leave
 				 * the elapsed time at 0 rather than letting
 				 * the subtraction wrap.
 				 */
 				if (TSTMP_GT(cts, tstmp_touse))
 					time_since_sent = cts - tstmp_touse;
 			}
 			bbr->r_ctl.rc_hpts_flags |= PACE_TMR_RXT;
 			if (tp->t_srtt == 0)
 				tov = BBR_INITIAL_RTO;
 			else
 				tov = ((uint64_t)(TICKS_2_USEC(tp->t_srtt) +
 				    ((uint64_t)TICKS_2_USEC(tp->t_rttvar) * (uint64_t)4)) >> TCP_RTT_SHIFT);
 			if (tp->t_rxtshift)
 				tov *= tcp_backoff[tp->t_rxtshift];
 			/* Credit the time already waited, but never go below rc_min_to. */
 			if (tov > time_since_sent)
 				tov -= time_since_sent;
 			else
 				tov = bbr->r_ctl.rc_min_to;
 			TCPT_RANGESET_NOSLOP(to, tov,
 			    (bbr->r_ctl.rc_min_rto_ms * MS_IN_USEC),
 			    (bbr->rc_max_rto_sec * USECS_IN_SECOND));
 			bbr_log_timer_var(bbr, 2, cts, 0, srtt, 0, to);
 			return (to);
 		}
 		return (0);
 	}
 	if (rsm->r_flags & BBR_ACKED) {
 		rsm = bbr_find_lowest_rsm(bbr);
 		if (rsm == NULL) {
 			/* No lowest? */
 			goto activate_rxt;
 		}
 	}
 	/* A SACK-passed entry gets a RACK timer, anything else a TLP. */
 	if (rsm->r_flags & BBR_SACK_PASSED) {
 		if ((tp->t_flags & TF_SENTFIN) &&
 		    ((tp->snd_max - tp->snd_una) == 1) &&
 		    (rsm->r_flags & BBR_HAS_FIN)) {
 			/*
 			 * We don't start a bbr rack timer if all we have is
 			 * a FIN outstanding.
 			 */
 			goto activate_rxt;
 		}
 		srtt = bbr_get_rtt(bbr, BBR_RTT_RACK);
 		thresh = bbr_calc_thresh_rack(bbr, srtt, cts, rsm);
 		idx = rsm->r_rtr_cnt - 1;
 		exp = rsm->r_tim_lastsent[idx] + thresh;
 		if (SEQ_GEQ(exp, cts)) {
 			to = exp - cts;
 			if (to < bbr->r_ctl.rc_min_to) {
 				to = bbr->r_ctl.rc_min_to;
 			}
 		} else {
 			/* Already expired, fire after the minimum timeout. */
 			to = bbr->r_ctl.rc_min_to;
 		}
 	} else {
 		/* Ok we need to do a TLP not RACK */
 		if (bbr->rc_tlp_in_progress != 0) {
 			/*
 			 * The previous send was a TLP.
 			 */
 			goto activate_rxt;
 		}
 		rsm = TAILQ_LAST_FAST(&bbr->r_ctl.rc_tmap, bbr_sendmap, r_tnext);
 		if (rsm == NULL) {
 			/* We found no rsm to TLP with. */
 			goto activate_rxt;
 		}
 		if (rsm->r_flags & BBR_HAS_FIN) {
 			/* If its a FIN we don't do TLP */
 			rsm = NULL;
 			goto activate_rxt;
 		}
 		time_since_sent = 0;
 		idx = rsm->r_rtr_cnt - 1;
 		if (TSTMP_GEQ(rsm->r_tim_lastsent[idx], bbr->r_ctl.rc_tlp_rxt_last_time))
 			tstmp_touse = rsm->r_tim_lastsent[idx];
 		else
 			tstmp_touse = bbr->r_ctl.rc_tlp_rxt_last_time;
 		/* As above: only count elapsed time when cts is the later stamp. */
 		if (TSTMP_GT(cts, tstmp_touse))
 			time_since_sent = cts - tstmp_touse;
 		is_tlp_timer = 1;
 		srtt = bbr_get_rtt(bbr, bbr_tlp_type_to_use);
 		thresh = bbr_calc_thresh_tlp(tp, bbr, rsm, srtt, cts);
 		if (thresh > time_since_sent)
 			to = thresh - time_since_sent;
 		else
 			to = bbr->r_ctl.rc_min_to;
 		if (to > (((uint32_t)bbr->rc_max_rto_sec) * USECS_IN_SECOND)) {
 			/*
 			 * If the TLP time works out to larger than the max
 			 * RTO lets not do TLP.. just RTO.
 			 */
 			goto activate_rxt;
 		}
 		if ((bbr->rc_tlp_rtx_out == 1) &&
 		    (rsm->r_start == bbr->r_ctl.rc_last_tlp_seq)) {
 			/*
 			 * Second retransmit of the same TLP
 			 * lets not.
 			 */
 			bbr->rc_tlp_rtx_out = 0;
 			goto activate_rxt;
 		}
 		if (rsm->r_start != bbr->r_ctl.rc_last_tlp_seq) {
 			/*
 			 * The tail is no longer the last one I did a probe
 			 * on
 			 */
 			bbr->r_ctl.rc_tlp_seg_send_cnt = 0;
 			bbr->r_ctl.rc_last_tlp_seq = rsm->r_start;
 		}
 	}
 	if (is_tlp_timer == 0) {
 		BBR_STAT_INC(bbr_to_arm_rack);
 		bbr->r_ctl.rc_hpts_flags |= PACE_TMR_RACK;
 	} else {
 		bbr_log_timer_var(bbr, 1, cts, time_since_sent, srtt, thresh, to);
 		if (bbr->r_ctl.rc_tlp_seg_send_cnt > bbr_tlp_max_resend) {
 			/*
 			 * We have exceeded how many times we can retran the
 			 * current TLP timer, switch to the RTO timer.
 			 */
 			goto activate_rxt;
 		} else {
 			BBR_STAT_INC(bbr_to_arm_tlp);
 			bbr->r_ctl.rc_hpts_flags |= PACE_TMR_TLP;
 		}
 	}
 	return (to);
 }
 
 /*
  * Minimum pacing segment size: rc_pace_min_segs with the size recorded
  * in rc_last_options taken off.
  */
 static inline int32_t
 bbr_minseg(struct tcp_bbr *bbr)
 {
 	int32_t min_seg;

 	min_seg = bbr->r_ctl.rc_pace_min_segs - bbr->rc_last_options;
 	return (min_seg);
 }
 
 /*
  * Work out the pacing delay and/or timer timeout for this connection
  * and insert it into the hpts via tcp_hpts_insert_diag().
  *
  * bbr     - BBR state of the connection.
  * tp      - the TCP control block.
  * cts     - the current timestamp.
  * frm     - caller identifier; stored in bbr->bbr_timer_src and logged.
  * slot    - pacing delay requested by the caller (converted with
  *           HPTS_USEC_TO_SLOTS() before insertion). When 0 and a
  *           previous pacing delay is recorded, the previous delay is
  *           picked up again.
  * tot_len - only passed through to bbr_log_type_bbrsnd().
  *
  * Nothing is done if the connection is already in the hpts or is in
  * the CLOSED or LISTEN state. Otherwise rc_hpts_flags and rc_timer_exp
  * are rebuilt from scratch, and rc_tmr_stopped is cleared on the way out.
  */
 static void
 bbr_start_hpts_timer(struct tcp_bbr *bbr, struct tcpcb *tp, uint32_t cts, int32_t frm, int32_t slot, uint32_t tot_len)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 	struct hpts_diag diag;
 	uint32_t delayed_ack = 0;
 	uint32_t left = 0;
 	uint32_t hpts_timeout;
 	uint8_t stopped;
 	int32_t delay_calc = 0;
 	uint32_t prev_delay = 0;

 	if (tcp_in_hpts(tp)) {
 		/* A previous call is already set up */
 		return;
 	}
 	if ((tp->t_state == TCPS_CLOSED) ||
 	    (tp->t_state == TCPS_LISTEN)) {
 		return;
 	}
 	/*
 	 * If a timer was stopped before it expired, remember how much of
 	 * it was left; this must be read before rc_timer_exp is cleared.
 	 */
 	stopped = bbr->rc_tmr_stopped;
 	if (stopped && TSTMP_GT(bbr->r_ctl.rc_timer_exp, cts)) {
 		left = bbr->r_ctl.rc_timer_exp - cts;
 	}
 	bbr->r_ctl.rc_hpts_flags = 0;
 	bbr->r_ctl.rc_timer_exp = 0;
 	prev_delay = bbr->r_ctl.rc_last_delay_val;
 	if (bbr->r_ctl.rc_last_delay_val &&
 	    (slot == 0)) {
 		/*
 		 * If a previous pacer delay was in place we
 		 * are not coming from the output side (where
 		 * we calculate a delay, more likely a timer).
 		 */
 		slot = bbr->r_ctl.rc_last_delay_val;
 		if (TSTMP_GT(cts, bbr->rc_pacer_started)) {
 			/* Compensate for time passed  */
 			delay_calc = cts - bbr->rc_pacer_started;
 			/* If more time passed than the delay, slot is left as is. */
 			if (delay_calc <= slot)
 				slot -= delay_calc;
 		}
 	}
 	/* Do we have early to make up for by pushing out the pacing time? */
 	if (bbr->r_agg_early_set) {
 		bbr_log_pacing_delay_calc(bbr, 0, bbr->r_ctl.rc_agg_early, cts, slot, 0, bbr->r_agg_early_set, 2);
 		slot += bbr->r_ctl.rc_agg_early;
 		bbr->r_ctl.rc_agg_early = 0;
 		bbr->r_agg_early_set = 0;
 	}
 	/* Are we running a total debt that needs to be compensated for? */
 	if (bbr->r_ctl.rc_hptsi_agg_delay) {
 		if (slot > bbr->r_ctl.rc_hptsi_agg_delay) {
 			/* We nuke the delay */
 			slot -= bbr->r_ctl.rc_hptsi_agg_delay;
 			bbr->r_ctl.rc_hptsi_agg_delay = 0;
 		} else {
 			/* We nuke some of the delay, put in a minimal 100usecs  */
 			bbr->r_ctl.rc_hptsi_agg_delay -= slot;
 			bbr->r_ctl.rc_last_delay_val = slot = 100;
 		}
 	}
 	bbr->r_ctl.rc_last_delay_val = slot;
 	/* bbr_timer_start() also or's the chosen PACE_TMR_* bit into rc_hpts_flags. */
 	hpts_timeout = bbr_timer_start(tp, bbr, cts);
 	if (tp->t_flags & TF_DELACK) {
 		if (bbr->rc_in_persist == 0) {
 			delayed_ack = bbr_delack_time;
 		} else {
 			/*
 			 * We are in persists and have
 			 * gotten a new data element.
 			 */
 			if (hpts_timeout > bbr_delack_time) {
 				/*
 				 * Lets make the persists timer (which acks)
 				 * be the smaller of hpts_timeout and bbr_delack_time.
 				 */
 				hpts_timeout = bbr_delack_time;
 			}
 		}
 	}
 	if (delayed_ack &&
 	    ((hpts_timeout == 0) ||
 	     (delayed_ack < hpts_timeout))) {
 		/*
 		 * We need a Delayed ack timer. Note this assigns (rather
 		 * than or's) the flag, replacing whatever timer bit
 		 * bbr_timer_start() selected.
 		 */
 		bbr->r_ctl.rc_hpts_flags = PACE_TMR_DELACK;
 		hpts_timeout = delayed_ack;
 	}
 	if (slot) {
 		/* Mark that we have a pacing timer up */
 		BBR_STAT_INC(bbr_paced_segments);
 		bbr->r_ctl.rc_hpts_flags |= PACE_PKT_OUTPUT;
 	}
 	/*
 	 * If no timers are going to run and we will fall off the hptsi
 	 * wheel, we resort to a keep-alive timer if its configured.
 	 */
 	if ((hpts_timeout == 0) &&
 	    (slot == 0)) {
 		if ((V_tcp_always_keepalive || inp->inp_socket->so_options & SO_KEEPALIVE) &&
 		    (tp->t_state <= TCPS_CLOSING)) {
 			/*
 			 * Ok we have no timer (persists, rack, tlp, rxt  or
 			 * del-ack), we don't have segments being paced. So
 			 * all that is left is the keepalive timer.
 			 */
 			if (TCPS_HAVEESTABLISHED(tp->t_state)) {
 				hpts_timeout = TICKS_2_USEC(TP_KEEPIDLE(tp));
 			} else {
 				hpts_timeout = TICKS_2_USEC(TP_KEEPINIT(tp));
 			}
 			bbr->r_ctl.rc_hpts_flags |= PACE_TMR_KEEP;
 		}
 	}
 	if (left && (stopped & (PACE_TMR_KEEP | PACE_TMR_DELACK)) ==
 	    (bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK)) {
 		/*
 		 * RACK, TLP, persists and RXT timers all are restartable
 		 * based on actions input .. i.e we received a packet (ack
 		 * or sack) and that changes things (rw, or snd_una etc).
 		 * Thus we can restart them with a new value. For
 		 * keep-alive, delayed_ack we keep track of what was left
 		 * and restart the timer with a smaller value.
 		 */
 		if (left < hpts_timeout)
 			hpts_timeout = left;
 	}
 	if (bbr->r_ctl.rc_incr_tmrs && slot &&
 	    (bbr->r_ctl.rc_hpts_flags & (PACE_TMR_TLP|PACE_TMR_RXT))) {
 		/*
 		 * If configured to do so, and the timer is either
 		 * the TLP or RXT timer, we need to increase the timeout
 		 * by the pacing time. Consider the bottleneck at my
 		 * machine as an example, we are sending something
 		 * to start a TLP on. The last packet won't be emitted
 		 * fully until the pacing time (the bottleneck will hold
 		 * the data in place). Once the packet is emitted that
 		 * is when we want to start waiting for the TLP. This
 		 * is most evident with hardware pacing (where the nic
 		 * is holding the packet(s) before emitting). But it
 		 * can also show up in the network so we do it for all
 		 * cases. Technically we would take off one packet from
 		 * this extra delay but this is easier and being more
 		 * conservative is probably better.
 		 */
 		hpts_timeout += slot;
 	}
 	if (hpts_timeout) {
 		/*
 		 * Hack alert for now we can't time-out over 2147 seconds (a
 		 * bit more than 35min)
 		 */
 		if (hpts_timeout > 0x7ffffffe)
 			hpts_timeout = 0x7ffffffe;
 		bbr->r_ctl.rc_timer_exp = cts + hpts_timeout;
 	} else
 		bbr->r_ctl.rc_timer_exp = 0;
 	/*
 	 * Two ways onto the hpts: schedule by the pacing slot (the timer
 	 * is then checked when the pacer fires), or, failing that,
 	 * schedule by the timer timeout alone.
 	 */
 	if ((slot) &&
 	    (bbr->rc_use_google ||
 	     bbr->output_error_seen ||
 	     (slot <= hpts_timeout))  ) {
 		/*
 		 * Tell LRO that it can queue packets while
 		 * we pace.
 		 */
 		bbr->rc_tp->t_flags2 |= TF2_MBUF_QUEUE_READY;
 		if ((bbr->r_ctl.rc_hpts_flags & PACE_TMR_RACK) &&
 		    (bbr->rc_cwnd_limited == 0)) {
 			/*
 			 * If we are not cwnd limited and we
 			 * are running a rack timer we put on
 			 * the do not disturb even for sack.
 			 */
 			tp->t_flags2 |= TF2_DONT_SACK_QUEUE;
 		} else
 			tp->t_flags2 &= ~TF2_DONT_SACK_QUEUE;
 		bbr->rc_pacer_started = cts;

 		(void)tcp_hpts_insert_diag(tp, HPTS_USEC_TO_SLOTS(slot),
 					   __LINE__, &diag);
 		/* The pacing slot, not the timer, is what was scheduled. */
 		bbr->rc_timer_first = 0;
 		bbr->bbr_timer_src = frm;
 		bbr_log_to_start(bbr, cts, hpts_timeout, slot, 1);
 		bbr_log_hpts_diag(bbr, cts, &diag);
 	} else if (hpts_timeout) {
 		(void)tcp_hpts_insert_diag(tp, HPTS_USEC_TO_SLOTS(hpts_timeout),
 					   __LINE__, &diag);
 		/*
 		 * We add the flag here as well if the slot is set,
 		 * since hpts will call in to clear the queue first before
 		 * calling the output routine (which does our timers).
 		 * We don't want to set the flag if its just a timer
 		 * else the arrival of data might (that causes us
 		 * to send more) might get delayed. Imagine being
 		 * on a keep-alive timer and a request comes in for
 		 * more data.
 		 */
 		if (slot)
 			bbr->rc_pacer_started = cts;
 		if ((bbr->r_ctl.rc_hpts_flags & PACE_TMR_RACK) &&
 		    (bbr->rc_cwnd_limited == 0)) {
 			/*
 			 * For a rack timer, don't wake us even
 			 * if a sack arrives as long as we are
 			 * not cwnd limited.
 			 */
 			tp->t_flags2 |= (TF2_MBUF_QUEUE_READY |
 			    TF2_DONT_SACK_QUEUE);
 		} else {
 			/* All other timers wake us up */
 			tp->t_flags2 &= ~(TF2_MBUF_QUEUE_READY |
 			    TF2_DONT_SACK_QUEUE);
 		}
 		bbr->bbr_timer_src = frm;
 		bbr_log_to_start(bbr, cts, hpts_timeout, slot, 0);
 		bbr_log_hpts_diag(bbr, cts, &diag);
 		/* The timer timeout was scheduled ahead of any pacing slot. */
 		bbr->rc_timer_first = 1;
 	}
 	bbr->rc_tmr_stopped = 0;
 	bbr_log_type_bbrsnd(bbr, tot_len, slot, delay_calc, cts, frm, prev_delay);
 }
 
 /*
  * Audit the pacer timer that is currently pending for this connection and
  * decide whether it is still the appropriate one.
  *
  * The pending timer type is taken from rc_hpts_flags masked with
  * PACE_TMR_MASK.  A series of checks returns early whenever the pending
  * timer is acceptable for the present state; anything that falls through
  * (or jumps to wrong_timer) has the timer replaced.
  *
  * tp   - TCP control block of the connection.
  * bbr  - BBR state for the connection.
  * cts  - current timestamp; used as the base for the new expiry time.
  * sb   - not referenced by this function.
  */
 static void
 bbr_timer_audit(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts, struct sockbuf *sb)
 {
 	/*
 	 * We received an ack, and then did not call send or were bounced
 	 * out due to the hpts was running. Now a timer is up as well, is it
 	 * the right timer?
 	 */
 	struct inpcb *inp;
 	struct bbr_sendmap *rsm;
 	uint32_t hpts_timeout;
 	int tmr_up;
 
 	/* Isolate the timer-type bits of the pending hpts flags. */
 	tmr_up = bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK;
 	/* In persist with the persist timer pending: nothing to fix. */
 	if (bbr->rc_in_persist && (tmr_up == PACE_TMR_PERSIT))
 		return;
 	/* First entry of the rc_tmap list, or NULL when the list is empty. */
 	rsm = TAILQ_FIRST(&bbr->r_ctl.rc_tmap);
 	if (((rsm == NULL) || (tp->t_state < TCPS_ESTABLISHED)) &&
 	    (tmr_up == PACE_TMR_RXT)) {
 		/* Should be an RXT */
 		return;
 	}
 	inp = bbr->rc_inp;
 	if (rsm == NULL) {
 		/* Nothing outstanding? */
 		if (tp->t_flags & TF_DELACK) {
 			if (tmr_up == PACE_TMR_DELACK)
 				/*
 				 * We are supposed to have delayed ack up
 				 * and we do
 				 */
 				return;
 		} else if (sbavail(&inp->inp_socket->so_snd) &&
 		    (tmr_up == PACE_TMR_RXT)) {
 			/*
 			 * if we hit enobufs then we would expect the
 			 * possibility of nothing outstanding and the RXT up
 			 * (and the hptsi timer).
 			 */
 			return;
 		} else if (((V_tcp_always_keepalive ||
 			    inp->inp_socket->so_options & SO_KEEPALIVE) &&
 			    (tp->t_state <= TCPS_CLOSING)) &&
 			    (tmr_up == PACE_TMR_KEEP) &&
 		    (tp->snd_max == tp->snd_una)) {
 			/* We should have keep alive up and we do */
 			return;
 		}
 	}
 	if (rsm && (rsm->r_flags & BBR_SACK_PASSED)) {
 		/*
 		 * The first mapped entry is flagged sack-passed: only a RACK
 		 * timer is accepted, except for the lone-FIN case below
 		 * which requires an RXT timer instead.
 		 */
 		if ((tp->t_flags & TF_SENTFIN) &&
 		    ((tp->snd_max - tp->snd_una) == 1) &&
 		    (rsm->r_flags & BBR_HAS_FIN)) {
 			/* needs to be a RXT */
 			if (tmr_up == PACE_TMR_RXT)
 				return;
 			else
 				goto wrong_timer;
 		} else if (tmr_up == PACE_TMR_RACK)
 			return;
 		else
 			goto wrong_timer;
 	} else if (rsm && (tmr_up == PACE_TMR_RACK)) {
 		/* Rack timer has priority if we have data out */
 		return;
 	} else if (SEQ_GT(tp->snd_max, tp->snd_una) &&
 		    ((tmr_up == PACE_TMR_TLP) ||
 	    (tmr_up == PACE_TMR_RXT))) {
 		/*
 		 * Either a TLP or RXT is fine if no sack-passed is in place
 		 * and data is outstanding.
 		 */
 		return;
 	} else if (tmr_up == PACE_TMR_DELACK) {
 		/*
 		 * If the delayed ack was going to go off before the
 		 * rtx/tlp/rack timer were going to expire, then that would
 		 * be the timer in control. Note we don't check the time
 		 * here trusting the code is correct.
 		 */
 		return;
 	}
 	if (SEQ_GT(tp->snd_max, tp->snd_una) &&
 	    ((tmr_up == PACE_TMR_RXT) ||
 	     (tmr_up == PACE_TMR_TLP) ||
 	     (tmr_up == PACE_TMR_RACK))) {
 		/*
 		 * We have outstanding data and
 		 * we *do* have a RACK, TLP or RXT
 		 * timer running. We won't restart
 		 * anything here since thats probably ok we
 		 * will get called with some timer here shortly.
 		 */
 		return;
 	}
 	/*
 	 * Ok the timer originally started is not what we want now. We will
 	 * force the hpts to be stopped if any, and restart with the slot
 	 * set to what was in the saved slot.
 	 */
 wrong_timer:
 	if ((bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT) == 0) {
 		/*
 		 * No paced output is pending: pull the connection off the
 		 * hpts if it is queued there, cancel the current timer and
 		 * start a new one using the saved rc_last_delay_val.
 		 */
 		if (tcp_in_hpts(tp))
 			tcp_hpts_remove(tp);
 		bbr_timer_cancel(bbr, __LINE__, cts);
 		bbr_start_hpts_timer(bbr, tp, cts, 1, bbr->r_ctl.rc_last_delay_val,
 		    0);
 	} else {
 		/*
 		 * Output is hptsi so we just need to switch the type of
 		 * timer. We don't bother with keep-alive, since when we
 		 * jump through the output, it will start the keep-alive if
 		 * nothing is sent.
 		 *
 		 * We only need a delayed-ack added and or the hpts_timeout.
 		 */
 		hpts_timeout = bbr_timer_start(tp, bbr, cts);
 		if (tp->t_flags & TF_DELACK) {
 			/*
 			 * A delayed ack is pending: it takes over when no
 			 * other timeout was computed or when it would expire
 			 * sooner than the computed one.
 			 *
 			 * NOTE(review): the plain assignment below replaces
 			 * the whole flag word, including the PACE_PKT_OUTPUT
 			 * bit that was tested as set above -- confirm this
 			 * is intended.
 			 */
 			if (hpts_timeout == 0) {
 				hpts_timeout = bbr_delack_time;
 				bbr->r_ctl.rc_hpts_flags = PACE_TMR_DELACK;
 			}
 			else if (hpts_timeout > bbr_delack_time) {
 				hpts_timeout = bbr_delack_time;
 				bbr->r_ctl.rc_hpts_flags = PACE_TMR_DELACK;
 			}
 		}
 		if (hpts_timeout) {
 			/*
 			 * Clamp the timeout to 0x7ffffffe before recording
 			 * the expiry; rc_timer_exp is left untouched when no
 			 * timeout was computed.
 			 */
 			if (hpts_timeout > 0x7ffffffe)
 				hpts_timeout = 0x7ffffffe;
 			bbr->r_ctl.rc_timer_exp = cts + hpts_timeout;
 		}
 	}
 }
 
 /*
  * Value copied out to readers by sysctl_bbr_clear_lost(); the handler sets
  * it back to 0 after it has processed a write.
  */
 int32_t bbr_clear_lost = 0;
 
 /*
  * Return how much time separates cts (now) from earlier_time.
  *
  * Three cases are distinguished:
  *  - cts is at or after earlier_time: the plain difference is returned.
  *  - cts is behind earlier_time, but by no more than 10000 timestamp
  *    units (10ms per the original note): this is treated as clock skew /
  *    locking order between the two samples and 0 is returned.
  *  - cts is behind by more than that: the 32-bit counter is assumed to
  *    have wrapped (it wraps every 70 min or so) and the unsigned
  *    subtraction is returned, which yields a large value.
  */
 static inline uint32_t
 bbr_calc_time(uint32_t cts, uint32_t earlier_time) {
 	/* Unsigned subtraction; also the right answer across a wrap. */
 	uint32_t elapsed = cts - earlier_time;
 
 	/*
 	 * Only the "slightly behind" window is special: the other
 	 * timestamp was sampled just after cts, so report no elapsed time.
 	 */
 	if (!TSTMP_GEQ(cts, earlier_time) &&
 	    TSTMP_GEQ((cts + 10000), earlier_time))
 		return (0);
 	return (elapsed);
 }
 
 static int
 sysctl_bbr_clear_lost(SYSCTL_HANDLER_ARGS)
 {
 	uint32_t stat;
 	int32_t error;
 
 	error = SYSCTL_OUT(req, &bbr_clear_lost, sizeof(uint32_t));
 	if (error || req->newptr == NULL)
 		return error;
 
 	error = SYSCTL_IN(req, &stat, sizeof(uint32_t));
 	if (error)
 		return (error);
 	if (stat == 1) {
 #ifdef BBR_INVARIANTS
 		printf("Clearing BBR lost counters\n");
 #endif
 		COUNTER_ARRAY_ZERO(bbr_state_lost, BBR_MAX_STAT);
 		COUNTER_ARRAY_ZERO(bbr_state_time, BBR_MAX_STAT);
 		COUNTER_ARRAY_ZERO(bbr_state_resend, BBR_MAX_STAT);
 	} else if (stat == 2) {
 #ifdef BBR_INVARIANTS
 		printf("Clearing BBR option counters\n");
 #endif
 		COUNTER_ARRAY_ZERO(bbr_opts_arry, BBR_OPTS_SIZE);
 	} else if (stat == 3) {
 #ifdef BBR_INVARIANTS
 		printf("Clearing BBR stats counters\n");
 #endif
 		COUNTER_ARRAY_ZERO(bbr_stat_arry, BBR_STAT_SIZE);
 	} else if (stat == 4) {
 #ifdef BBR_INVARIANTS
 		printf("Clearing BBR out-size counters\n");
 #endif
 		COUNTER_ARRAY_ZERO(bbr_out_size, TCP_MSS_ACCT_SIZE);
 	}
 	bbr_clear_lost = 0;
 	return (0);
 }
 
 static void
 bbr_init_sysctls(void)
 {
 	struct sysctl_oid *bbr_probertt;
 	struct sysctl_oid *bbr_hptsi;
 	struct sysctl_oid *bbr_measure;
 	struct sysctl_oid *bbr_cwnd;
 	struct sysctl_oid *bbr_timeout;
 	struct sysctl_oid *bbr_states;
 	struct sysctl_oid *bbr_startup;
 	struct sysctl_oid *bbr_policer;
 
 	/* Probe rtt controls */
 	bbr_probertt = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "probertt",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "gain", CTLFLAG_RW,
 	    &bbr_rttprobe_gain, 192,
 	    "What is the filter gain drop in probe_rtt (0=disable)?");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "cwnd", CTLFLAG_RW,
 	    &bbr_rtt_probe_cwndtarg, 4,
 	    "How many mss's are outstanding during probe-rtt");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "int", CTLFLAG_RW,
 	    &bbr_rtt_probe_limit, 4000000,
 	    "If RTT has not shrank in this many micro-seconds enter probe-rtt");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "mintime", CTLFLAG_RW,
 	    &bbr_rtt_probe_time, 200000,
 	    "How many microseconds in probe-rtt");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "filter_len_sec", CTLFLAG_RW,
 	    &bbr_filter_len_sec, 6,
 	    "How long in seconds does the rttProp filter run?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "drain_rtt", CTLFLAG_RW,
 	    &bbr_drain_rtt, BBR_SRTT,
 	    "What is the drain rtt to use in probeRTT (rtt_prop=0, rtt_rack=1, rtt_pkt=2, rtt_srtt=3?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "can_force", CTLFLAG_RW,
 	    &bbr_can_force_probertt, 0,
 	    "If we keep setting new low rtt's but delay going in probe-rtt can we force in??");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "enter_sets_force", CTLFLAG_RW,
 	    &bbr_probertt_sets_rtt, 0,
 	    "In NF mode, do we imitate google_mode and set the rttProp on entry to probe-rtt?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "can_adjust", CTLFLAG_RW,
 	    &bbr_can_adjust_probertt, 1,
 	    "Can we dynamically adjust the probe-rtt limits and times?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "is_ratio", CTLFLAG_RW,
 	    &bbr_is_ratio, 0,
 	    "is the limit to filter a ratio?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "use_cwnd", CTLFLAG_RW,
 	    &bbr_prtt_slam_cwnd, 0,
 	    "Should we set/recover cwnd?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_probertt),
 	    OID_AUTO, "can_use_ts", CTLFLAG_RW,
 	    &bbr_can_use_ts_for_rtt, 1,
 	    "Can we use the ms timestamp if available for retransmistted rtt calculations?");
 
 	/* Pacing controls */
 	bbr_hptsi = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "pacing",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "hw_pacing", CTLFLAG_RW,
 	    &bbr_allow_hdwr_pacing, 1,
 	    "Do we allow hardware pacing?");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "hw_pacing_limit", CTLFLAG_RW,
 	    &bbr_hardware_pacing_limit, 4000,
 	    "Do we have a limited number of connections for pacing chelsio (0=no limit)?");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "hw_pacing_adj", CTLFLAG_RW,
 	    &bbr_hdwr_pace_adjust, 2,
 	    "Multiplier to calculated tso size?");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "hw_pacing_floor", CTLFLAG_RW,
 	    &bbr_hdwr_pace_floor, 1,
 	    "Do we invoke the hardware pacing floor?");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "hw_pacing_delay_cnt", CTLFLAG_RW,
 	    &bbr_hdwr_pacing_delay_cnt, 10,
 	    "How many packets must be sent after hdwr pacing is enabled");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "bw_cross", CTLFLAG_RW,
 	    &bbr_cross_over, 3000000,
 	    "What is the point where we cross over to linux like TSO size set");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "seg_deltarg", CTLFLAG_RW,
 	    &bbr_hptsi_segments_delay_tar, 7000,
 	    "What is the worse case delay target for hptsi < 48Mbp connections");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "enet_oh", CTLFLAG_RW,
 	    &bbr_include_enet_oh, 0,
 	    "Do we include the ethernet overhead in calculating pacing delay?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "ip_oh", CTLFLAG_RW,
 	    &bbr_include_ip_oh, 1,
 	    "Do we include the IP overhead in calculating pacing delay?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "tcp_oh", CTLFLAG_RW,
 	    &bbr_include_tcp_oh, 0,
 	    "Do we include the TCP overhead in calculating pacing delay?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "google_discount", CTLFLAG_RW,
 	    &bbr_google_discount, 10,
 	    "What is the default google discount percentage wise for pacing (11 = 1.1%%)?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "all_get_min", CTLFLAG_RW,
 	    &bbr_all_get_min, 0,
 	    "If you are less than a MSS do you just get the min?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "tso_min", CTLFLAG_RW,
 	    &bbr_hptsi_bytes_min, 1460,
 	    "For 0 -> 24Mbps what is floor number of segments for TSO");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "seg_tso_max", CTLFLAG_RW,
 	    &bbr_hptsi_segments_max, 6,
 	    "For 0 -> 24Mbps what is top number of segments for TSO");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "seg_floor", CTLFLAG_RW,
 	    &bbr_hptsi_segments_floor, 1,
 	    "Minimum TSO size we will fall too in segments");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "utter_max", CTLFLAG_RW,
 	    &bbr_hptsi_utter_max, 0,
 	    "The absolute maximum that any pacing (outside of hardware) can be");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "seg_divisor", CTLFLAG_RW,
 	    &bbr_hptsi_per_second, 100,
 	    "What is the divisor in our hptsi TSO calculation 512Mbps < X > 24Mbps ");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "srtt_mul", CTLFLAG_RW,
 	    &bbr_hptsi_max_mul, 1,
 	    "The multiplier for pace len max");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_hptsi),
 	    OID_AUTO, "srtt_div", CTLFLAG_RW,
 	    &bbr_hptsi_max_div, 2,
 	    "The divisor for pace len max");
 	/* Measurement controls */
 	bbr_measure = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "measure",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "Measurement controls");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "min_i_bw", CTLFLAG_RW,
 	    &bbr_initial_bw_bps, 62500,
 	    "Minimum initial b/w in bytes per second");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "no_sack_needed", CTLFLAG_RW,
 	    &bbr_sack_not_required, 0,
 	    "Do we allow bbr to run on connections not supporting SACK?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "use_google", CTLFLAG_RW,
 	    &bbr_use_google_algo, 0,
 	    "Use has close to google V1.0 has possible?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "ts_limiting", CTLFLAG_RW,
 	    &bbr_ts_limiting, 1,
 	    "Do we attempt to use the peers timestamp to limit b/w caculations?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "ts_can_raise", CTLFLAG_RW,
 	    &bbr_ts_can_raise, 0,
 	    "Can we raise the b/w via timestamp b/w calculation?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "ts_delta", CTLFLAG_RW,
 	    &bbr_min_usec_delta, 20000,
 	    "How long in usec between ts of our sends in ts validation code?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "ts_peer_delta", CTLFLAG_RW,
 	    &bbr_min_peer_delta, 20,
 	    "What min numerical value should be between the peer deltas?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "ts_delta_percent", CTLFLAG_RW,
 	    &bbr_delta_percent, 150,
 	    "What percentage (150 = 15.0) do we allow variance for?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "min_measure_good_bw", CTLFLAG_RW,
 	    &bbr_min_measurements_req, 1,
 	    "What is the minimum measurement count we need before we switch to our b/w estimate");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "min_measure_before_pace", CTLFLAG_RW,
 	    &bbr_no_pacing_until, 4,
 	    "How many pkt-epoch's (0 is off) do we need before pacing is on?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "quanta", CTLFLAG_RW,
 	    &bbr_quanta, 2,
 	    "Extra quanta to add when calculating the target (ID section 4.2.3.2).");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_measure),
 	    OID_AUTO, "noretran", CTLFLAG_RW,
 	    &bbr_no_retran, 0,
 	    "Should google mode not use retransmission measurements for the b/w estimation?");
 	/* State controls */
 	bbr_states = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "states",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "State controls");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "idle_restart", CTLFLAG_RW,
 	    &bbr_uses_idle_restart, 0,
 	    "Do we use a new special idle_restart state to ramp back up quickly?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "idle_restart_threshold", CTLFLAG_RW,
 	    &bbr_idle_restart_threshold, 100000,
 	    "How long must we be idle before we restart??");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "use_pkt_epoch", CTLFLAG_RW,
 	    &bbr_state_is_pkt_epoch, 0,
 	    "Do we use a pkt-epoch for substate if 0 rttProp?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "startup_rtt_gain", CTLFLAG_RW,
 	    &bbr_rtt_gain_thresh, 0,
 	    "What increase in RTT triggers us to stop ignoring no-loss and possibly exit startup?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "drain_floor", CTLFLAG_RW,
 	    &bbr_drain_floor, 88,
 	    "What is the lowest we can drain (pg) too?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "drain_2_target", CTLFLAG_RW,
 	    &bbr_state_drain_2_tar, 1,
 	    "Do we drain to target in drain substate?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "gain_2_target", CTLFLAG_RW,
 	    &bbr_gain_to_target, 1,
 	    "Does probe bw gain to target??");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "gain_extra_time", CTLFLAG_RW,
 	    &bbr_gain_gets_extra_too, 1,
 	    "Does probe bw gain get the extra time too?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "ld_div", CTLFLAG_RW,
 	    &bbr_drain_drop_div, 5,
 	    "Long drain drop divider?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "ld_mul", CTLFLAG_RW,
 	    &bbr_drain_drop_mul, 4,
 	    "Long drain drop multiplier?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "rand_ot_disc", CTLFLAG_RW,
 	    &bbr_rand_ot, 50,
 	    "Random discount of the ot?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "dr_filter_life", CTLFLAG_RW,
 	    &bbr_num_pktepo_for_del_limit, BBR_NUM_RTTS_FOR_DEL_LIMIT,
 	    "How many packet-epochs does the b/w delivery rate last?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "subdrain_applimited", CTLFLAG_RW,
 	    &bbr_sub_drain_app_limit, 0,
 	    "Does our sub-state drain invoke app limited if its long?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "use_cwnd_subdrain", CTLFLAG_RW,
 	    &bbr_sub_drain_slam_cwnd, 0,
 	    "Should we set/recover cwnd for sub-state drain?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "use_cwnd_maindrain", CTLFLAG_RW,
 	    &bbr_slam_cwnd_in_main_drain, 0,
 	    "Should we set/recover cwnd for main-state drain?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "google_gets_earlyout", CTLFLAG_RW,
 	    &google_allow_early_out, 1,
 	    "Should we allow google probe-bw/drain to exit early at flight target?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_states),
 	    OID_AUTO, "google_exit_loss", CTLFLAG_RW,
 	    &google_consider_lost, 1,
 	    "Should we have losses exit gain of probebw in google mode??");
 	/* Startup controls */
 	bbr_startup = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "startup",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "Startup controls");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_startup),
 	    OID_AUTO, "cheat_iwnd", CTLFLAG_RW,
 	    &bbr_sends_full_iwnd, 1,
 	    "Do we not pace but burst out initial windows has our TSO size?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_startup),
 	    OID_AUTO, "loss_threshold", CTLFLAG_RW,
 	    &bbr_startup_loss_thresh, 2000,
 	    "In startup what is the loss threshold in a pe that will exit us from startup?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_startup),
 	    OID_AUTO, "use_lowerpg", CTLFLAG_RW,
 	    &bbr_use_lower_gain_in_startup, 1,
 	    "Should we use a lower hptsi gain if we see loss in startup?");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_startup),
 	    OID_AUTO, "gain", CTLFLAG_RW,
 	    &bbr_start_exit, 25,
 	    "What gain percent do we need to see to stay in startup??");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_startup),
 	    OID_AUTO, "low_gain", CTLFLAG_RW,
 	    &bbr_low_start_exit, 15,
 	    "What gain percent do we need to see to stay in the lower gain startup??");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_startup),
 	    OID_AUTO, "loss_exit", CTLFLAG_RW,
 	    &bbr_exit_startup_at_loss, 1,
 	    "Should we exit startup at loss in an epoch if we are not gaining?");
 	/* CWND controls */
 	bbr_cwnd = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "cwnd",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "Cwnd controls");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "tar_rtt", CTLFLAG_RW,
 	    &bbr_cwndtarget_rtt_touse, 0,
 	    "Target cwnd rtt measurement to use (0=rtt_prop, 1=rtt_rack, 2=pkt_rtt, 3=srtt)?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "may_shrink", CTLFLAG_RW,
 	    &bbr_cwnd_may_shrink, 0,
 	    "Can the cwnd shrink if it would grow to more than the target?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "max_target_limit", CTLFLAG_RW,
 	    &bbr_target_cwnd_mult_limit, 8,
 	    "Do we limit the cwnd to some multiple of the cwnd target if cwnd can't shrink 0=no?");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "highspeed_min", CTLFLAG_RW,
 	    &bbr_cwnd_min_val_hs, BBR_HIGHSPEED_NUM_MSS,
 	    "What is the high-speed min cwnd (rttProp under 1ms)");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "lowspeed_min", CTLFLAG_RW,
 	    &bbr_cwnd_min_val, BBR_PROBERTT_NUM_MSS,
 	    "What is the min cwnd (rttProp > 1ms)");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "initwin", CTLFLAG_RW,
 	    &bbr_def_init_win, 10,
 	    "What is the BBR initial window, if 0 use tcp version");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "do_loss_red", CTLFLAG_RW,
 	    &bbr_do_red, 600,
 	    "Do we reduce the b/w at exit from recovery based on ratio of prop/srtt (800=80.0, 0=off)?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "red_scale", CTLFLAG_RW,
 	    &bbr_red_scale, 20000,
 	    "What RTT do we scale with?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "red_growslow", CTLFLAG_RW,
 	    &bbr_red_growth_restrict, 1,
 	    "Do we restrict cwnd growth for whats in flight?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "red_div", CTLFLAG_RW,
 	    &bbr_red_div, 2,
 	    "If we reduce whats the divisor?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "red_mul", CTLFLAG_RW,
 	    &bbr_red_mul, 1,
 	    "If we reduce whats the mulitiplier?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "target_is_unit", CTLFLAG_RW,
 	    &bbr_target_is_bbunit, 0,
 	    "Is the state target the pacing_gain or BBR_UNIT?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_cwnd),
 	    OID_AUTO, "drop_limit", CTLFLAG_RW,
 	    &bbr_drop_limit, 0,
 	    "Number of segments limit for drop (0=use min_cwnd w/flight)?");
 
 	/* Timeout controls */
 	bbr_timeout = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "timeout",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "Time out controls");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "delack", CTLFLAG_RW,
 	    &bbr_delack_time, 100000,
 	    "BBR's delayed ack time");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "tlp_uses", CTLFLAG_RW,
 	    &bbr_tlp_type_to_use, 3,
 	    "RTT that TLP uses in its calculations, 0=rttProp, 1=Rack_rtt, 2=pkt_rtt and 3=srtt");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "persmin", CTLFLAG_RW,
 	    &bbr_persist_min, 250000,
 	    "What is the minimum time in microseconds between persists");
 	SYSCTL_ADD_U32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "persmax", CTLFLAG_RW,
 	    &bbr_persist_max, 1000000,
 	    "What is the largest delay in microseconds between persists");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "tlp_minto", CTLFLAG_RW,
 	    &bbr_tlp_min, 10000,
 	    "TLP Min timeout in usecs");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "tlp_dack_time", CTLFLAG_RW,
 	    &bbr_delayed_ack_time, 200000,
 	    "TLP delayed ack compensation value");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "minrto", CTLFLAG_RW,
 	    &bbr_rto_min_ms, 30,
 	    "Minimum RTO in ms");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "maxrto", CTLFLAG_RW,
 	    &bbr_rto_max_sec, 4,
 	    "Maximum RTO in seconds -- should be at least as large as min_rto");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "tlp_retry", CTLFLAG_RW,
 	    &bbr_tlp_max_resend, 2,
 	    "How many times does TLP retry a single segment or multiple with no ACK");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "minto", CTLFLAG_RW,
 	    &bbr_min_to, 1000,
 	    "Minimum rack timeout in useconds");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "pktdelay", CTLFLAG_RW,
 	    &bbr_pkt_delay, 1000,
 	    "Extra RACK time (in useconds) besides reordering thresh");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "incr_tmrs", CTLFLAG_RW,
 	    &bbr_incr_timers, 1,
 	    "Increase the RXT/TLP timer by the pacing time used?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_timeout),
 	    OID_AUTO, "rxtmark_sackpassed", CTLFLAG_RW,
 	    &bbr_marks_rxt_sack_passed, 0,
 	    "Mark sack passed on all those not ack'd when a RXT hits?");
 	/* Policer controls */
 	bbr_policer = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO,
 	    "policer",
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "Policer controls");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "detect_enable", CTLFLAG_RW,
 	    &bbr_policer_detection_enabled, 1,
 	    "Is policer detection enabled??");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "min_pes", CTLFLAG_RW,
 	    &bbr_lt_intvl_min_rtts, 4,
 	    "Minimum number of PE's?");
 	SYSCTL_ADD_U64(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "bwdiff", CTLFLAG_RW,
 	    &bbr_lt_bw_diff, (4000/8),
 	    "Minimal bw diff?");
 	SYSCTL_ADD_U64(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "bwratio", CTLFLAG_RW,
 	    &bbr_lt_bw_ratio, 8,
 	    "Minimal bw diff?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "from_rack_rxt", CTLFLAG_RW,
 	    &bbr_policer_call_from_rack_to, 0,
 	    "Do we call the policer detection code from a rack-timeout?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "false_postive", CTLFLAG_RW,
 	    &bbr_lt_intvl_fp, 0,
 	    "What packet epoch do we do false-positive detection at (0=no)?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "loss_thresh", CTLFLAG_RW,
 	    &bbr_lt_loss_thresh, 196,
 	    "Loss threshold 196 = 19.6%?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_policer),
 	    OID_AUTO, "false_postive_thresh", CTLFLAG_RW,
 	    &bbr_lt_fd_thresh, 100,
 	    "What percentage is the false detection threshold (150=15.0)?");
 	/* All the rest */
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "cheat_rxt", CTLFLAG_RW,
 	    &bbr_use_rack_resend_cheat, 0,
 	    "Do we burst 1ms between sends on retransmissions (like rack)?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "error_paceout", CTLFLAG_RW,
 	    &bbr_error_base_paceout, 10000,
 	    "When we hit an error what is the min to pace out in usec's?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "kill_paceout", CTLFLAG_RW,
 	    &bbr_max_net_error_cnt, 10,
 	    "When we hit this many errors in a row, kill the session?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "data_after_close", CTLFLAG_RW,
 	    &bbr_ignore_data_after_close, 1,
 	    "Do we hold off sending a RST until all pending data is ack'd");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "resend_use_tso", CTLFLAG_RW,
 	    &bbr_resends_use_tso, 0,
 	    "Can resends use TSO?");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "sblklimit", CTLFLAG_RW,
 	    &bbr_sack_block_limit, 128,
 	    "When do we start ignoring small sack blocks");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "bb_verbose", CTLFLAG_RW,
 	    &bbr_verbose_logging, 0,
 	    "Should BBR black box logging be verbose");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "reorder_thresh", CTLFLAG_RW,
 	    &bbr_reorder_thresh, 2,
 	    "What factor for rack will be added when seeing reordering (shift right)");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "reorder_fade", CTLFLAG_RW,
 	    &bbr_reorder_fade, 0,
 	    "Does reorder detection fade, if so how many ms (0 means never)");
 	SYSCTL_ADD_S32(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "rtt_tlp_thresh", CTLFLAG_RW,
 	    &bbr_tlp_thresh, 1,
 	    "what divisor for TLP rtt/retran will be added (1=rtt, 2=1/2 rtt etc)");
 	/* Stats and counters */
 	/* The pacing counters for hdwr/software can't be in the array */
 	bbr_nohdwr_pacing_enobuf = counter_u64_alloc(M_WAITOK);
 	bbr_hdwr_pacing_enobuf = counter_u64_alloc(M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "enob_hdwr_pacing", CTLFLAG_RD,
 	    &bbr_hdwr_pacing_enobuf,
 	    "Total number of enobufs for hardware paced flows");
 	SYSCTL_ADD_COUNTER_U64(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "enob_no_hdwr_pacing", CTLFLAG_RD,
 	    &bbr_nohdwr_pacing_enobuf,
 	    "Total number of enobufs for non-hardware paced flows");
 
 	bbr_flows_whdwr_pacing = counter_u64_alloc(M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "hdwr_pacing", CTLFLAG_RD,
 	    &bbr_flows_whdwr_pacing,
 	    "Total number of hardware paced flows");
 	bbr_flows_nohdwr_pacing = counter_u64_alloc(M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "software_pacing", CTLFLAG_RD,
 	    &bbr_flows_nohdwr_pacing,
 	    "Total number of software paced flows");
 	COUNTER_ARRAY_ALLOC(bbr_stat_arry, BBR_STAT_SIZE, M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64_ARRAY(&bbr_sysctl_ctx, SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "stats", CTLFLAG_RD,
 	    bbr_stat_arry, BBR_STAT_SIZE, "BBR Stats");
 	COUNTER_ARRAY_ALLOC(bbr_opts_arry, BBR_OPTS_SIZE, M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64_ARRAY(&bbr_sysctl_ctx, SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "opts", CTLFLAG_RD,
 	    bbr_opts_arry, BBR_OPTS_SIZE, "BBR Option Stats");
 	COUNTER_ARRAY_ALLOC(bbr_state_lost, BBR_MAX_STAT, M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64_ARRAY(&bbr_sysctl_ctx, SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "lost", CTLFLAG_RD,
 	    bbr_state_lost, BBR_MAX_STAT, "Stats of when losses occur");
 	COUNTER_ARRAY_ALLOC(bbr_state_resend, BBR_MAX_STAT, M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64_ARRAY(&bbr_sysctl_ctx, SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "stateresend", CTLFLAG_RD,
 	    bbr_state_resend, BBR_MAX_STAT, "Stats of what states resend");
 	COUNTER_ARRAY_ALLOC(bbr_state_time, BBR_MAX_STAT, M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64_ARRAY(&bbr_sysctl_ctx, SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "statetime", CTLFLAG_RD,
 	    bbr_state_time, BBR_MAX_STAT, "Stats of time spent in the states");
 	COUNTER_ARRAY_ALLOC(bbr_out_size, TCP_MSS_ACCT_SIZE, M_WAITOK);
 	SYSCTL_ADD_COUNTER_U64_ARRAY(&bbr_sysctl_ctx, SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "outsize", CTLFLAG_RD,
 	    bbr_out_size, TCP_MSS_ACCT_SIZE, "Size of output calls");
 	SYSCTL_ADD_PROC(&bbr_sysctl_ctx,
 	    SYSCTL_CHILDREN(bbr_sysctl_root),
 	    OID_AUTO, "clrlost", CTLTYPE_UINT | CTLFLAG_RW | CTLFLAG_MPSAFE,
 	    &bbr_clear_lost, 0, sysctl_bbr_clear_lost, "IU", "Clear lost counters");
 }
 
 /*
  * Release the counters that back the BBR statistics sysctls: the six
  * counter arrays and the four stand-alone pacing counters.
  */
 static void
 bbr_counter_destroy(void)
 {
 	/* Per-state arrays, all BBR_MAX_STAT entries long. */
 	COUNTER_ARRAY_FREE(bbr_state_lost, BBR_MAX_STAT);
 	COUNTER_ARRAY_FREE(bbr_state_resend, BBR_MAX_STAT);
 	COUNTER_ARRAY_FREE(bbr_state_time, BBR_MAX_STAT);

 	/* General stats, option stats and output-size arrays. */
 	COUNTER_ARRAY_FREE(bbr_stat_arry, BBR_STAT_SIZE);
 	COUNTER_ARRAY_FREE(bbr_opts_arry, BBR_OPTS_SIZE);
 	COUNTER_ARRAY_FREE(bbr_out_size, TCP_MSS_ACCT_SIZE);

 	/* Stand-alone pacing counters that are not part of any array. */
 	counter_u64_free(bbr_hdwr_pacing_enobuf);
 	counter_u64_free(bbr_nohdwr_pacing_enobuf);
 	counter_u64_free(bbr_flows_whdwr_pacing);
 	counter_u64_free(bbr_flows_nohdwr_pacing);
 }
 
 /*
  * Zero a log record and fill in the fields that are common to the BBR
  * log events from the current connection state.
  *
  * bbr - BBR control block the values are read from.
  * l   - record to fill.  Note that sizeof(union tcp_log_stackspecific)
  *       bytes are cleared, not sizeof(*l), so l must point at storage
  *       that is at least as large as the whole union (the callers in
  *       this file pass &log.u_bbr of such a union).
  * cts - value stored as the record's timeStamp.
  *
  * Callers commonly overwrite some of these fields afterwards to carry
  * event-specific data.
  */
 static __inline void
 bbr_fill_in_logging_data(struct tcp_bbr *bbr, struct tcp_log_bbr *l, uint32_t cts)
 {
 	/* Clear the entire union so no stale stack contents end up in the log. */
 	memset(l, 0, sizeof(union tcp_log_stackspecific));
 	l->cur_del_rate = bbr->r_ctl.rc_bbr_cur_del_rate;
 	l->delRate = get_filter_value(&bbr->r_ctl.rc_delrate);
 	l->rttProp = get_filter_value_small(&bbr->r_ctl.rc_rttprop);
 	l->bw_inuse = bbr_get_bw(bbr);
 	/* Flight size, passing sacked plus lost bytes to ctf_flight_size(). */
 	l->inflight = ctf_flight_size(bbr->rc_tp,
 			  (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 	l->applimited = bbr->r_ctl.r_app_limited_until;
 	l->delivered = bbr->r_ctl.rc_delivered;
 	l->timeStamp = cts;
 	l->lost = bbr->r_ctl.rc_lost;
 	l->bbr_state = bbr->rc_bbr_state;
 	l->bbr_substate = bbr_state_val(bbr);
 	l->epoch = bbr->r_ctl.rc_rtt_epoch;
 	l->lt_epoch = bbr->r_ctl.rc_lt_epoch;
 	l->pacing_gain = bbr->r_ctl.rc_bbr_hptsi_gain;
 	l->cwnd_gain = bbr->r_ctl.rc_bbr_cwnd_gain;
 	l->inhpts = tcp_in_hpts(bbr->rc_tp);
 	l->use_lt_bw = bbr->rc_lt_use_bw;
 	l->pkts_out = bbr->r_ctl.rc_flight_at_input;
 	l->pkt_epoch = bbr->r_ctl.rc_pkt_epoch;
 }
 
 /*
  * Emit a BBR_LOG_BW_RED_EV black box log record, stamped with
  * rc_rcvtime.  flex4 carries rc_pkt_epoch_loss_rate, flex6 carries
  * rc_bbr_enters_probertt and flex7 the caller supplied reason; the
  * remaining flex fields are explicitly zeroed.  Does nothing unless
  * black box logging is on for the connection.
  */
 static void
 bbr_log_type_bw_reduce(struct tcp_bbr *bbr, int reason)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = 0;
 	log.u_bbr.flex2 = 0;
 	log.u_bbr.flex3 = 0;
 	log.u_bbr.flex4 = bbr->r_ctl.rc_pkt_epoch_loss_rate;
 	log.u_bbr.flex5 = 0;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_bbr_enters_probertt;
 	log.u_bbr.flex7 = reason;
 	log.u_bbr.flex8 = 0;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_BW_RED_EV, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_LOWGAIN black box log record, stamped with
  * rc_rcvtime, carrying seq in flex1, count in flex2 and mode in flex8.
  * Does nothing unless black box logging is on for the connection.
  */
 static void
 bbr_log_type_rwnd_collapse(struct tcp_bbr *bbr, int seq, int mode, uint32_t count)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = seq;
 	log.u_bbr.flex2 = count;
 	log.u_bbr.flex8 = mode;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_LOWGAIN, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_JUSTRET black box log record with tlen as the event
  * length.  The common pkts_out field is overwritten with 0 and
  * applimited with len.
  *
  * NOTE(review): hpts_calling is accepted but never recorded, while
  * p_maxseg (flex1/flex7) and rc_in_persist (flex5/flex8) are each
  * stored twice -- confirm this is intended.
  */
 static void
 bbr_log_type_just_return(struct tcp_bbr *bbr, uint32_t cts, uint32_t tlen, uint8_t hpts_calling,
     uint8_t reason, uint32_t p_maxseg, int len)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Values derived from the arguments. */
 	log.u_bbr.flex1 = p_maxseg;
 	log.u_bbr.flex4 = reason;
 	log.u_bbr.flex7 = p_maxseg;
 	log.u_bbr.applimited = len;
 	log.u_bbr.pkts_out = 0;
 	/* Values copied from the connection state. */
 	log.u_bbr.flex2 = bbr->r_ctl.rc_hpts_flags;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_timer_exp;
 	log.u_bbr.flex5 = bbr->rc_in_persist;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_last_delay_val;
 	log.u_bbr.flex8 = bbr->rc_in_persist;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_JUSTRET, 0, tlen,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_ENTREC black box log record, stamped with rc_rcvtime,
  * carrying seq in flex1, rc_cwnd_on_ent in flex2 and rc_recovery_start
  * in flex3.  Does nothing unless black box logging is on.
  */
 static void
 bbr_log_type_enter_rec(struct tcp_bbr *bbr, uint32_t seq)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = seq;
 	log.u_bbr.flex2 = bbr->r_ctl.rc_cwnd_on_ent;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_recovery_start;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_ENTREC, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_MSGSIZE black box log record carrying tso (flex1),
  * maxseg (flex2), mtu (flex3) and csum_flags (flex4).  The logging
  * check and the event are issued against tp, while the socket buffers
  * are taken from bbr->rc_inp.  The len argument is not recorded.
  */
 static void
 bbr_log_msgsize_fail(struct tcp_bbr *bbr, struct tcpcb *tp, uint32_t len, uint32_t maxseg, uint32_t mtu, int32_t csum_flags, int32_t tso, uint32_t cts)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = tso;
 	log.u_bbr.flex2 = maxseg;
 	log.u_bbr.flex3 = mtu;
 	log.u_bbr.flex4 = csum_flags;
 	TCP_LOG_EVENTP(tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_MSGSIZE, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a TCP_LOG_FLOWEND black box log record.  Unlike the other
  * logging helpers here, the socket may already be gone, so the socket
  * buffer pointers are NULL when inp_socket is not set, and the record
  * is stamped with a freshly read time instead of bbr->rc_tv.
  */
 static void
 bbr_log_flowend(struct tcp_bbr *bbr)
 {
 	union tcp_log_stackspecific log;
 	struct sockbuf *rcv, *snd;
 	struct timeval tv;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	rcv = NULL;
 	snd = NULL;
 	if (bbr->rc_inp->inp_socket) {
 		rcv = &bbr->rc_inp->inp_socket->so_rcv;
 		snd = &bbr->rc_inp->inp_socket->so_snd;
 	}
 	bbr_fill_in_logging_data(bbr, &log.u_bbr, tcp_get_usecs(&tv));
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL, rcv, snd,
 	    TCP_LOG_FLOWEND, 0, 0,
 	    &log, false, &tv);
 }
 
 /*
  * Emit a BBR_LOG_PKT_EPOCH black box log record.  lost and del go in
  * flex1/flex2 and the caller's line in flex7; the common inflight
  * field is overwritten with r_measurement_count.
  */
 static void
 bbr_log_pkt_epoch(struct tcp_bbr *bbr, uint32_t cts, uint32_t line,
     uint32_t lost, uint32_t del)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex1 = lost;
 	log.u_bbr.flex2 = del;
 	log.u_bbr.flex7 = line;
 	log.u_bbr.flex8 = 0;
 	/* Connection state. */
 	log.u_bbr.flex3 = bbr->r_ctl.rc_bbr_lastbtlbw;
 	log.u_bbr.flex4 = bbr->r_ctl.rc_pkt_epoch_rtt;
 	log.u_bbr.flex5 = bbr->r_ctl.rc_bbr_last_startup_epoch;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_lost_at_startup;
 	log.u_bbr.inflight = bbr->r_ctl.r_measurement_count;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_PKT_EPOCH, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_TIME_EPOCH black box log record carrying rc_lost
  * (flex1), the send buffer low/high water marks (flex2/flex3) and the
  * caller's line (flex7).  Only logged when bbr_verbose_logging is set
  * and black box logging is on.  The epoch_time argument is not
  * recorded.
  */
 static void
 bbr_log_time_epoch(struct tcp_bbr *bbr, uint32_t cts, uint32_t line, uint32_t epoch_time)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = bbr->r_ctl.rc_lost;
 	log.u_bbr.flex2 = bbr->rc_inp->inp_socket->so_snd.sb_lowat;
 	log.u_bbr.flex3 = bbr->rc_inp->inp_socket->so_snd.sb_hiwat;
 	log.u_bbr.flex7 = line;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_TIME_EPOCH, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_STATE_TARGET black box log record, stamped with
  * rc_rcvtime.  flex1 holds the current rc_target_at_state and flex2
  * the new target (new_tar); line and meth go in flex3 and flex8.
  */
 static void
 bbr_log_set_of_state_target(struct tcp_bbr *bbr, uint32_t new_tar, int line, int meth)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	/* Caller supplied values. */
 	log.u_bbr.flex2 = new_tar;
 	log.u_bbr.flex3 = line;
 	log.u_bbr.flex8 = meth;
 	/* Connection and global state. */
 	log.u_bbr.flex1 = bbr->r_ctl.rc_target_at_state;
 	log.u_bbr.flex4 = bbr->r_ctl.rc_pace_max_segs;
 	log.u_bbr.flex5 = bbr_quanta;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_pace_min_segs;
 	log.u_bbr.flex7 = bbr->rc_last_options;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_STATE_TARGET, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_STATE black box log record.  flex4 is the RTT
  * returned by bbr_get_rtt(), using BBR_RTT_PKTRTT when
  * bbr_state_is_pkt_epoch is non-zero and BBR_RTT_PROP otherwise.  The
  * common lt_epoch and pkts_out fields are overwritten with
  * rc_level_state_extra and rc_target_at_state respectively.
  */
 static void
 bbr_log_type_statechange(struct tcp_bbr *bbr, uint32_t cts, int32_t line)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = line;
 	log.u_bbr.flex2 = bbr->r_ctl.rc_rtt_shrinks;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_probertt_int;
 	log.u_bbr.flex4 = bbr_get_rtt(bbr,
 	    bbr_state_is_pkt_epoch ? BBR_RTT_PKTRTT : BBR_RTT_PROP);
 	log.u_bbr.flex5 = bbr->r_ctl.rc_bbr_last_startup_epoch;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_lost_at_startup;
 	/* flex7 gets the target divided by 1000; pkts_out the full value. */
 	log.u_bbr.flex7 = (bbr->r_ctl.rc_target_at_state/1000);
 	log.u_bbr.pkts_out = bbr->r_ctl.rc_target_at_state;
 	log.u_bbr.lt_epoch = bbr->r_ctl.rc_level_state_extra;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_STATE, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_RTT_SHRINKS black box log record.  The caller's
  * line, applied, rtt, cond and reas values are stored in flex1, flex4,
  * flex5, flex7 and flex8; flex2, flex3 and flex6 come from the
  * connection state.
  */
 static void
 bbr_log_rtt_shrinks(struct tcp_bbr *bbr, uint32_t cts, uint32_t applied,
 		    uint32_t rtt, uint32_t line, uint8_t reas, uint16_t cond)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex1 = line;
 	log.u_bbr.flex4 = applied;
 	log.u_bbr.flex5 = rtt;
 	log.u_bbr.flex7 = cond;
 	log.u_bbr.flex8 = reas;
 	/* Connection state. */
 	log.u_bbr.flex2 = bbr->r_ctl.rc_rtt_shrinks;
 	log.u_bbr.flex3 = bbr->r_ctl.last_in_probertt;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_target_at_state;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_RTT_SHRINKS, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_EXITREC black box log record, stamped with
  * rc_rcvtime, carrying rc_recovery_start (flex1), rc_cwnd_on_ent
  * (flex2) and rc_target_at_state (flex5).
  */
 static void
 bbr_log_type_exit_rec(struct tcp_bbr *bbr)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = bbr->r_ctl.rc_recovery_start;
 	log.u_bbr.flex2 = bbr->r_ctl.rc_cwnd_on_ent;
 	log.u_bbr.flex5 = bbr->r_ctl.rc_target_at_state;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_EXITREC, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_CWND black box log record, stamped with rc_rcvtime,
  * describing a congestion window update.  All recorded values come
  * from the arguments.  Only logged when bbr_verbose_logging is set and
  * black box logging is on.
  */
 static void
 bbr_log_type_cwndupd(struct tcp_bbr *bbr, uint32_t bytes_this_ack, uint32_t chg,
     uint32_t prev_acked, int32_t meth, uint32_t target, uint32_t th_ack, int32_t line)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = line;
 	log.u_bbr.flex2 = prev_acked;
 	log.u_bbr.flex3 = bytes_this_ack;
 	log.u_bbr.flex4 = chg;
 	log.u_bbr.flex5 = th_ack;
 	log.u_bbr.flex6 = target;
 	log.u_bbr.flex8 = meth;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_CWND, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a TCP_LOG_RTT black box log record for the rtt sample (in
  * useconds) that is being applied to the srtt algorithm.  The common
  * pkts_out field is overwritten with bbr->rc_tv converted by
  * tcp_tv_to_mssectick().
  */
 static void
 bbr_log_rtt_sample(struct tcp_bbr *bbr, uint32_t rtt, uint32_t tsin)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = rtt;
 	log.u_bbr.flex2 = bbr->r_ctl.rc_bbr_state_time;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_ack_hdwr_delay;
 	log.u_bbr.flex4 = bbr->rc_tp->ts_offset;
 	log.u_bbr.flex5 = bbr->r_ctl.rc_target_at_state;
 	log.u_bbr.pkts_out = tcp_tv_to_mssectick(&bbr->rc_tv);
 	log.u_bbr.flex6 = tsin;
 	log.u_bbr.flex7 = 0;
 	log.u_bbr.flex8 = bbr->rc_ack_was_delayed;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    TCP_LOG_RTT, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_PERSIST black box log record carrying time_in
  * (flex1), line (flex2) and enter_exit (flex8).  Only logged when
  * bbr_verbose_logging is set and black box logging is on.
  */
 static void
 bbr_log_type_pesist(struct tcp_bbr *bbr, uint32_t cts, uint32_t time_in, int32_t line, uint8_t enter_exit)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = time_in;
 	log.u_bbr.flex2 = line;
 	log.u_bbr.flex8 = enter_exit;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_PERSIST, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 /*
  * Emit a BBR_LOG_ACKCLEAR black box log record carrying ts_recent_age
  * (flex1), rc_rtt_shrinks (flex2), rc_probertt_int (flex3),
  * rc_went_idle_time (flex4) and rc_target_at_state (flex5).  Only
  * logged when bbr_verbose_logging is set and black box logging is on.
  */
 static void
 bbr_log_ack_clear(struct tcp_bbr *bbr, uint32_t cts)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = bbr->rc_tp->ts_recent_age;
 	log.u_bbr.flex2 = bbr->r_ctl.rc_rtt_shrinks;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_probertt_int;
 	log.u_bbr.flex4 = bbr->r_ctl.rc_went_idle_time;
 	log.u_bbr.flex5 = bbr->r_ctl.rc_target_at_state;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_ACKCLEAR, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a TCP_LOG_IN black box log record for an inbound segment, with
  * th as the logged header and tlen as the event length.
  *
  * When an mbuf is supplied its flags go in flex3, the M_TSTMP
  * timestamp (if flagged) replaces the common lt_epoch field, the
  * M_TSTMP_LRO timestamp (if flagged) goes in flex5, and the common
  * pkts_out field is replaced by the time read at logging.  Without an
  * mbuf those fields are zeroed.  The to and nxt_pkt arguments are not
  * recorded.
  */
 static void
 bbr_log_ack_event(struct tcp_bbr *bbr, struct tcphdr *th, struct tcpopt *to, uint32_t tlen,
 		  uint16_t nsegs, uint32_t cts, int32_t nxt_pkt, struct mbuf *m)
 {
 	union tcp_log_stackspecific log;
 	struct timeval tv;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = nsegs;
 	log.u_bbr.flex2 = bbr->r_ctl.rc_lost_bytes;
 	if (m == NULL) {
 		log.u_bbr.flex3 = 0;
 		log.u_bbr.flex5 = 0;
 		log.u_bbr.flex6 = 0;
 		log.u_bbr.pkts_out = 0;
 	} else {
 		struct timespec ts;

 		log.u_bbr.flex3 = m->m_flags;
 		if (m->m_flags & M_TSTMP) {
 			/* Convert the mbuf timestamp to a timeval first. */
 			mbuf_tstmp2timespec(m, &ts);
 			tv.tv_sec = ts.tv_sec;
 			tv.tv_usec = ts.tv_nsec / 1000;
 			log.u_bbr.lt_epoch = tcp_tv_to_usectick(&tv);
 		} else {
 			log.u_bbr.lt_epoch = 0;
 		}
 		if (m->m_flags & M_TSTMP_LRO) {
 			mbuf_tstmp2timeval(m, &tv);
 			log.u_bbr.flex5 = tcp_tv_to_usectick(&tv);
 		} else {
 			/* No arrival timestamp */
 			log.u_bbr.flex5 = 0;
 		}
 		/* tv is only scratch space; the event itself uses rc_tv. */
 		log.u_bbr.pkts_out = tcp_get_usecs(&tv);
 	}
 	log.u_bbr.flex4 = bbr->r_ctl.rc_target_at_state;
 	log.u_bbr.flex7 = bbr->r_wanted_output;
 	log.u_bbr.flex8 = bbr->rc_in_persist;
 	TCP_LOG_EVENTP(bbr->rc_tp, th,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    TCP_LOG_IN, 0, tlen,
 	    &log, true, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_DOSEG_DONE black box log record.  did_out and nxt_pkt
  * go in flex1/flex2; the common pkts_out field is overwritten with
  * highest_hdwr_delay.
  */
 static void
 bbr_log_doseg_done(struct tcp_bbr *bbr, uint32_t cts, int32_t nxt_pkt, int32_t did_out)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex1 = did_out;
 	log.u_bbr.flex2 = nxt_pkt;
 	/* Connection state. */
 	log.u_bbr.flex3 = bbr->r_ctl.rc_last_delay_val;
 	log.u_bbr.flex4 = bbr->r_ctl.rc_hpts_flags;
 	log.u_bbr.flex5 = bbr->r_ctl.rc_timer_exp;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_lost_bytes;
 	log.u_bbr.flex7 = bbr->r_wanted_output;
 	log.u_bbr.flex8 = bbr->rc_in_persist;
 	log.u_bbr.pkts_out = bbr->r_ctl.highest_hdwr_delay;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_DOSEG_DONE, 0, 0,
 	    &log, true, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_ENOBUF_JMP black box log record with ENOBUFS as the
  * error number and len as the event length.  line, o_len, segcnt and
  * segsiz are stored in flex1 through flex4.
  */
 static void
 bbr_log_enobuf_jmp(struct tcp_bbr *bbr, uint32_t len, uint32_t cts,
     int32_t line, uint32_t o_len, uint32_t segcnt, uint32_t segsiz)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = line;
 	log.u_bbr.flex2 = o_len;
 	log.u_bbr.flex3 = segcnt;
 	log.u_bbr.flex4 = segsiz;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_ENOBUF_JMP, ENOBUFS, len,
 	    &log, true, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_TO_PROCESS black box log record.  timers, ret, cts
  * and hpts_calling are stored in flex1, flex2, flex5 and flex8; the
  * other flex fields come from the connection state.
  */
 static void
 bbr_log_to_processing(struct tcp_bbr *bbr, uint32_t cts, int32_t ret, int32_t timers, uint8_t hpts_calling)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex1 = timers;
 	log.u_bbr.flex2 = ret;
 	log.u_bbr.flex5 = cts;
 	log.u_bbr.flex8 = hpts_calling;
 	/* Connection state. */
 	log.u_bbr.flex3 = bbr->r_ctl.rc_timer_exp;
 	log.u_bbr.flex4 = bbr->r_ctl.rc_hpts_flags;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_target_at_state;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_TO_PROCESS, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_RTO black box log record for timeout number to_num
  * (flex8).  rc_resend is widened to 64 bits and split across two
  * 32-bit fields: the upper half in flex4 and the lower half in flex5.
  * flex6 is t_rxtcur passed through TICKS_2_USEC().
  */
 static void
 bbr_log_to_event(struct tcp_bbr *bbr, uint32_t cts, int32_t to_num)
 {
 	union tcp_log_stackspecific log;
 	uint64_t resend;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = bbr->bbr_timer_src;
 	log.u_bbr.flex2 = 0;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_hpts_flags;
 	/* The uint32_t casts keep exactly the 32 bits wanted. */
 	resend = (uint64_t)(bbr->r_ctl.rc_resend);
 	log.u_bbr.flex4 = (uint32_t)(resend >> 32);
 	log.u_bbr.flex5 = (uint32_t)resend;
 	log.u_bbr.flex6 = TICKS_2_USEC(bbr->rc_tp->t_rxtcur);
 	log.u_bbr.flex8 = to_num;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_RTO, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_REDUCE black box log record.  The caller chooses the
  * contents of flex1 through flex3 and the reason (flex8); the common
  * cur_del_rate field is overwritten with rc_bbr_lastbtlbw.
  */
 static void
 bbr_log_startup_event(struct tcp_bbr *bbr, uint32_t cts, uint32_t flex1, uint32_t flex2, uint32_t flex3, uint8_t reason)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex1 = flex1;
 	log.u_bbr.flex2 = flex2;
 	log.u_bbr.flex3 = flex3;
 	log.u_bbr.flex4 = 0;
 	log.u_bbr.flex8 = reason;
 	/* Connection state. */
 	log.u_bbr.flex5 = bbr->r_ctl.rc_target_at_state;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_lost_at_startup;
 	log.u_bbr.cur_del_rate = bbr->r_ctl.rc_bbr_lastbtlbw;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_REDUCE, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_HPTSDIAG black box log record holding the contents of
  * an hpts_diag structure.  There are more diagnostic values than flex
  * fields, so most of the common fields are overwritten as well;
  * cur_del_rate packs p_curtick in its upper 32 bits and p_lasttick in
  * the lower bits.  Only logged when bbr_verbose_logging is set and
  * black box logging is on.
  */
 static void
 bbr_log_hpts_diag(struct tcp_bbr *bbr, uint32_t cts, struct hpts_diag *diag)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = diag->p_nxt_slot;
 	log.u_bbr.flex2 = diag->p_cur_slot;
 	log.u_bbr.flex3 = diag->slot_req;
 	log.u_bbr.flex4 = diag->inp_hptsslot;
 	log.u_bbr.flex5 = diag->slot_remaining;
 	log.u_bbr.flex6 = diag->need_new_to;
 	log.u_bbr.flex7 = diag->p_hpts_active;
 	log.u_bbr.flex8 = diag->p_on_min_sleep;

 	/* Out of flex fields: borrow the common ones. */
 	log.u_bbr.epoch = diag->have_slept;
 	log.u_bbr.lt_epoch = diag->yet_to_sleep;
 	log.u_bbr.pkts_out = diag->co_ret;
 	log.u_bbr.applimited = diag->hpts_sleep_time;
 	log.u_bbr.delivered = diag->p_prev_slot;
 	log.u_bbr.inflight = diag->p_runningslot;
 	log.u_bbr.bw_inuse = diag->wheel_slot;
 	log.u_bbr.rttProp = diag->wheel_cts;
 	log.u_bbr.delRate = diag->maxslots;

 	/* Two tick values share cur_del_rate. */
 	log.u_bbr.cur_del_rate = diag->p_curtick;
 	log.u_bbr.cur_del_rate <<= 32;
 	log.u_bbr.cur_del_rate |= diag->p_lasttick;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_HPTSDIAG, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_TIMERPREP black box log record.  The caller's
  * time_since_sent, srtt, thresh, to and mode values are stored
  * alongside the connection's t_rttvar (flex1) and t_srtt (flex6).
  * Only logged when bbr_verbose_logging is set and black box logging
  * is on.
  */
 static void
 bbr_log_timer_var(struct tcp_bbr *bbr, int mode, uint32_t cts, uint32_t time_since_sent, uint32_t srtt,
     uint32_t thresh, uint32_t to)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex2 = time_since_sent;
 	log.u_bbr.flex3 = srtt;
 	log.u_bbr.flex4 = thresh;
 	log.u_bbr.flex5 = to;
 	log.u_bbr.flex8 = mode;
 	/* Values kept in the tcpcb. */
 	log.u_bbr.flex1 = bbr->rc_tp->t_rttvar;
 	log.u_bbr.flex6 = bbr->rc_tp->t_srtt;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_TIMERPREP, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_HPTSI_CALC black box log record with len as the event
  * length.  The 64-bit bw is split across flex3 (upper 32 bits) and
  * flex4 (lower 32 bits).  flex5 is (1 << 2) when override is non-zero
  * and 0 otherwise, while flex6 holds override itself.
  */
 static void
 bbr_log_pacing_delay_calc(struct tcp_bbr *bbr, uint16_t gain, uint32_t len,
     uint32_t cts, uint32_t usecs, uint64_t bw, uint32_t override, int mod)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = usecs;
 	log.u_bbr.flex2 = len;
 	/* The uint32_t casts keep exactly the 32 bits wanted. */
 	log.u_bbr.flex3 = (uint32_t)(bw >> 32);
 	log.u_bbr.flex4 = (uint32_t)bw;
 	log.u_bbr.flex5 = override ? (1 << 2) : 0;
 	log.u_bbr.flex6 = override;
 	log.u_bbr.flex7 = gain;
 	log.u_bbr.flex8 = mod;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_HPTSI_CALC, 0, len,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_TIMERSTAR black box log record.  to, slot and which
  * are stored in flex2, flex4 and flex8; flex6 is t_rxtcur passed
  * through TICKS_2_USEC() and the common pkts_out field is overwritten
  * with the tcpcb's t_flags2.
  */
 static void
 bbr_log_to_start(struct tcp_bbr *bbr, uint32_t cts, uint32_t to, int32_t slot, uint8_t which)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = bbr->bbr_timer_src;
 	log.u_bbr.flex2 = to;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_hpts_flags;
 	log.u_bbr.flex4 = slot;
 	log.u_bbr.flex5 = bbr->rc_tp->t_hpts_slot;
 	log.u_bbr.flex6 = TICKS_2_USEC(bbr->rc_tp->t_rxtcur);
 	log.u_bbr.flex8 = which;
 	log.u_bbr.pkts_out = bbr->rc_tp->t_flags2;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_TIMERSTAR, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_THRESH_CALC black box log record.  flex4 is the
  * r_tim_lastsent[] entry at index r_rtr_cnt - 1 of rsm, which is
  * dereferenced unconditionally.  Only logged when bbr_verbose_logging
  * is set and black box logging is on.
  */
 static void
 bbr_log_thresh_choice(struct tcp_bbr *bbr, uint32_t cts, uint32_t thresh, uint32_t lro, uint32_t srtt, struct bbr_sendmap *rsm, uint8_t frm)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = thresh;
 	log.u_bbr.flex2 = lro;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_reorder_ts;
 	log.u_bbr.flex4 = rsm->r_tim_lastsent[(rsm->r_rtr_cnt - 1)];
 	log.u_bbr.flex5 = TICKS_2_USEC(bbr->rc_tp->t_rxtcur);
 	log.u_bbr.flex6 = srtt;
 	log.u_bbr.flex7 = bbr->r_ctl.rc_reorder_shift;
 	log.u_bbr.flex8 = frm;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_THRESH_CALC, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_TIMERCANC black box log record.  line and
  * hpts_removed are stored in flex1 and flex8; flex6 is t_rxtcur passed
  * through TICKS_2_USEC() and the common pkts_out field is overwritten
  * with rc_pacer_started.
  */
 static void
 bbr_log_to_cancel(struct tcp_bbr *bbr, int32_t line, uint32_t cts, uint8_t hpts_removed)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = line;
 	log.u_bbr.flex2 = bbr->bbr_timer_src;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_hpts_flags;
 	log.u_bbr.flex4 = bbr->rc_in_persist;
 	log.u_bbr.flex5 = bbr->r_ctl.rc_target_at_state;
 	log.u_bbr.flex6 = TICKS_2_USEC(bbr->rc_tp->t_rxtcur);
 	log.u_bbr.flex8 = hpts_removed;
 	log.u_bbr.pkts_out = bbr->rc_pacer_started;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_TIMERCANC, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_TSTMP_VAL black box log record, stamped with
  * rc_rcvtime.  Each 64-bit delta is split into two fields: peer_delta
  * into flex2 (upper half) and flex3 (lower half), delta into flex4
  * (upper half) and flex5 (lower half).
  */
 static void
 bbr_log_tstmp_validation(struct tcp_bbr *bbr, uint64_t peer_delta, uint64_t delta)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = bbr->r_ctl.bbr_peer_tsratio;
 	/* Peer's delta: high word, then low word. */
 	log.u_bbr.flex2 = (peer_delta >> 32);
 	log.u_bbr.flex3 = (peer_delta & 0x00000000ffffffff);
 	/* Our delta: high word, then low word. */
 	log.u_bbr.flex4 = (delta >> 32);
 	log.u_bbr.flex5 = (delta & 0x00000000ffffffff);
 	log.u_bbr.flex7 = bbr->rc_ts_clock_set;
 	log.u_bbr.flex8 = bbr->rc_ts_cant_be_used;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_TSTMP_VAL, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_BBRTSO black box log record.  flex7 packs
  * rc_no_pacing (shifted left by one) together with rc_past_init_win.
  * flex8 holds rc_use_google, with 0x80 or'ed in when hdwr is
  * non-zero.
  */
 static void
 bbr_log_type_tsosize(struct tcp_bbr *bbr, uint32_t cts, uint32_t tsosz, uint32_t tls, uint32_t old_val, uint32_t maxseg, int hdwr)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = tsosz;
 	log.u_bbr.flex2 = tls;
 	log.u_bbr.flex3 = tcp_min_hptsi_time;
 	log.u_bbr.flex4 = bbr->r_ctl.bbr_hptsi_bytes_min;
 	log.u_bbr.flex5 = old_val;
 	log.u_bbr.flex6 = maxseg;
 	/* Build the two-flag value in place. */
 	log.u_bbr.flex7 = bbr->rc_no_pacing;
 	log.u_bbr.flex7 <<= 1;
 	log.u_bbr.flex7 |= bbr->rc_past_init_win;
 	/* 0x80 marks the hdwr case. */
 	log.u_bbr.flex8 = hdwr ? (0x80 | bbr->rc_use_google) :
 	    bbr->rc_use_google;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_BBRTSO, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_RSM_CLEARED black box log record describing the send map
  * entry rsm: its start/end, delivered, retransmit count, dupack count,
  * first r_tim_lastsent[] entry and flags.  The caller's flags value is
  * stored in the common applimited field.
  */
 static void
 bbr_log_type_rsmclear(struct tcp_bbr *bbr, uint32_t cts, struct bbr_sendmap *rsm,
 		      uint32_t flags, uint32_t line)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = line;
 	/* Snapshot of the send map entry. */
 	log.u_bbr.flex2 = rsm->r_start;
 	log.u_bbr.flex3 = rsm->r_end;
 	log.u_bbr.flex4 = rsm->r_delivered;
 	log.u_bbr.flex5 = rsm->r_rtr_cnt;
 	log.u_bbr.flex6 = rsm->r_dupack;
 	log.u_bbr.flex7 = rsm->r_tim_lastsent[0];
 	log.u_bbr.flex8 = rsm->r_flags;
 	/* Hijack the applimited field for the caller's flags. */
 	log.u_bbr.applimited = flags;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_RSM_CLEARED, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_BBRUPD black box log record whose flex fields and
  * pkts_out are all chosen by the caller; flex2 is also used as the
  * event length.  The common epoch field is overwritten with
  * rc_ack_hdwr_delay when rc_ack_was_delayed is set, and with 0
  * otherwise.
  */
 static void
 bbr_log_type_bbrupd(struct tcp_bbr *bbr, uint8_t flex8, uint32_t cts,
     uint32_t flex3, uint32_t flex2, uint32_t flex5,
     uint32_t flex6, uint32_t pkts_out, int flex7,
     uint32_t flex4, uint32_t flex1)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex1 = flex1;
 	log.u_bbr.flex2 = flex2;
 	log.u_bbr.flex3 = flex3;
 	log.u_bbr.flex4 = flex4;
 	log.u_bbr.flex5 = flex5;
 	log.u_bbr.flex6 = flex6;
 	log.u_bbr.flex7 = flex7;
 	log.u_bbr.flex8 = flex8;
 	/* Hijack the pkts_out field for the caller's value. */
 	log.u_bbr.pkts_out = pkts_out;
 	if (bbr->rc_ack_was_delayed == 0)
 		log.u_bbr.epoch = 0;
 	else
 		log.u_bbr.epoch = bbr->r_ctl.rc_ack_hdwr_delay;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_BBRUPD, 0, flex2,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_BWSAMP black box log record.  The common bw_inuse
  * field is overwritten with rc_lt_bw and pkts_out with tim.  The
  * common epoch field becomes the distance from rc_pkt_epoch to
  * rc_lt_epoch_use when rc_lt_use_bw is set, or to rc_lt_epoch when it
  * is not.  This event is not gated on bbr_verbose_logging.
  */
 static void
 bbr_log_type_ltbw(struct tcp_bbr *bbr, uint32_t cts, int32_t reason,
 	uint32_t newbw, uint32_t obw, uint32_t diff,
 	uint32_t tim)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex1 = reason;
 	log.u_bbr.flex2 = newbw;
 	log.u_bbr.flex3 = obw;
 	log.u_bbr.flex4 = diff;
 	log.u_bbr.pkts_out = tim;
 	/* Connection state. */
 	log.u_bbr.flex5 = bbr->r_ctl.rc_lt_lost;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_lt_del;
 	log.u_bbr.flex7 = bbr->rc_lt_is_sampling;
 	log.u_bbr.bw_inuse = bbr->r_ctl.rc_lt_bw;
 	if (bbr->rc_lt_use_bw != 0)
 		log.u_bbr.epoch = bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_lt_epoch_use;
 	else
 		log.u_bbr.epoch = bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_lt_epoch;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_BWSAMP, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_PROGRESS black box log record, stamped with
  * rc_rcvtime.  line, tick and event are stored in flex1, flex2 and
  * flex8; t_maxunacktime and t_acktime are read from tp, while the
  * logging check and the event itself use bbr->rc_tp.  Only logged when
  * bbr_verbose_logging is set and black box logging is on.
  */
 static inline void
 bbr_log_progress_event(struct tcp_bbr *bbr, struct tcpcb *tp, uint32_t tick, int event, int line)
 {
 	union tcp_log_stackspecific log;

 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex1 = line;
 	log.u_bbr.flex2 = tick;
 	log.u_bbr.flex3 = tp->t_maxunacktime;
 	log.u_bbr.flex4 = tp->t_acktime;
 	log.u_bbr.flex8 = event;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_PROGRESS, 0, 0,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_HDWR_PACE black box log record.
  *
  * bbr     - BBR control block.
  * ifp     - interface pointer; only its address is logged, split into
  *           flex3 (upper 32 bits) and flex4 (lower 32 bits).
  * rate    - stored in the common bw_inuse field.
  * hw_rate - split into flex1 (upper 32 bits) and flex2 (lower 32 bits).
  * line    - stored in flex5.
  * cts     - timestamp for the record.
  * error   - stored in flex6.
  *
  * flex8 packs three flags, from most to least significant bit:
  * skip_gain, gain_is_limited and bbr_hdrw_pacing.  The common pkts_out
  * field is overwritten with the tcpcb's t_maxseg.
  */
 static void
 bbr_type_log_hdwr_pacing(struct tcp_bbr *bbr, const struct ifnet *ifp,
 			 uint64_t rate, uint64_t hw_rate, int line, uint32_t cts,
 			 int error)
 {
 	if (tcp_bblogging_on(bbr->rc_tp)) {
 		union tcp_log_stackspecific log;
 		uint64_t ifp_addr;

 		/*
 		 * Convert the pointer through uintptr_t before widening.
 		 * Casting a pointer directly to uint64_t is a size
 		 * mismatched conversion where pointers are 32 bits wide,
 		 * and may sign-extend into the upper half.
 		 */
 		ifp_addr = (uint64_t)(uintptr_t)ifp;

 		bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 		log.u_bbr.flex1 = ((hw_rate >> 32) & 0x00000000ffffffff);
 		log.u_bbr.flex2 = (hw_rate & 0x00000000ffffffff);
 		log.u_bbr.flex3 = ((ifp_addr >> 32) & 0x00000000ffffffff);
 		log.u_bbr.flex4 = (ifp_addr & 0x00000000ffffffff);
 		log.u_bbr.bw_inuse = rate;
 		log.u_bbr.flex5 = line;
 		log.u_bbr.flex6 = error;
 		/* Shift each flag in, one bit at a time. */
 		log.u_bbr.flex8 = bbr->skip_gain;
 		log.u_bbr.flex8 <<= 1;
 		log.u_bbr.flex8 |= bbr->gain_is_limited;
 		log.u_bbr.flex8 <<= 1;
 		log.u_bbr.flex8 |= bbr->bbr_hdrw_pacing;
 		log.u_bbr.pkts_out = bbr->rc_tp->t_maxseg;
 		TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 		    &bbr->rc_inp->inp_socket->so_rcv,
 		    &bbr->rc_inp->inp_socket->so_snd,
 		    BBR_LOG_HDWR_PACE, 0,
 		    0, &log, false, &bbr->rc_tv);
 	}
 }
 
 /*
  * Emit a BBR_LOG_BBRSND black box log record with len as the event
  * length.  slot, del_by, prev_delay and line are stored in flex1
  * through flex4; flex7 holds the low 16 bits of rc_hpts_flags.
  */
 static void
 bbr_log_type_bbrsnd(struct tcp_bbr *bbr, uint32_t len, uint32_t slot, uint32_t del_by, uint32_t cts, uint32_t line, uint32_t prev_delay)
 {
 	union tcp_log_stackspecific log;

 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;

 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Caller supplied values. */
 	log.u_bbr.flex1 = slot;
 	log.u_bbr.flex2 = del_by;
 	log.u_bbr.flex3 = prev_delay;
 	log.u_bbr.flex4 = line;
 	/* Connection state. */
 	log.u_bbr.flex5 = bbr->r_ctl.rc_last_delay_val;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_hptsi_agg_delay;
 	log.u_bbr.flex7 = (0x0000ffff & bbr->r_ctl.rc_hpts_flags);
 	log.u_bbr.flex8 = bbr->rc_in_persist;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_BBRSND, 0, len,
 	    &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_BBRRTT record.  The delivered count and lowest RTT
  * come from the connection; t, end, match, seq and flags are logged as
  * passed in.  tsconv is accepted but not recorded.  Nothing is logged
  * unless black-box logging is on for the connection.
  */
 static void
 bbr_log_type_bbrrttprop(struct tcp_bbr *bbr, uint32_t t, uint32_t end, uint32_t tsconv, uint32_t cts, int32_t match, uint32_t seq, uint8_t flags)
 {
 	union tcp_log_stackspecific log;
 
 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;
 
 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	/* Connection state. */
 	log.u_bbr.flex1 = bbr->r_ctl.rc_delivered;
 	log.u_bbr.flex3 = bbr->r_ctl.rc_lowest_rtt;
 	/* Caller supplied values. */
 	log.u_bbr.flex4 = end;
 	log.u_bbr.flex5 = seq;
 	log.u_bbr.flex6 = t;
 	log.u_bbr.flex7 = match;
 	log.u_bbr.flex8 = flags;
 	/* Unused slot. */
 	log.u_bbr.flex2 = 0;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_BBRRTT, 0,
 	    0, &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_EXIT_GAIN record with the current state target, the
  * segment size less options, the gain epoch, the pacing min/max segment
  * sizes, the at-flight state value and the supplied entry_method.
  * Nothing is logged unless black-box logging is on for the connection.
  */
 static void
 bbr_log_exit_gain(struct tcp_bbr *bbr, uint32_t cts, int32_t entry_method)
 {
 	union tcp_log_stackspecific log;
 
 	if (!tcp_bblogging_on(bbr->rc_tp))
 		return;
 
 	bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 	log.u_bbr.flex8 = entry_method;
 	log.u_bbr.flex7 = 0;
 	log.u_bbr.flex6 = bbr->r_ctl.rc_bbr_state_atflight;
 	log.u_bbr.flex5 = bbr->r_ctl.rc_pace_min_segs;
 	log.u_bbr.flex4 = bbr->r_ctl.rc_pace_max_segs;
 	log.u_bbr.flex3 = bbr->r_ctl.gain_epoch;
 	log.u_bbr.flex2 = (bbr->rc_tp->t_maxseg - bbr->rc_last_options);
 	log.u_bbr.flex1 = bbr->r_ctl.rc_target_at_state;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_EXIT_GAIN, 0,
 	    0, &log, false, &bbr->rc_tv);
 }
 
 /*
  * Emit a BBR_LOG_SETTINGS_CHG record.  Only settings_desired (in flex8)
  * carries information; flex1-flex4 and flex7 are explicitly zeroed.
  * Nothing is logged unless verbose logging is enabled and black-box
  * logging is on for the connection.
  */
 static void
 bbr_log_settings_change(struct tcp_bbr *bbr, int settings_desired)
 {
 	union tcp_log_stackspecific log;
 
 	if (!bbr_verbose_logging || !tcp_bblogging_on(bbr->rc_tp))
 		return;
 
 	bbr_fill_in_logging_data(bbr, &log.u_bbr, bbr->r_ctl.rc_rcvtime);
 	log.u_bbr.flex8 = settings_desired;
 	/* The remaining slots written here carry no data. */
 	log.u_bbr.flex7 = 0;
 	log.u_bbr.flex4 = 0;
 	log.u_bbr.flex3 = 0;
 	log.u_bbr.flex2 = 0;
 	log.u_bbr.flex1 = 0;
 	TCP_LOG_EVENTP(bbr->rc_tp, NULL,
 	    &bbr->rc_inp->inp_socket->so_rcv,
 	    &bbr->rc_inp->inp_socket->so_snd,
 	    BBR_LOG_SETTINGS_CHG, 0,
 	    0, &log, false, &bbr->rc_tv);
 }
 
 /*
  * Return the current value held by the delivery-rate filter
  * (r_ctl.rc_delrate).
  */
 static inline uint64_t
 bbr_get_full_bw(struct tcp_bbr *bbr)
 {
 	return (get_filter_value(&bbr->r_ctl.rc_delrate));
 }
 
 /*
  * Close out the current packet epoch and start the next one.
  *
  * Computes the loss rate for the finished epoch as lost * 1000 /
  * delivered (so 1000 means 100.0%), accumulates it into recovery_lr
  * while in recovery, bumps the epoch counter, ends the no-pacing period
  * once no_pacing_until is reached, records the epoch duration, logs the
  * epoch and finally snapshots the delivered/lost counters as the
  * baseline for the next epoch.
  */
 static inline void
 bbr_set_pktepoch(struct tcp_bbr *bbr, uint32_t cts, int32_t line)
 {
 	uint64_t loss_rate;
 	uint32_t lost_delta, del_delta;
 
 	/* Losses and deliveries since the previous epoch boundary. */
 	lost_delta = 0;
 	if (bbr->r_ctl.rc_lost > bbr->r_ctl.rc_lost_at_pktepoch)
 		lost_delta = bbr->r_ctl.rc_lost - bbr->r_ctl.rc_lost_at_pktepoch;
 	del_delta = bbr->r_ctl.rc_delivered - bbr->r_ctl.rc_pkt_epoch_del;
 
 	if (lost_delta == 0) {
 		loss_rate = 0;
 	} else if (del_delta == 0) {
 		/* Losses with nothing delivered count as 100.0% loss. */
 		loss_rate = 1000;
 	} else {
 		loss_rate = ((uint64_t)lost_delta * (uint64_t)1000) /
 		    (uint64_t)del_delta;
 	}
 	bbr->r_ctl.rc_pkt_epoch_loss_rate = (uint32_t)loss_rate;
 	if (IN_RECOVERY(bbr->rc_tp->t_flags))
 		bbr->r_ctl.recovery_lr += (uint32_t)loss_rate;
 
 	bbr->r_ctl.rc_pkt_epoch++;
 	if (bbr->rc_no_pacing &&
 	    (bbr->r_ctl.rc_pkt_epoch >= bbr->no_pacing_until)) {
 		/* The no-pacing period is over. */
 		bbr->rc_no_pacing = 0;
 		tcp_bbr_tso_size_check(bbr, cts);
 	}
 	bbr->r_ctl.rc_pkt_epoch_rtt = bbr_calc_time(cts, bbr->r_ctl.rc_pkt_epoch_time);
 	bbr->r_ctl.rc_pkt_epoch_time = cts;
 	/* Log before the baselines below are overwritten. */
 	bbr_log_pkt_epoch(bbr, cts, line, lost_delta, del_delta);
 	bbr->r_ctl.rc_pkt_epoch_del = bbr->r_ctl.rc_delivered;
 	bbr->r_ctl.rc_lost_at_pktepoch = bbr->r_ctl.rc_lost;
 }
 
 /*
  * Advance the RTT epoch counter, log how long the previous epoch lasted
  * and restart the epoch clock at cts.
  */
 static inline void
 bbr_set_epoch(struct tcp_bbr *bbr, uint32_t cts, int32_t line)
 {
 	uint32_t elapsed;
 
 	elapsed = cts - bbr->r_ctl.rc_rcv_epoch_start;
 	bbr->r_ctl.rc_rtt_epoch++;
 	bbr_log_time_epoch(bbr, cts, line, elapsed);
 	bbr->r_ctl.rc_rcv_epoch_start = cts;
 }
 
 /*
  * Flag a packet-epoch boundary (rc_is_pkt_epoch_now) when the sendmap
  * entry's delivered mark has reached the delivered count recorded at
  * the start of the current packet epoch.  cts, line and cum_acked are
  * not used.
  */
 static inline void
 bbr_isit_a_pkt_epoch(struct tcp_bbr *bbr, uint32_t cts, struct bbr_sendmap *rsm, int32_t line, int32_t cum_acked)
 {
 	if (!SEQ_GEQ(rsm->r_delivered, bbr->r_ctl.rc_pkt_epoch_del))
 		return;
 	bbr->rc_is_pkt_epoch_now = 1;
 }
 
 /*
  * Return the bandwidth estimate to use for this connection.
  *
  * The estimate is taken from, in order of preference:
  *  - rc_lt_bw, when rc_lt_use_bw is set (the connection is being
  *    treated as policed);
  *  - red_bw, when r_recovery_bw is set and google mode is off;
  *  - the delivery-rate filter (rc_delrate) otherwise.
  *
  * Until enough measurements exist (or the initial window has not yet
  * been passed), and also whenever the selected source yields 0, a guess
  * derived from the initial cwnd and rttProp is used instead, falling
  * back to rc_initial_hptsi_bw.
  *
  * While in BBR_STATE_STARTUP the result is never allowed below a floor
  * (min_bw) computed from the initial cwnd and an RTT.  The value
  * returned is always at least 1.
  */
 static inline uint64_t
 __bbr_get_bw(struct tcp_bbr *bbr)
 {
 	uint64_t bw, min_bw;
 	uint64_t rtt;
 	int gm_measure_cnt = 1;
 
 	/*
 	 * For startup we make, like google, a
 	 * minimum b/w. This is generated from the
 	 * IW and the rttProp. We do fall back to srtt
 	 * if for some reason (initial handshake) we don't
 	 * have a rttProp. We, in the worst case, fall back
 	 * to the configured min_bw (rc_initial_hptsi_bw).
 	 */
 	if (bbr->rc_bbr_state == BBR_STATE_STARTUP) {
 		/* Attempt first to use rttProp */
 		rtt = (uint64_t)get_filter_value_small(&bbr->r_ctl.rc_rttprop);
 		if (rtt && (rtt < 0xffffffff)) {
 			/*
 			 * Also entered via "goto measure" from the srtt
 			 * branch below, with rtt already replaced by srtt.
 			 */
 measure:
 			min_bw = (uint64_t)(bbr_initial_cwnd(bbr, bbr->rc_tp)) *
 				((uint64_t)1000000);
 			min_bw /= rtt;
 			if (min_bw < bbr->r_ctl.rc_initial_hptsi_bw) {
 				min_bw = bbr->r_ctl.rc_initial_hptsi_bw;
 			}
 
 		} else if (bbr->rc_tp->t_srtt != 0) {
 			/* No rttProp, use srtt? */
 			/*
 			 * NOTE(review): the division at "measure" relies on
 			 * bbr_get_rtt(BBR_SRTT) being non-zero whenever
 			 * t_srtt is non-zero -- confirm.
 			 */
 			rtt = bbr_get_rtt(bbr, BBR_SRTT);
 			goto measure;
 		} else {
 			min_bw = bbr->r_ctl.rc_initial_hptsi_bw;
 		}
 	} else
 		min_bw = 0;
 
 	/* Latch the flag once more than an initial window has been delivered. */
 	if ((bbr->rc_past_init_win == 0) &&
 	    (bbr->r_ctl.rc_delivered > bbr_initial_cwnd(bbr, bbr->rc_tp)))
 		bbr->rc_past_init_win = 1;
 	/* In google mode a single measurement is enough to leave the guess. */
 	if ((bbr->rc_use_google)  && (bbr->r_ctl.r_measurement_count >= 1))
 		gm_measure_cnt = 0;
 	if (gm_measure_cnt &&
 	    ((bbr->r_ctl.r_measurement_count < bbr_min_measurements_req) ||
 	     (bbr->rc_past_init_win == 0))) {
 		/* For google we use our guess rate until we get 1 measurement */
 
 		/*
 		 * Also entered via "goto use_initial_window" below when the
 		 * selected bandwidth source reports 0.
 		 */
 use_initial_window:
 		rtt = (uint64_t)get_filter_value_small(&bbr->r_ctl.rc_rttprop);
 		if (rtt && (rtt < 0xffffffff)) {
 			/*
 			 * We have an RTT measurement. Use that in
 			 * combination with our initial window to calculate
 			 * a b/w.
 			 */
 			bw = (uint64_t)(bbr_initial_cwnd(bbr, bbr->rc_tp)) *
 				((uint64_t)1000000);
 			bw /= rtt;
 			if (bw < bbr->r_ctl.rc_initial_hptsi_bw) {
 				bw = bbr->r_ctl.rc_initial_hptsi_bw;
 			}
 		} else {
 			/* No usable rttProp, punt to the configured default */
 			bw = bbr->r_ctl.rc_initial_hptsi_bw;
 		}
 		if (bw < 1)
 			/* Probably should panic */
 			bw = 1;
 		/* Return the larger of the guess and the startup floor. */
 		if (bw > min_bw)
 			return (bw);
 		else
 			return (min_bw);
 	}
 	if (bbr->rc_lt_use_bw)
 		bw = bbr->r_ctl.rc_lt_bw;
 	else if (bbr->r_recovery_bw && (bbr->rc_use_google == 0))
 		bw = bbr->r_ctl.red_bw;
 	else
 		bw = get_filter_value(&bbr->r_ctl.rc_delrate);
 	if (bw == 0) {
 		/* We should not be at 0, go to the initial window then  */
 		goto use_initial_window;
 	}
 	/* bw is unsigned and non-zero here, so this check cannot fire. */
 	if (bw < 1)
 		/* Probably should panic */
 		bw = 1;
 	if (bw < min_bw)
 		bw = min_bw;
 	return (bw);
 }
 
 /*
  * Return the bandwidth estimate for the connection; a thin wrapper
  * around __bbr_get_bw().
  */
 static inline uint64_t
 bbr_get_bw(struct tcp_bbr *bbr)
 {
 	return (__bbr_get_bw(bbr));
 }
 
 /*
  * Start a new long-term bandwidth sampling interval by snapshotting the
  * current packet epoch, delivery time, delivered count and lost count.
  * cts is not used.
  */
 static inline void
 bbr_reset_lt_bw_interval(struct tcp_bbr *bbr, uint32_t cts)
 {
 	/* Counters first ... */
 	bbr->r_ctl.rc_lt_lost = bbr->r_ctl.rc_lost;
 	bbr->r_ctl.rc_lt_del = bbr->r_ctl.rc_delivered;
 	/* ... then the time/epoch markers. */
 	bbr->r_ctl.rc_lt_time = bbr->r_ctl.rc_del_time;
 	bbr->r_ctl.rc_lt_epoch = bbr->r_ctl.rc_pkt_epoch;
 }
 
 /*
  * Abandon long-term bandwidth sampling altogether: forget the saved
  * bandwidth, clear the "using" and "sampling" flags and restart the
  * sampling interval.
  */
 static inline void
 bbr_reset_lt_bw_sampling(struct tcp_bbr *bbr, uint32_t cts)
 {
 	bbr->r_ctl.rc_lt_bw = 0;
 	bbr->rc_lt_use_bw = 0;
 	bbr->rc_lt_is_sampling = 0;
 	bbr_reset_lt_bw_interval(bbr, cts);
 }
 
 /*
  * Finish a long-term bandwidth sample of bw.
  *
  * If a previous sample exists and the new one is close to it (within
  * bbr_lt_bw_diff, or within 1/bbr_lt_bw_ratio of the previous sample),
  * the connection is considered policed: the two samples are averaged
  * into rc_lt_bw, use of the long-term bandwidth is switched on and the
  * pacing gain is set to BBR_UNIT.  Otherwise the new sample is stored
  * and a fresh sampling interval begins.
  */
 static inline void
 bbr_lt_bw_samp_done(struct tcp_bbr *bbr, uint64_t bw, uint32_t cts, uint32_t timin)
 {
 	uint64_t delta;
 	uint32_t prev_bw;
 
 	if (bbr->r_ctl.rc_lt_bw) {
 		/* Absolute difference between the two samples. */
 		delta = (bbr->r_ctl.rc_lt_bw > bw) ?
 		    (bbr->r_ctl.rc_lt_bw - bw) : (bw - bbr->r_ctl.rc_lt_bw);
 		if ((delta <= bbr_lt_bw_diff) ||
 		    (delta <= (bbr->r_ctl.rc_lt_bw / bbr_lt_bw_ratio))) {
 			/* The samples agree: consider us policed. */
 			prev_bw = (uint32_t)bbr->r_ctl.rc_lt_bw;
 			/* Use the average of the two samples. */
 			bbr->r_ctl.rc_lt_bw = (bw + bbr->r_ctl.rc_lt_bw) / 2;
 			bbr->rc_lt_use_bw = 1;
 			bbr->r_ctl.rc_bbr_hptsi_gain = BBR_UNIT;
 			/*
 			 * The packet epoch is what measures how long the
 			 * policer has been considered active.
 			 */
 			bbr->r_ctl.rc_lt_epoch_use = bbr->r_ctl.rc_pkt_epoch;
 			/* Reason 4: start treating the connection as policed. */
 			bbr_log_type_ltbw(bbr, cts, 4, (uint32_t)bw, prev_bw, (uint32_t)delta, timin);
 			return;
 		}
 	}
 	/* No match (or no previous sample): remember this one and resample. */
 	bbr->r_ctl.rc_lt_bw = bw;
 	bbr_reset_lt_bw_interval(bbr, cts);
 	bbr_log_type_ltbw(bbr, cts, 5, 0, (uint32_t)bw, 0, timin);
 }
 
 /*
  * Shave a random fraction off rc_level_state_extra: draw a value from
  * arc4random_uniform(bbr_rand_ot) and, when it is non-zero, subtract
  * (rc_level_state_extra / value).
  */
 static void
 bbr_randomize_extra_state_time(struct tcp_bbr *bbr)
 {
 	uint32_t divisor, deduct;
 
 	divisor = arc4random_uniform(bbr_rand_ot);
 	if (divisor == 0)
 		return;
 	deduct = bbr->r_ctl.rc_level_state_extra / divisor;
 	bbr->r_ctl.rc_level_state_extra -= deduct;
 }
 /*
  * Pick, at random, the sub-state value from which probe-bw is entered.
  *
  * The extra-time bookkeeping is cleared first.  The value returned lies
  * in 1 .. (BBR_SUBSTATE_COUNT - 1); the caller stores it as the
  * sub-state and the subsequent state change increments it by one, so 0
  * is never returned (that would make the connection start in
  * sub-state 1, DRAIN).  An RTT epoch is also started if at least one
  * rttProp has passed since the last one, and the lost count at state
  * entry is recorded.
  */
 static uint8_t
 bbr_pick_probebw_substate(struct tcp_bbr *bbr, uint32_t cts)
 {
 	uint32_t offset;
 
 	/* Start with no extra time accounted. */
 	bbr->r_ctl.rc_level_state_extra = 0;
 	bbr->rc_hit_state_1 = 0;
 	bbr->r_ctl.rc_exta_time_gd = 0;
 
 	/* offset is in 0 .. (BBR_SUBSTATE_COUNT - 2). */
 	offset = arc4random_uniform((BBR_SUBSTATE_COUNT-1));
 
 	/* Set an epoch */
 	if ((cts - bbr->r_ctl.rc_rcv_epoch_start) >= bbr_get_rtt(bbr, BBR_RTT_PROP))
 		bbr_set_epoch(bbr, cts, __LINE__);
 
 	bbr->r_ctl.bbr_lost_at_state = bbr->r_ctl.rc_lost;
 	return (BBR_SUBSTATE_COUNT - 1 - offset);
 }
 
 /*
  * Long-term bandwidth (policer detection) sampling, driven per call
  * with the current time and whether a loss was detected.
  *
  * Does nothing unless r_use_policer is set.  Two modes:
  *
  *  - Already using the long-term bandwidth (rc_lt_use_bw): stop using
  *    it once more than bbr_lt_bw_max_rtts packet epochs have passed, or
  *    when false-positive detection (bbr_lt_intvl_fp) finds the loss
  *    rate is still at or above bbr_lt_fd_thresh.  Stopping resets the
  *    sampling state and moves to PROBE_BW (pipe filled) or STARTUP.
  *
  *  - Otherwise: begin sampling at the first loss, and finish a sample
  *    when a loss occurs after at least bbr_lt_intvl_min_rtts packet
  *    epochs with a loss rate at or above bbr_lt_loss_thresh and at
  *    least 1000 units of delivery time.  The resulting bandwidth is
  *    handed to bbr_lt_bw_samp_done().
  *
  * The numeric "reason" passed to bbr_log_type_ltbw() identifies which
  * exit was taken.
  */
 static void
 bbr_lt_bw_sampling(struct tcp_bbr *bbr, uint32_t cts, int32_t loss_detected)
 {
 	uint32_t diff, d_time;
 	uint64_t del_time, bw, lost, delivered;
 
 	if (bbr->r_use_policer == 0)
 		return;
 	if (bbr->rc_lt_use_bw) {
 		/* We are using lt bw do we stop yet? */
 		diff = bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_lt_epoch_use;
 		if (diff > bbr_lt_bw_max_rtts) {
 			/* Reset it all */
 			/* Also reached from the false-positive check below. */
 reset_all:
 			bbr_reset_lt_bw_sampling(bbr, cts);
 			if (bbr->rc_filled_pipe) {
 				bbr_set_epoch(bbr, cts, __LINE__);
 				bbr->rc_bbr_substate = bbr_pick_probebw_substate(bbr, cts);
 				bbr_substate_change(bbr, cts, __LINE__, 0);
 				bbr->rc_bbr_state = BBR_STATE_PROBE_BW;
 				bbr_log_type_statechange(bbr, cts, __LINE__);
 			} else {
 				/*
 				 * This should not happen really
 				 * unless we remove the startup/drain
 				 * restrictions above.
 				 */
 				bbr->rc_bbr_state = BBR_STATE_STARTUP;
 				bbr_set_epoch(bbr, cts, __LINE__);
 				bbr->r_ctl.rc_bbr_state_time = cts;
 				bbr->r_ctl.rc_lost_at_startup = bbr->r_ctl.rc_lost;
 				bbr->r_ctl.rc_bbr_hptsi_gain = bbr->r_ctl.rc_startup_pg;
 				bbr->r_ctl.rc_bbr_cwnd_gain = bbr->r_ctl.rc_startup_pg;
 				bbr_set_state_target(bbr, __LINE__);
 				bbr_log_type_statechange(bbr, cts, __LINE__);
 			}
 			/* reason 0 is to stop using lt-bw */
 			bbr_log_type_ltbw(bbr, cts, 0, 0, 0, 0, 0);
 			return;
 		}
 		if (bbr_lt_intvl_fp == 0) {
 			/* Not doing false-positive detection */
 			return;
 		}
 		/* False positive detection */
 		if (diff == bbr_lt_intvl_fp) {
 			/* At bbr_lt_intvl_fp we record the lost */
 			bbr->r_ctl.rc_lt_del = bbr->r_ctl.rc_delivered;
 			bbr->r_ctl.rc_lt_lost = bbr->r_ctl.rc_lost;
 		} else if (diff > (bbr_lt_intvl_min_rtts + bbr_lt_intvl_fp)) {
 			/* Now is our loss rate still high? */
 			lost = bbr->r_ctl.rc_lost - bbr->r_ctl.rc_lt_lost;
 			delivered = bbr->r_ctl.rc_delivered - bbr->r_ctl.rc_lt_del;
 			if ((delivered == 0) ||
 			    (((lost * 1000)/delivered) < bbr_lt_fd_thresh)) {
 				/* No, it is below our threshold (reason 7) */
 				bbr_log_type_ltbw(bbr, cts, 7, lost, delivered, 0, 0);
 			} else {
 				/* Yikes, it's still high; it must be a false positive (reason 8) */
 				bbr_log_type_ltbw(bbr, cts, 8, lost, delivered, 0, 0);
 				goto reset_all;
 			}
 		}
 		return;
 	}
 	/*
 	 * Wait for the first loss before sampling, to let the policer
 	 * exhaust its tokens and estimate the steady-state rate allowed by
 	 * the policer. Starting samples earlier includes bursts that
 	 * over-estimate the bw.
 	 */
 	if (bbr->rc_lt_is_sampling == 0) {
 		/* reason 1 is to begin doing the sampling  */
 		if (loss_detected == 0)
 			return;
 		bbr_reset_lt_bw_interval(bbr, cts);
 		bbr->rc_lt_is_sampling = 1;
 		bbr_log_type_ltbw(bbr, cts, 1, 0, 0, 0, 0);
 		return;
 	}
 	/* Now how long have we been delivering in this interval? */
 	if (TSTMP_GEQ(bbr->r_ctl.rc_del_time, bbr->r_ctl.rc_lt_time))
 		d_time = bbr->r_ctl.rc_del_time - bbr->r_ctl.rc_lt_time;
 	else
 		d_time = 0;
 
 	/* To avoid underestimates, reset sampling if we run out of data. */
 	if (bbr->r_ctl.r_app_limited_until) {
 		/* Can not measure in app-limited state */
 		bbr_reset_lt_bw_sampling(bbr, cts);
 		/* reason 2 is to reset sampling due to app limits  */
 		bbr_log_type_ltbw(bbr, cts, 2, 0, 0, 0, d_time);
 		return;
 	}
 	/* Packet epochs elapsed since the sampling interval began. */
 	diff = bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_lt_epoch;
 	if (diff < bbr_lt_intvl_min_rtts) {
 		/*
 		 * need more samples (we don't
 		 * start on a round like linux so
 		 * we need 1 more).
 		 */
 		/* 6 is not_enough time or no-loss */
 		bbr_log_type_ltbw(bbr, cts, 6, 0, 0, 0, d_time);
 		return;
 	}
 	if (diff > (4 * bbr_lt_intvl_min_rtts)) {
 		/*
 		 * For now if we wait too long, reset all sampling. We need
 		 * to do some research here, it's possible that we should
 		 * base this on how much loss has occurred.. something like
 		 * if it's under 10% (or some thresh) reset all otherwise
 		 * don't.  That's for phase II I guess.
 		 */
 		bbr_reset_lt_bw_sampling(bbr, cts);
  		/* reason 3 is to reset sampling due to too long a sampling interval */
 		bbr_log_type_ltbw(bbr, cts, 3, 0, 0, 0, d_time);
 		return;
 	}
 	/*
 	 * End sampling interval when a packet is lost, so we estimate the
 	 * policer tokens were exhausted. Stopping the sampling before the
 	 * tokens are exhausted under-estimates the policed rate.
 	 */
 	if (loss_detected == 0) {
 		/* 6 is not_enough time or no-loss */
 		bbr_log_type_ltbw(bbr, cts, 6, 0, 0, 0, d_time);
 		return;
 	}
 	/* Calculate packets lost and delivered in sampling interval. */
 	lost = bbr->r_ctl.rc_lost - bbr->r_ctl.rc_lt_lost;
 	delivered = bbr->r_ctl.rc_delivered - bbr->r_ctl.rc_lt_del;
 	/* Loss rate (in tenths of a percent) must reach bbr_lt_loss_thresh. */
 	if ((delivered == 0) ||
 	    (((lost * 1000)/delivered) < bbr_lt_loss_thresh)) {
 		bbr_log_type_ltbw(bbr, cts, 6, lost, delivered, 0, d_time);
 		return;
 	}
 	if (d_time < 1000) {
 		/* Not enough time. wait */
 		/* 6 is not_enough time or no-loss */
 		bbr_log_type_ltbw(bbr, cts, 6, 0, 0, 0, d_time);
 		return;
 	}
 	if (d_time >= (0xffffffff / USECS_IN_MSEC)) {
 		/* Too long */
 		bbr_reset_lt_bw_sampling(bbr, cts);
  		/* reason 3 is to reset sampling due to too long a sampling interval */
 		bbr_log_type_ltbw(bbr, cts, 3, 0, 0, 0, d_time);
 		return;
 	}
 	/* bw = delivered * USECS_IN_SECOND / d_time; d_time >= 1000 here. */
 	del_time = d_time;
 	bw = delivered;
 	bw *= (uint64_t)USECS_IN_SECOND;
 	bw /= del_time;
 	bbr_lt_bw_samp_done(bbr, bw, cts, d_time);
 }
 
 /*
  * Obtain a sendmap entry.
  *
  * A zeroed entry is requested from bbr_zone without sleeping; on
  * success the per-connection allocation count is bumped.  If the zone
  * cannot satisfy the request, the first entry on the connection's own
  * free list is used instead (when there is one).  Returns NULL when
  * both sources are exhausted.
  */
 static struct bbr_sendmap *
 bbr_alloc(struct tcp_bbr *bbr)
 {
 	struct bbr_sendmap *rsm;
 
 	BBR_STAT_INC(bbr_to_alloc);
 	rsm = uma_zalloc(bbr_zone, (M_NOWAIT | M_ZERO));
 	if (rsm != NULL) {
 		bbr->r_ctl.rc_num_maps_alloced++;
 		return (rsm);
 	}
 	if (bbr->r_ctl.rc_free_cnt == 0) {
 		/* Nothing in reserve either. */
 		BBR_STAT_INC(bbr_to_alloc_failed);
 		return (NULL);
 	}
 	/* Dip into the connection's reserve list. */
 	BBR_STAT_INC(bbr_to_alloc_emerg);
 	rsm = TAILQ_FIRST(&bbr->r_ctl.rc_free);
 	TAILQ_REMOVE(&bbr->r_ctl.rc_free, rsm, r_next);
 	bbr->r_ctl.rc_free_cnt--;
 	return (rsm);
 }
 
 /*
  * Allocate a sendmap entry unless the connection already holds
  * V_tcp_map_entries_limit entries (a limit of 0 or less disables the
  * check).  When the limit is hit, NULL is returned and the limit
  * statistics are updated; the per-connection counter is bumped only the
  * first time.
  */
 static struct bbr_sendmap *
 bbr_alloc_full_limit(struct tcp_bbr *bbr)
 {
 	if ((V_tcp_map_entries_limit <= 0) ||
 	    (bbr->r_ctl.rc_num_maps_alloced < V_tcp_map_entries_limit))
 		return (bbr_alloc(bbr));
 
 	BBR_STAT_INC(bbr_alloc_limited);
 	if (bbr->alloc_limit_reported == 0) {
 		bbr->alloc_limit_reported = 1;
 		BBR_STAT_INC(bbr_alloc_limited_conns);
 	}
 	return (NULL);
 }
 
 /*
  * Allocate a sendmap entry subject to a specific limit type.
  *
  * Only one limit type exists: when limit_type is non-zero and
  * V_tcp_map_split_limit is positive, the allocation is refused once
  * rc_num_split_allocs has reached that limit.  A successful limited
  * allocation is tagged with limit_type and counted against the split
  * total.
  */
 static struct bbr_sendmap *
 bbr_alloc_limit(struct tcp_bbr *bbr, uint8_t limit_type)
 {
 	struct bbr_sendmap *rsm;
 
 	if (limit_type && (V_tcp_map_split_limit > 0) &&
 	    (bbr->r_ctl.rc_num_split_allocs >= V_tcp_map_split_limit)) {
 		BBR_STAT_INC(bbr_split_limited);
 		if (bbr->alloc_limit_reported == 0) {
 			bbr->alloc_limit_reported = 1;
 			BBR_STAT_INC(bbr_alloc_limited_conns);
 		}
 		return (NULL);
 	}
 
 	rsm = bbr_alloc(bbr);
 	if (limit_type && (rsm != NULL)) {
 		/* Remember which limit this entry counts against. */
 		rsm->r_limit_type = limit_type;
 		bbr->r_ctl.rc_num_split_allocs++;
 	}
 	return (rsm);
 }
 
 /*
  * Release a sendmap entry.
  *
  * The split/small-map counters are adjusted and any cached pointer in
  * r_ctl that still refers to the entry is cleared.  The entry is then
  * either zeroed and parked on the connection's free list (while that
  * list holds fewer than bbr_min_req_free entries) or returned to
  * bbr_zone.
  */
 static void
 bbr_free(struct tcp_bbr *bbr, struct bbr_sendmap *rsm)
 {
 	/* Undo the accounting done when the entry was set up. */
 	if (rsm->r_limit_type) {
 		/* currently there is only one limit type */
 		bbr->r_ctl.rc_num_split_allocs--;
 	}
 	if (rsm->r_is_smallmap) {
 		bbr->r_ctl.rc_num_small_maps_alloced--;
 	}
 
 	/* Make sure nothing keeps pointing at the entry. */
 	if (bbr->r_ctl.rc_sacklast == rsm) {
 		bbr->r_ctl.rc_sacklast = NULL;
 	}
 	if (bbr->r_ctl.rc_next == rsm) {
 		bbr->r_ctl.rc_next = NULL;
 	}
 	if (bbr->r_ctl.rc_resend == rsm) {
 		bbr->r_ctl.rc_resend = NULL;
 	}
 	if (bbr->r_ctl.rc_tlp_send == rsm) {
 		bbr->r_ctl.rc_tlp_send = NULL;
 	}
 
 	if (bbr->r_ctl.rc_free_cnt >= bbr_min_req_free) {
 		/* The reserve is full: hand the entry back to the zone. */
 		bbr->r_ctl.rc_num_maps_alloced--;
 		uma_zfree(bbr_zone, rsm);
 		return;
 	}
 	/* Keep the entry, zeroed, in the connection's reserve. */
 	memset(rsm, 0, sizeof(*rsm));
 	TAILQ_INSERT_TAIL(&bbr->r_ctl.rc_free, rsm, r_next);
 	rsm->r_limit_type = 0;
 	bbr->r_ctl.rc_free_cnt++;
 }
 
 /*
  * Return the bandwidth-delay product.
  *
  * Given bw in bytes per second and rtt in microseconds, this is the
  * number of bytes that must be in flight per RTT to sustain that rate;
  * any gain is applied by the caller on top of it.
  *
  * The multiplication does not overflow as long as bw is below 1 TByte
  * per second (bw < 10**12 = 2**40) and rtt is below 1000 seconds
  * (rtt < 10**3 * 10**6 = 10**9 = 2**30).
  */
 static uint64_t
 bbr_get_bw_delay_prod(uint64_t rtt, uint64_t bw)
 {
 	const uint64_t usecs = USECS_IN_SECOND;
 
 	return ((rtt * bw) / usecs);
 }
 
 /*
  * Return the initial congestion window in bytes.
  *
  * Precedence: a per-connection rc_init_win (in segments), then
  * V_tcp_initcwnd_segments, then the RFC 3390 formula when
  * V_tcp_do_rfc3390 is set, and finally the RFC 5681 section 3.1 table.
  */
 static uint32_t
 bbr_initial_cwnd(struct tcp_bbr *bbr, struct tcpcb *tp)
 {
 	if (bbr->rc_init_win)
 		return (bbr->rc_init_win * tp->t_maxseg);
 
 	if (V_tcp_initcwnd_segments)
 		return (min((V_tcp_initcwnd_segments * tp->t_maxseg),
 		    max(2 * tp->t_maxseg, 14600)));
 
 	if (V_tcp_do_rfc3390)
 		return (min(4 * tp->t_maxseg,
 		    max(2 * tp->t_maxseg, 4380)));
 
 	/* Per RFC5681 Section 3.1 */
 	if (tp->t_maxseg > 2190)
 		return (2 * tp->t_maxseg);
 	if (tp->t_maxseg > 1095)
 		return (3 * tp->t_maxseg);
 	return (4 * tp->t_maxseg);
 }
 
 /*
  * Return the target cwnd for the given gain and bandwidth, without any
  * rounding or minimum applied.
  *
  * The result is BDP(rtt, bw) * gain / BBR_UNIT, rounded up, where rtt
  * is selected by bbr_cwndtarget_rtt_touse.  The initial cwnd is
  * returned instead while there is no RTT measurement or the delivery
  * rate filter is still empty.
  */
 static uint32_t
 bbr_get_raw_target_cwnd(struct tcp_bbr *bbr, uint32_t gain, uint64_t bw)
 {
 	uint64_t bdp, rtt, scaled;
 
 	if ((get_filter_value_small(&bbr->r_ctl.rc_rttprop) == 0xffffffff) ||
 	    (bbr_get_full_bw(bbr) == 0)) {
 		/* No measurements yet */
 		return (bbr_initial_cwnd(bbr, bbr->rc_tp));
 	}
 	/* Bytes needed per RTT (the RTT used is normally rttProp). */
 	rtt = bbr_get_rtt(bbr, bbr_cwndtarget_rtt_touse);
 	bdp = bbr_get_bw_delay_prod(rtt, bw);
 	/* Apply the gain, rounding up to a whole byte. */
 	scaled = bdp * ((uint64_t)gain);
 	scaled += (uint64_t)(BBR_UNIT - 1);
 	scaled /= (uint64_t)BBR_UNIT;
 
 	return ((uint32_t)scaled);
 }
 
 /*
  * Return the target cwnd for bandwidth bw at the given gain.
  *
  * The raw gain-scaled BDP is rounded up to a multiple of the effective
  * mss (the smaller of the segment size less options and
  * rc_pace_max_segs), bbr_quanta pacing quanta are added, and in google
  * mode the extra adjustments below are applied.  The result is never
  * less than get_min_cwnd().
  */
 static uint32_t
 bbr_get_target_cwnd(struct tcp_bbr *bbr, uint64_t bw, uint32_t gain)
 {
 	uint32_t cwnd, mss;
 
 	mss = min((bbr->rc_tp->t_maxseg - bbr->rc_last_options), bbr->r_ctl.rc_pace_max_segs);
 	/*
 	 * Get the base cwnd with gain rounded to a mss.
 	 *
 	 * bbr_get_raw_target_cwnd() takes (bbr, gain, bw), the reverse of
 	 * this function's (bbr, bw, gain).  Passing them in this
 	 * function's order would truncate bw to 32 bits and compute the
 	 * BDP from rtt * gain, discarding most of its precision in the
 	 * divide by USECS_IN_SECOND.
 	 */
 	cwnd = roundup(bbr_get_raw_target_cwnd(bbr, gain, bw), mss);
 	/*
 	 * Add in N (2 default since we do not have a
 	 * fq layer to trap packets in) quanta's per the I-D
 	 * section 4.2.3.2 quanta adjust.
 	 */
 	cwnd += (bbr_quanta * bbr->r_ctl.rc_pace_max_segs);
 	if (bbr->rc_use_google) {
 		if((bbr->rc_bbr_state == BBR_STATE_PROBE_BW) &&
 		   (bbr_state_val(bbr) == BBR_SUB_GAIN)) {
 			/*
 			 * The linux implementation adds
 			 * an extra 2 x mss in the gain cycle, which
 			 * is documented nowhere except in the code,
 			 * so we add the same here.
 			 */
 			cwnd += 2 * mss;
 		}
 		if ((cwnd / mss) & 0x1) {
 			/* Round up for odd num mss */
 			cwnd += mss;
 		}
 	}
 	/* Are we below the min cwnd? */
 	if (cwnd < get_min_cwnd(bbr))
 		return (get_min_cwnd(bbr));
 	return (cwnd);
 }
 
 /*
  * Clamp a gain value so that it is never below 1.  bbr is not used.
  */
 static uint16_t
 bbr_gain_adjust(struct tcp_bbr *bbr, uint16_t gain)
 {
 	return ((gain < 1) ? 1 : gain);
 }
 
 /*
  * Return the per-segment header overhead in bytes that the connection
  * is configured to account for: TCP header plus options
  * (rc_inc_tcp_oh), IPv6 or IPv4 header (rc_inc_ip_oh) and ethernet
  * header (rc_inc_enet_oh).  Each part is included only when its flag is
  * set.
  */
 static uint32_t
 bbr_get_header_oh(struct tcp_bbr *bbr)
 {
 	int overhead = 0;
 
 	/* TCP header and the options last sent. */
 	if (bbr->r_ctl.rc_inc_tcp_oh) {
 		overhead = (bbr->rc_last_options + sizeof(struct tcphdr));
 	}
 	/* Network layer header for the address family in use. */
 	if (bbr->r_ctl.rc_inc_ip_oh) {
 #ifdef INET6
 		if (bbr->r_is_v6) {
 			overhead += sizeof(struct ip6_hdr);
 		} else
 #endif
 		{
 #ifdef INET
 			overhead += sizeof(struct ip);
 #endif
 		}
 	}
 	/* Link layer header. */
 	if (bbr->r_ctl.rc_inc_enet_oh) {
 		overhead += sizeof(struct ether_header);
 	}
 	return (overhead);
 }
 
 /*
  * Return how many bytes can be paced out in useconds_time microseconds
  * at bandwidth bw scaled by gain (gain is in units of BBR_UNIT and is
  * clamped to at least 1).  A zero interval yields 0; otherwise the
  * result is at least 1.
  */
 static uint32_t
 bbr_get_pacing_length(struct tcp_bbr *bbr, uint16_t gain, uint32_t useconds_time, uint64_t bw)
 {
 	uint64_t scale, bytes;
 
 	if (useconds_time == 0)
 		return (0);
 
 	gain = bbr_gain_adjust(bbr, gain);
 	scale = (uint64_t)USECS_IN_SECOND * (uint64_t)BBR_UNIT;
 	bytes = ((uint64_t)useconds_time * bw * gain) / scale;
 	return ((bytes == 0) ? 1 : (uint32_t)bytes);
 }
 
 /*
  * Return the delay in microseconds to leave after sending len bytes so
  * that packets are spaced evenly at the current bandwidth scaled by
  * gain.
  *
  * Outside google mode the configured header overhead is added per
  * segment, and the delay is capped at
  * srtt * bbr_hptsi_max_mul / bbr_hptsi_max_div when both tunables are
  * non-zero.  In google mode the bandwidth is first reduced by the
  * google discount.  A len of 0 yields 0; otherwise the delay is at
  * least 1.  The calculation is logged unless nolog is set.
  */
 static uint32_t
 bbr_get_pacing_delay(struct tcp_bbr *bbr, uint16_t gain, int32_t len, uint32_t cts, int nolog)
 {
 	uint64_t bw, scaled_len, delay;
 	uint32_t usecs, srtt, capped;
 	uint32_t hdr_oh, segs, seg_size;
 
 	if (len == 0)
 		return (0);
 
 	capped = 0;
 	seg_size = bbr->rc_tp->t_maxseg - bbr->rc_last_options;
 	segs = (len + seg_size - 1) / seg_size;
 	if (bbr->rc_use_google == 0) {
 		/* Count the per-segment headers as bytes on the wire. */
 		hdr_oh = bbr_get_header_oh(bbr);
 		len += (segs * hdr_oh);
 	}
 	gain = bbr_gain_adjust(bbr, gain);
 	bw = bbr_get_bw(bbr);
 	if (bbr->rc_use_google) {
 		uint64_t discounted;
 
 		/*
 		 * Apply the google discount factor to the b/w
 		 * (a factor of 10 is 1%).
 		 */
 		discounted = bw *  (uint64_t)(1000 - bbr->r_ctl.bbr_google_discount);
 		discounted /= (uint64_t)1000;
 		/* A discount that would leave nothing is ignored. */
 		if (discounted > 0)
 			bw = discounted;
 	}
 	scaled_len = ((uint64_t)len *
 	    (uint64_t)USECS_IN_SECOND *
 	    (uint64_t)BBR_UNIT);
 	delay = scaled_len / ((uint64_t)gain * bw);
 	if (delay == 0)
 		delay = 1;
 	usecs = (uint32_t)delay;
 	srtt = bbr_get_rtt(bbr, BBR_SRTT);
 	if (bbr_hptsi_max_mul && bbr_hptsi_max_div &&
 	    (bbr->rc_use_google == 0) &&
 	    (usecs > ((srtt * bbr_hptsi_max_mul) / bbr_hptsi_max_div))) {
 		/*
 		 * The delay may not exceed the configured fraction of
 		 * the srtt, otherwise we cannot pace out or send
 		 * properly.
 		 */
 		usecs = (srtt * bbr_hptsi_max_mul) / bbr_hptsi_max_div;
 		capped = usecs;
 		BBR_STAT_INC(bbr_hpts_min_time);
 	}
 	if (nolog == 0)
 		bbr_log_pacing_delay_calc(bbr, gain, len, cts, usecs, bw, capped, 1);
 	return (usecs);
 }
 
 /*
  * Update tp->snd_cwnd in response to an ACK.
  *
  * bytes_this_ack plus sack_changed, less prev_acked, is the amount
  * credited for this ACK.  The target cwnd is derived from the
  * delivery-rate filter and the current cwnd gain (or is the initial
  * cwnd when the filter is empty).
  *
  *  - In PROBE_RTT (with no probe-rtt gain value set, or in google
  *    mode) nothing is changed.
  *  - In recovery, cwnd is reduced by losses (never below one segment)
  *    and, while packet conservation is active (until one rttProp after
  *    recovery began), cwnd is set to at least flight + newly acked
  *    bytes and the function returns.
  *  - Once the pipe has been filled, cwnd moves toward the target and
  *    may shrink to it when permitted.
  *  - Otherwise (still in startup) cwnd grows by the bytes acked while
  *    below target or within the initial window.
  *
  * The final cwnd is never below get_min_cwnd().  The caller must hold
  * the inpcb write lock.
  */
 static void
 bbr_ack_received(struct tcpcb *tp, struct tcp_bbr *bbr, struct tcphdr *th, uint32_t bytes_this_ack,
 		 uint32_t sack_changed, uint32_t prev_acked, int32_t line, uint32_t losses)
 {
 	uint64_t bw;
 	uint32_t cwnd, target_cwnd, saved_bytes, maxseg;
 	int32_t meth;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 #ifdef STATS
 	if ((tp->t_flags & TF_GPUTINPROG) &&
 	    SEQ_GEQ(th->th_ack, tp->gput_ack)) {
 		/*
 		 * Stretch acks and compressed acks will cause this to
 		 * oscillate but we are doing it the same way as the main
 		 * stack so it will be comparable (though possibly not
 		 * ideal).
 		 */
 		int32_t cgput;
 		int64_t gput, time_stamp;
 
 		gput = (int64_t) (th->th_ack - tp->gput_seq) * 8;
 		time_stamp = max(1, ((bbr->r_ctl.rc_rcvtime - tp->gput_ts) / 1000));
 		cgput = gput / time_stamp;
 		stats_voi_update_abs_u32(tp->t_stats, VOI_TCP_GPUT,
 					 cgput);
 		if (tp->t_stats_gput_prev > 0)
 			stats_voi_update_abs_s32(tp->t_stats,
 						 VOI_TCP_GPUT_ND,
 						 ((gput - tp->t_stats_gput_prev) * 100) /
 						 tp->t_stats_gput_prev);
 		tp->t_flags &= ~TF_GPUTINPROG;
 		tp->t_stats_gput_prev = cgput;
 	}
 #endif
 	if ((bbr->rc_bbr_state == BBR_STATE_PROBE_RTT) &&
 	    ((bbr->r_ctl.bbr_rttprobe_gain_val == 0) || bbr->rc_use_google)) {
 		/* We don't change anything in probe-rtt */
 		return;
 	}
 	maxseg = tp->t_maxseg - bbr->rc_last_options;
 	/* Keep the caller's value for logging; bytes_this_ack is adjusted below. */
 	saved_bytes = bytes_this_ack;
 	bytes_this_ack += sack_changed;
 	if (bytes_this_ack > prev_acked) {
 		bytes_this_ack -= prev_acked;
 		/*
 		 * A byte ack'd gives us a full mss
 		 * to be like linux i.e. they count packets.
 		 */
 		if ((bytes_this_ack < maxseg) && bbr->rc_use_google)
 			bytes_this_ack = maxseg;
 	} else {
 		/* Unlikely */
 		bytes_this_ack = 0;
 	}
 	cwnd = tp->snd_cwnd;
 	bw = get_filter_value(&bbr->r_ctl.rc_delrate);
 	if (bw)
 		target_cwnd = bbr_get_target_cwnd(bbr,
 						  bw,
 						  (uint32_t)bbr->r_ctl.rc_bbr_cwnd_gain);
 	else
 		target_cwnd = bbr_initial_cwnd(bbr, bbr->rc_tp);
 	if (IN_RECOVERY(tp->t_flags) &&
 	    (bbr->bbr_prev_in_rec == 0)) {
 		/*
 		 * We are entering recovery and
 		 * thus packet conservation.
 		 */
 		bbr->pkt_conservation = 1;
 		bbr->r_ctl.rc_recovery_start = bbr->r_ctl.rc_rcvtime;
 		cwnd = ctf_flight_size(tp,
 				       (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes)) +
 			bytes_this_ack;
 	}
 	if (IN_RECOVERY(tp->t_flags)) {
 		uint32_t flight;
 
 		bbr->bbr_prev_in_rec = 1;
 		/* Take the losses out of cwnd, keeping at least one segment. */
 		if (cwnd > losses) {
 			cwnd -= losses;
 			if (cwnd < maxseg)
 				cwnd = maxseg;
 		} else
 			cwnd = maxseg;
 		flight = ctf_flight_size(tp,
 					 (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 		bbr_log_type_cwndupd(bbr, flight, 0,
 				     losses, 10, 0, 0, line);
 		if (bbr->pkt_conservation) {
 			uint32_t time_in;
 
 			if (TSTMP_GEQ(bbr->r_ctl.rc_rcvtime, bbr->r_ctl.rc_recovery_start))
 				time_in = bbr->r_ctl.rc_rcvtime - bbr->r_ctl.rc_recovery_start;
 			else
 				time_in = 0;
 
 			if (time_in >= bbr_get_rtt(bbr, BBR_RTT_PROP)) {
 				/* Clear packet conservation after an rttProp */
 				bbr->pkt_conservation = 0;
 			} else {
 				/* Still conserving: cwnd follows what is in flight. */
 				if ((flight + bytes_this_ack) > cwnd)
 					cwnd = flight + bytes_this_ack;
 				if (cwnd < get_min_cwnd(bbr))
 					cwnd = get_min_cwnd(bbr);
 				tp->snd_cwnd = cwnd;
 				bbr_log_type_cwndupd(bbr, saved_bytes, sack_changed,
 						     prev_acked, 1, target_cwnd, th->th_ack, line);
 				return;
 			}
 		}
 	} else
 		bbr->bbr_prev_in_rec = 0;
 	/* While growth is restricted, credit at most one segment per ACK. */
 	if ((bbr->rc_use_google == 0) && bbr->r_ctl.restrict_growth) {
 		bbr->r_ctl.restrict_growth--;
 		if (bytes_this_ack > maxseg)
 			bytes_this_ack = maxseg;
 	}
 	if (bbr->rc_filled_pipe) {
 		/*
 		 * Here we have exited startup and filled the pipe. We will
 		 * thus allow the cwnd to shrink to the target. We hit here
 		 * mostly.
 		 */
 		uint32_t s_cwnd;
 
 		meth = 2;
 		s_cwnd = min((cwnd + bytes_this_ack), target_cwnd);
 		if (s_cwnd > cwnd)
 			cwnd = s_cwnd;
 		else if (bbr_cwnd_may_shrink || bbr->rc_use_google || bbr->rc_no_pacing)
 			cwnd = s_cwnd;
 	} else {
 		/*
 		 * Here we are still in startup, we increase cwnd by what
 		 * has been acked.
 		 */
 		if ((cwnd < target_cwnd) ||
 		    (bbr->rc_past_init_win == 0)) {
 			meth = 3;
 			cwnd += bytes_this_ack;
 		} else {
 			/*
 			 * Method 4 means we are at target so no gain in
 			 * startup and past the initial window.
 			 */
 			meth = 4;
 		}
 	}
 	tp->snd_cwnd = max(cwnd, get_min_cwnd(bbr));
 	bbr_log_type_cwndupd(bbr, saved_bytes, sack_changed, prev_acked, meth, target_cwnd, th->th_ack, line);
 }
 
 /*
  * Handle a partial ACK: request output (r_wanted_output) when the bytes
  * in flight, excluding sacked and lost bytes, fit within the congestion
  * window.  The caller must hold the inpcb write lock.
  */
 static void
 tcp_bbr_partialack(struct tcpcb *tp)
 {
 	struct tcp_bbr *bbr;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	if (ctf_flight_size(tp,
 	    (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes)) > tp->snd_cwnd)
 		return;
 	bbr->r_wanted_output = 1;
 }
 
 /*
  * Leave loss recovery.
  *
  * Clears the recovery flags and packet-conservation state, restores
  * cwnd (or, in PROBE_RTT, the saved cwnd) to at least the value it had
  * on entry to recovery and then, outside google mode and when
  * bbr_do_red is set, applies a reduction to the cwnd based on the
  * observed loss rate (or on bbr_red_mul / bbr_red_div when no loss rate
  * is available).  Finally the accumulated recovery loss rate is
  * cleared, output is requested if the flight fits in the cwnd, and the
  * TSO size is re-checked.  The caller must hold the inpcb write lock.
  */
 static void
 bbr_post_recovery(struct tcpcb *tp)
 {
 	struct tcp_bbr *bbr;
 	uint32_t  flight;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	/*
 	 * Here we just exit recovery.
 	 */
 	EXIT_RECOVERY(tp->t_flags);
 	/* Stop using the recovery (reduced) bandwidth */
 	bbr->r_recovery_bw = 0;
 	tp->snd_recover = tp->snd_una;
 	tcp_bbr_tso_size_check(bbr, bbr->r_ctl.rc_rcvtime);
 	bbr->pkt_conservation = 0;
 	if (bbr->rc_use_google == 0) {
 		/*
 		 * For non-google mode lets
 		 * go ahead and make sure we clear
 		 * the recovery state so if we
 		 * bounce back in to recovery we
 		 * will do PC.
 		 */
 		bbr->bbr_prev_in_rec = 0;
 	}
 	bbr_log_type_exit_rec(bbr);
 	if (bbr->rc_bbr_state != BBR_STATE_PROBE_RTT) {
 		tp->snd_cwnd = max(tp->snd_cwnd, bbr->r_ctl.rc_cwnd_on_ent);
 		bbr_log_type_cwndupd(bbr, 0, 0, 0, 15, 0, 0, __LINE__);
 	} else {
 		/* For probe-rtt case lets fix up its saved_cwnd */
 		if (bbr->r_ctl.rc_saved_cwnd < bbr->r_ctl.rc_cwnd_on_ent) {
 			bbr->r_ctl.rc_saved_cwnd = bbr->r_ctl.rc_cwnd_on_ent;
 			bbr_log_type_cwndupd(bbr, 0, 0, 0, 16, 0, 0, __LINE__);
 		}
 	}
 	flight = ctf_flight_size(tp,
 		     (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 	if ((bbr->rc_use_google == 0) &&
 	    bbr_do_red) {
 		uint64_t val, lr2use;
 		uint32_t maxseg, newcwnd, acks_inflight, ratio, cwnd;
 		uint32_t *cwnd_p;
 
 		/* ratio = rttProp / srtt, scaled by 1000 (1000 when srtt is 0). */
 		if (bbr_get_rtt(bbr, BBR_SRTT)) {
 			val = ((uint64_t)bbr_get_rtt(bbr, BBR_RTT_PROP) * (uint64_t)1000);
 			val /= bbr_get_rtt(bbr, BBR_SRTT);
 			ratio = (uint32_t)val;
 		} else
 			ratio = 1000;
 
 		bbr_log_type_cwndupd(bbr, bbr_red_mul, bbr_red_div,
 				     bbr->r_ctl.recovery_lr, 21,
 				     ratio,
 				     bbr->r_ctl.rc_red_cwnd_pe,
 				     __LINE__);
 		/*
 		 * No reduction when the ratio is below bbr_do_red.  The
 		 * (bbr_do_red == 0) test cannot be true here since the
 		 * enclosing condition already requires it to be non-zero.
 		 */
 		if ((ratio < bbr_do_red) || (bbr_do_red == 0))
 			goto done;
 		if (((bbr->rc_bbr_state == BBR_STATE_PROBE_RTT) &&
 		     bbr_prtt_slam_cwnd) ||
 		    (bbr_sub_drain_slam_cwnd &&
 		     (bbr->rc_bbr_state == BBR_STATE_PROBE_BW) &&
 		     bbr->rc_hit_state_1 &&
 		     (bbr_state_val(bbr) == BBR_SUB_DRAIN)) ||
 		    ((bbr->rc_bbr_state == BBR_STATE_DRAIN) &&
 		     bbr_slam_cwnd_in_main_drain)) {
 			/*
 			 * Here we must poke at the saved cwnd
 			 * as well as the cwnd.
 			 */
 			cwnd = bbr->r_ctl.rc_saved_cwnd;
 			cwnd_p = &bbr->r_ctl.rc_saved_cwnd;
 		} else {
  			cwnd = tp->snd_cwnd;
 			cwnd_p = &tp->snd_cwnd;
 		}
 		maxseg = tp->t_maxseg - bbr->rc_last_options;
 		/* Add the overall lr with the recovery lr */
 		if (bbr->r_ctl.rc_lost == 0)
 			lr2use = 0;
 		else if (bbr->r_ctl.rc_delivered == 0)
 			lr2use = 1000;
 		else {
 			lr2use = bbr->r_ctl.rc_lost * 1000;
 			lr2use /= bbr->r_ctl.rc_delivered;
 		}
 		lr2use += bbr->r_ctl.recovery_lr;
 		/* One ack expected per two segments in flight. */
 		acks_inflight = (flight / (maxseg * 2));
 		if (bbr_red_scale) {
 			/* Scale the loss rate by srtt / bbr_red_scale. */
 			lr2use *= bbr_get_rtt(bbr, BBR_SRTT);
 			lr2use /= bbr_red_scale;
 			if ((bbr_red_growth_restrict) &&
 			    ((bbr_get_rtt(bbr, BBR_SRTT)/bbr_red_scale) > 1))
 			    bbr->r_ctl.restrict_growth += acks_inflight;
 		}
 		if (lr2use) {
 			/* Reduce cwnd by the loss rate (lr2use is out of 1000). */
 			val = (uint64_t)cwnd * lr2use;
 			val /= 1000;
 			if (cwnd > val)
 				newcwnd = roundup((cwnd - val), maxseg);
 			else
 				newcwnd = maxseg;
 		} else {
 			/* No loss rate to go on: use the fixed mul/div reduction. */
 			val = (uint64_t)cwnd * (uint64_t)bbr_red_mul;
 			val /= (uint64_t)bbr_red_div;
 			newcwnd = roundup((uint32_t)val, maxseg);
 		}
 		/* with standard delayed acks how many acks can I expect? */
 		if (bbr_drop_limit == 0) {
 			/*
 			 * Anticipate how much we will
 			 * raise the cwnd based on the acks.
 			 */
 			if ((newcwnd + (acks_inflight * maxseg)) < get_min_cwnd(bbr)) {
 				/* We do enforce the min (with the acks) */
 				/*
 				 * NOTE(review): the test above counts
 				 * acks_inflight in bytes (* maxseg) but the
 				 * subtraction below uses the bare ack count;
 				 * looks like a units mismatch -- confirm
 				 * which is intended.
 				 */
 				newcwnd = (get_min_cwnd(bbr) - acks_inflight);
 			}
 		} else {
 			/*
 			 * A strict drop limit of N is in place
 			 */
 			if (newcwnd < (bbr_drop_limit * maxseg)) {
 				newcwnd = bbr_drop_limit * maxseg;
 			}
 		}
 		/* Store the new value through whichever cwnd was selected above */
 		*cwnd_p = newcwnd;
 		if (tp->snd_cwnd > newcwnd)
 			tp->snd_cwnd = newcwnd;
 		bbr_log_type_cwndupd(bbr, bbr_red_mul, bbr_red_div, val, 22,
 				     (uint32_t)lr2use,
 				     bbr_get_rtt(bbr, BBR_SRTT), __LINE__);
 		bbr->r_ctl.rc_red_cwnd_pe = bbr->r_ctl.rc_pkt_epoch;
 	}
 done:
 	bbr->r_ctl.recovery_lr = 0;
 	if (flight <= tp->snd_cwnd) {
 		bbr->r_wanted_output = 1;
 	}
 	tcp_bbr_tso_size_check(bbr, bbr->r_ctl.rc_rcvtime);
 }
 
 /*
  * Pick the reduced bandwidth (red_bw) value.
  *
  * Start from the current value of the delivery-rate filter, pull it
  * down to rc_bbr_cur_del_rate when that is lower, and then make sure the
  * result is no less than half of the filter value.  Finishes by
  * re-running the TSO size check with the supplied time.
  */
 static void
 bbr_setup_red_bw(struct tcp_bbr *bbr, uint32_t cts)
 {
 	bbr->r_ctl.red_bw = get_filter_value(&bbr->r_ctl.rc_delrate);
 	/* Do not start above the current delivery rate. */
 	if (bbr->r_ctl.rc_bbr_cur_del_rate < bbr->r_ctl.red_bw) {
 		bbr->r_ctl.red_bw = bbr->r_ctl.rc_bbr_cur_del_rate;
 	}
 	/* The floor is one half of what the filter currently reports. */
 	if ((get_filter_value(&bbr->r_ctl.rc_delrate) / 2) > bbr->r_ctl.red_bw) {
 		bbr->r_ctl.red_bw = get_filter_value(&bbr->r_ctl.rc_delrate) / 2;
 	}
 	tcp_bbr_tso_size_check(bbr, cts);
 }
 
 /*
  * React to a congestion signal for this connection.
  *
  * Two signal types are handled; any other value of 'type' falls through
  * the switch with no action:
  *
  *   CC_NDUPACK - if the connection is not already in recovery, enter
  *                recovery: record snd_recover, start a new packet epoch,
  *                remember the cwnd on entry and (when not in google
  *                mode) set snd_cwnd to the current flight plus one
  *                segment, floored at get_min_cwnd().
  *   CC_RTO_ERR - a retransmit timeout turned out to be unnecessary;
  *                unless we are in PROBE_RTT the saved cwnd, ssthresh
  *                and snd_recover values are restored.
  *
  * 'th' is not referenced by this function.  'rsm' is dereferenced on the
  * CC_NDUPACK recovery-entry path, so it must be non-NULL there.
  * The inpcb write lock must be held (asserted below).
  */
 static void
 bbr_cong_signal(struct tcpcb *tp, struct tcphdr *th, uint32_t type, struct bbr_sendmap *rsm)
 {
 	struct tcp_bbr *bbr;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 #ifdef STATS
 	stats_voi_update_abs_u32(tp->t_stats, VOI_TCP_CSIG, type);
 #endif
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	switch (type) {
 	case CC_NDUPACK:
 		/* Only act on the transition into recovery. */
 		if (!IN_RECOVERY(tp->t_flags)) {
 			tp->snd_recover = tp->snd_max;
 			/* Start a new epoch */
 			bbr_set_pktepoch(bbr, bbr->r_ctl.rc_rcvtime, __LINE__);
 			if (bbr->rc_lt_is_sampling || bbr->rc_lt_use_bw) {
 				/*
 				 * Move forward the lt epoch
 				 * so it won't count the truncated
 				 * epoch.
 				 */
 				bbr->r_ctl.rc_lt_epoch++;
 			}
 			if (bbr->rc_bbr_state == BBR_STATE_STARTUP) {
 				/*
 				 * Just like the policer detection code
 				 * if we are in startup we must push
 				 * forward the last startup epoch
 				 * to hide the truncated PE.
 				 */
 				bbr->r_ctl.rc_bbr_last_startup_epoch++;
 			}
 			/* Remember the cwnd we had when recovery started. */
 			bbr->r_ctl.rc_cwnd_on_ent = tp->snd_cwnd;
 			ENTER_RECOVERY(tp->t_flags);
 			bbr->rc_tlp_rtx_out = 0;
 			/* Seed the recovery loss rate from the packet-epoch loss rate. */
 			bbr->r_ctl.recovery_lr = bbr->r_ctl.rc_pkt_epoch_loss_rate;
 			tcp_bbr_tso_size_check(bbr, bbr->r_ctl.rc_rcvtime);
 			if (tcp_in_hpts(bbr->rc_tp) &&
 			    ((bbr->r_ctl.rc_hpts_flags & PACE_TMR_RACK) == 0)) {
 				/*
 				 * When we enter recovery, we need to restart
 				 * any timers. This may mean we gain an agg
 				 * early, which will be made up for at the last
 				 * rxt out.
 				 */
 				bbr->rc_timer_first = 1;
 				bbr_timer_cancel(bbr, __LINE__, bbr->r_ctl.rc_rcvtime);
 			}
 			/*
 			 * Set the cwnd to what is currently in flight plus
 			 * one segment (t_maxseg less the last options
 			 * length), but never below the minimum cwnd.  This
 			 * is skipped in google mode, and in PROBE_RTT unless
 			 * bbr_rttprobe_gain_val is set.
 			 */
 			if ((bbr->rc_use_google == 0) &&
 			    (bbr->r_ctl.bbr_rttprobe_gain_val ||
 			     (bbr->rc_bbr_state != BBR_STATE_PROBE_RTT))) {
 				tp->snd_cwnd = ctf_flight_size(tp,
 					           (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes)) +
 					(tp->t_maxseg - bbr->rc_last_options);
 				if (tp->snd_cwnd < get_min_cwnd(bbr)) {
 					/* We always gate to min cwnd */
 					tp->snd_cwnd = get_min_cwnd(bbr);
 				}
 				bbr_log_type_cwndupd(bbr, 0, 0, 0, 14, 0, 0, __LINE__);
 			}
 			bbr_log_type_enter_rec(bbr, rsm->r_start);
 		}
 		break;
 	case CC_RTO_ERR:
 		KMOD_TCPSTAT_INC(tcps_sndrexmitbad);
 		/* RTO was unnecessary, so reset everything. */
 		bbr_reset_lt_bw_sampling(bbr, bbr->r_ctl.rc_rcvtime);
 		if (bbr->rc_bbr_state != BBR_STATE_PROBE_RTT) {
 			tp->snd_cwnd = tp->snd_cwnd_prev;
 			tp->snd_ssthresh = tp->snd_ssthresh_prev;
 			tp->snd_recover = tp->snd_recover_prev;
 			/* Never restore to less than the cwnd saved on recovery entry. */
 			tp->snd_cwnd = max(tp->snd_cwnd, bbr->r_ctl.rc_cwnd_on_ent);
 			bbr_log_type_cwndupd(bbr, 0, 0, 0, 13, 0, 0, __LINE__);
 		}
 		tp->t_badrxtwin = 0;
 		break;
 	}
 }
 
 /*
  * Indicate whether this ack should be delayed.  The macro evaluates to
  * non-zero only when all of the following hold:
  *	- Our last ack wasn't a 0-sized window (TF_RXWIN0SENT is clear).
  *	  We never want to delay the ack that opens up a 0-sized window.
  *	- There is no delayed ack already pending (TF_DELACK is clear).
  *	- The segments already received (bbr_segs_rcvd) plus nsegs stay
  *	  below tp->t_delayed_ack.
  *	- Delayed acks are enabled (t_delayed_ack is non-zero) or this is
  *	  a half-synchronized connection (TF_NEEDSYN is set).
  *
  * Every argument is parenthesized in the expansion so that expressions
  * such as "&obj" or "a ? b : c" can be passed safely.  Note that tp is
  * still evaluated more than once, so it must not have side effects.
  */
 #define DELAY_ACK(tp, bbr, nsegs)					\
 	((((tp)->t_flags & TF_RXWIN0SENT) == 0) &&			\
 	 (((tp)->t_flags & TF_DELACK) == 0) &&				\
 	 (((bbr)->bbr_segs_rcvd + (nsegs)) < (tp)->t_delayed_ack) &&	\
 	 ((tp)->t_delayed_ack || ((tp)->t_flags & TF_NEEDSYN)))
 
 /*
  * Return the first entry on the transmit-ordered list (rc_tmap) that
  * is not flagged BBR_ACKED, i.e. the oldest transmission that is still
  * outstanding.  Returns NULL when the list is empty or every entry on
  * it is acked.
  *
  * Normally the very first entry qualifies, since entries are removed
  * from the send map once they are marked ACKED.
  */
 static struct bbr_sendmap *
 bbr_find_lowest_rsm(struct tcp_bbr *bbr)
 {
 	struct bbr_sendmap *cur;
 
 	TAILQ_FOREACH(cur, &bbr->r_ctl.rc_tmap, r_tnext) {
 		if ((cur->r_flags & BBR_ACKED) == 0) {
 			/* First un-acked entry in send-time order. */
 			return (cur);
 		}
 	}
 	/* Ran off the end of the list without finding one. */
 	return (NULL);
 }
 
 /*
  * Starting at rsm and walking the sequence-ordered map (rc_map) toward
  * lower sequence numbers, return the first entry that carries neither
  * BBR_ACKED nor BBR_HAS_FIN.  Returns NULL when no such entry exists.
  *
  * Callers normally pass the last entry of the map and get it straight
  * back unless it is acked or carries the FIN.
  */
 static struct bbr_sendmap *
 bbr_find_high_nonack(struct tcp_bbr *bbr, struct bbr_sendmap *rsm)
 {
 	struct bbr_sendmap *cand = rsm;
 
 	TAILQ_FOREACH_REVERSE_FROM(cand, &bbr->r_ctl.rc_map, bbr_head, r_next) {
 		if ((cand->r_flags & (BBR_ACKED | BBR_HAS_FIN)) == 0)
 			return (cand);
 	}
 	return (NULL);
 }
 
 /*
  * Returns to the caller the number of microseconds that
  * the packet can be outstanding before we think we
  * should have had an ack returned.
  *
  * The threshold is srtt + rc_pkt_delay, plus either a reordering
  * allowance (srtt >> rc_reorder_shift, or srtt/4 when the shift is 0)
  * when reordering is considered active, or a fixed 1000 otherwise.
  * The result is capped by the current RTO and by rc_max_rto_sec.
  *
  * Side effect: when reorder-fade is configured and more than
  * rc_reorder_fade has elapsed since rc_reorder_ts, rc_reorder_ts is
  * reset to 0.  rsm is only passed through to the logging call.
  */
 static uint32_t
 bbr_calc_thresh_rack(struct tcp_bbr *bbr, uint32_t srtt, uint32_t cts, struct bbr_sendmap *rsm)
 {
 	/*
 	 * lro is the flag we use to determine if we have seen reordering.
 	 * If it gets set we have seen reordering. The reorder logic
 	 * works in one of two ways:
 	 *
 	 * If reorder-fade is configured, then we track the last time we saw
 	 * re-ordering occur. If we reach the point where enough time has
 	 * passed we no longer consider reordering to be occurring.
 	 *
 	 * Or if reorder-fade is 0, then once we see reordering we consider
 	 * the connection to always be subject to reordering and just set lro
 	 * to 1.
 	 *
 	 * In the end if lro is non-zero we add the extra time for
 	 * reordering in.
 	 */
 	int32_t lro;
 	uint32_t thresh, t_rxtcur;
 
 	/* Avoid working with a zero srtt. */
 	if (srtt == 0)
 		srtt = 1;
 	if (bbr->r_ctl.rc_reorder_ts) {
 		if (bbr->r_ctl.rc_reorder_fade) {
 			if (SEQ_GEQ(cts, bbr->r_ctl.rc_reorder_ts)) {
 				/* Time elapsed since reordering was last seen. */
 				lro = cts - bbr->r_ctl.rc_reorder_ts;
 				if (lro == 0) {
 					/*
 					 * No time has passed since the last
 					 * reorder, mark it as reordering.
 					 */
 					lro = 1;
 				}
 			} else {
 				/* Negative time? */
 				lro = 0;
 			}
 			if (lro > bbr->r_ctl.rc_reorder_fade) {
 				/* Turn off reordering seen too */
 				bbr->r_ctl.rc_reorder_ts = 0;
 				lro = 0;
 			}
 		} else {
 			/* Reordering does not fade */
 			lro = 1;
 		}
 	} else {
 		lro = 0;
 	}
 	thresh = srtt + bbr->r_ctl.rc_pkt_delay;
 	if (lro) {
 		/* It must be set, if not you get 1/4 rtt */
 		if (bbr->r_ctl.rc_reorder_shift)
 			thresh += (srtt >> bbr->r_ctl.rc_reorder_shift);
 		else
 			thresh += (srtt >> 2);
 	} else {
 		/* No reordering seen: add a fixed 1000 (same units as srtt). */
 		thresh += 1000;
 	}
 	/* We don't let the rack timeout be above a RTO */
 	if ((bbr->rc_tp)->t_srtt == 0)
 		t_rxtcur = BBR_INITIAL_RTO;
 	else
 		t_rxtcur = TICKS_2_USEC(bbr->rc_tp->t_rxtcur);
 	if (thresh > t_rxtcur) {
 		thresh = t_rxtcur;
 	}
 	/* And we don't want it above the RTO max either */
 	if (thresh > (((uint32_t)bbr->rc_max_rto_sec) * USECS_IN_SECOND)) {
 		thresh = (((uint32_t)bbr->rc_max_rto_sec) * USECS_IN_SECOND);
 	}
 	bbr_log_thresh_choice(bbr, cts, thresh, lro, srtt, rsm, BBR_TO_FRM_RACK);
 	return (thresh);
 }
 
 /*
  * Return to the caller the amount of time in micro-seconds
  * that should be used for the TLP timer from the last
  * send time of this packet.
  *
  * The base threshold is srtt + srtt / rc_tlp_threshold (or 2 * srtt
  * when rc_tlp_threshold is 0).  For a segment of at most one maxseg:
  *   - if another entry precedes it on the transmit list, the gap
  *     between the two most recent send times is added;
  *   - otherwise the threshold is raised to at least
  *     1.5 * srtt + bbr_delayed_ack_time to allow for a delayed ack.
  * The result is capped by the current RTO and by rc_max_rto_sec, and
  * finally raised to bbr_tlp_min if it ended up smaller.
  */
 static uint32_t
 bbr_calc_thresh_tlp(struct tcpcb *tp, struct tcp_bbr *bbr,
     struct bbr_sendmap *rsm, uint32_t srtt,
     uint32_t cts)
 {
 	uint32_t thresh, len, maxseg, t_rxtcur;
 	struct bbr_sendmap *prsm;
 
 	/* Avoid working with a zero srtt. */
 	if (srtt == 0)
 		srtt = 1;
 	if (bbr->rc_tlp_threshold)
 		thresh = srtt + (srtt / bbr->rc_tlp_threshold);
 	else
 		thresh = (srtt * 2);
 	maxseg = tp->t_maxseg - bbr->rc_last_options;
 	len = rsm->r_end - rsm->r_start;
 
 	/* 2.1 behavior */
 	/* Get the previous sent packet, if any  */
 	prsm = TAILQ_PREV(rsm, bbr_head, r_tnext);
 	if (prsm && (len <= maxseg)) {
 		/*
 		 * Two packets outstanding, thresh should be (2*srtt) +
 		 * possible inter-packet delay (if any).
 		 */
 		uint32_t inter_gap = 0;
 		int idx, nidx;
 
 		/* idx/nidx select the latest send time of rsm/prsm. */
 		idx = rsm->r_rtr_cnt - 1;
 		nidx = prsm->r_rtr_cnt - 1;
 		/*
 		 * Each entry must be indexed with its own retransmit
 		 * count; the guard has to compare exactly the two
 		 * timestamps that are subtracted below.
 		 */
 		if (TSTMP_GEQ(rsm->r_tim_lastsent[idx], prsm->r_tim_lastsent[nidx])) {
 			/* Yes it was sent later (or at the same time) */
 			inter_gap = rsm->r_tim_lastsent[idx] - prsm->r_tim_lastsent[nidx];
 		}
 		thresh += inter_gap;
 	} else if (len <= maxseg) {
 		/*
 		 * Possibly compensate for delayed-ack.
 		 */
 		uint32_t alt_thresh;
 
 		alt_thresh = srtt + (srtt / 2) + bbr_delayed_ack_time;
 		if (alt_thresh > thresh)
 			thresh = alt_thresh;
 	}
 	/* Not above the current  RTO */
 	if (tp->t_srtt == 0)
 		t_rxtcur = BBR_INITIAL_RTO;
 	else
 		t_rxtcur = TICKS_2_USEC(tp->t_rxtcur);
 
 	/* Log the un-clamped choice together with the RTO it is capped by. */
 	bbr_log_thresh_choice(bbr, cts, thresh, t_rxtcur, srtt, rsm, BBR_TO_FRM_TLP);
 	/* Not above an RTO */
 	if (thresh > t_rxtcur) {
 		thresh = t_rxtcur;
 	}
 	/* Not above a RTO max */
 	if (thresh > (((uint32_t)bbr->rc_max_rto_sec) * USECS_IN_SECOND)) {
 		thresh = (((uint32_t)bbr->rc_max_rto_sec) * USECS_IN_SECOND);
 	}
 	/* And now apply the user TLP min */
 	if (thresh < bbr_tlp_min) {
 		thresh = bbr_tlp_min;
 	}
 	return (thresh);
 }
 
 /*
  * Return the RTT of the requested kind:
  *
  *   BBR_RTT_PROP   - the value of the rc_rttprop filter, or a fallback
  *                    when the filter holds 0xffffffff (no sample).
  *   BBR_RTT_PKTRTT - rc_pkt_epoch_rtt when non-zero, else the
  *                    BBR_RTT_PROP value.
  *   BBR_RTT_RACK   - rc_last_rtt, plus rc_ack_hdwr_delay when the ack
  *                    was flagged as delayed.
  *   BBR_SRTT       - the connection's t_srtt converted with
  *                    TICKS_2_USEC and shifted down by TCP_RTT_SHIFT.
  *
  * Any other rtt_type returns the BBR_RTT_PROP value (and panics first
  * when BBR_INVARIANTS is defined).
  */
 static __inline uint32_t
 bbr_get_rtt(struct tcp_bbr *bbr, int32_t rtt_type)
 {
 	uint32_t prop_rtt;
 
 	if (get_filter_value_small(&bbr->r_ctl.rc_rttprop) != 0xffffffff) {
 		prop_rtt = get_filter_value_small(&bbr->r_ctl.rc_rttprop);
 	} else {
 		/* The filter has nothing for us, fall back on the tcpcb. */
 		if (bbr->rc_tp->t_srtt == 0)
 			prop_rtt = BBR_INITIAL_RTO;
 		else
 			prop_rtt = (TICKS_2_USEC(bbr->rc_tp->t_srtt) >> TCP_RTT_SHIFT);
 		/*
 		 * The quality of this value is unknown, so never go
 		 * below the delayed-ack time.
 		 */
 		if (prop_rtt < bbr_delayed_ack_time)
 			prop_rtt = bbr_delayed_ack_time;
 	}
 	if (rtt_type == BBR_RTT_PROP)
 		return (prop_rtt);
 	if (rtt_type == BBR_RTT_PKTRTT) {
 		/* Prefer the last measured pkt-rtt when there is one. */
 		if (bbr->r_ctl.rc_pkt_epoch_rtt)
 			return (bbr->r_ctl.rc_pkt_epoch_rtt);
 		return (prop_rtt);
 	}
 	if (rtt_type == BBR_RTT_RACK) {
 		uint32_t rack_rtt;
 
 		rack_rtt = bbr->r_ctl.rc_last_rtt;
 		/* Fold in any internal delay for our timer. */
 		if (bbr->rc_ack_was_delayed)
 			rack_rtt += bbr->r_ctl.rc_ack_hdwr_delay;
 		return (rack_rtt);
 	}
 	if (rtt_type == BBR_SRTT)
 		return (TICKS_2_USEC(bbr->rc_tp->t_srtt) >> TCP_RTT_SHIFT);
 	/* TSNH */
 #ifdef BBR_INVARIANTS
 	panic("Unknown rtt request type %d", rtt_type);
 #endif
 	return (prop_rtt);
 }
 
 /*
  * Decide whether rsm should be treated as lost at time cts.
  *
  * Returns 1 when the time since the entry's most recent transmission
  * has reached the RACK threshold computed from the BBR_RTT_RACK rtt,
  * and 0 otherwise.
  */
 static int
 bbr_is_lost(struct tcp_bbr *bbr, struct bbr_sendmap *rsm, uint32_t cts)
 {
 	uint32_t rack_thresh;
 
 	rack_thresh = bbr_calc_thresh_rack(bbr, bbr_get_rtt(bbr, BBR_RTT_RACK),
 					   cts, rsm);
 	if ((cts - rsm->r_tim_lastsent[(rsm->r_rtr_cnt - 1)]) < rack_thresh) {
 		/* Still inside the allowed window */
 		return (0);
 	}
 	/* Past time, call it lost */
 	return (1);
 }
 
 /*
  * Return a sendmap if we need to retransmit something.
  *
  * Looks at the oldest un-acked entry on the transmit list.  If that
  * entry is past the RACK threshold (bbr_is_lost()) and has either
  * reached DUP_ACK_THRESHOLD dup-acks or been passed by a SACK, it is
  * marked lost (updating rc_lost / rc_lost_bytes once), a CC_NDUPACK
  * congestion signal is raised and the entry is returned.  In every
  * other case NULL is returned and nothing is changed.
  */
 static struct bbr_sendmap *
 bbr_check_recovery_mode(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	/*
 	 * Check to see that we don't need to fall into recovery. We will
 	 * need to do so if our oldest transmit is past the time we should
 	 * have had an ack.
 	 */
 
 	struct bbr_sendmap *rsm;
 	int32_t idx;
 
 	if (TAILQ_EMPTY(&bbr->r_ctl.rc_map)) {
 		/* Nothing outstanding that we know of */
 		return (NULL);
 	}
 	rsm = TAILQ_FIRST(&bbr->r_ctl.rc_tmap);
 	if (rsm == NULL) {
 		/* Nothing in the transmit map */
 		return (NULL);
 	}
 	if (tp->t_flags & TF_SENTFIN) {
 		/* Fin restricted, don't find anything once a fin is sent */
 		return (NULL);
 	}
 	if (rsm->r_flags & BBR_ACKED) {
 		/*
 		 * Ok the first one is acked (this really should not happen
 		 * since we remove them from the tmap once they are acked)
 		 */
 		rsm = bbr_find_lowest_rsm(bbr);
 		if (rsm == NULL)
 			return (NULL);
 	}
 	/* Index of the most recent transmission of this entry. */
 	idx = rsm->r_rtr_cnt - 1;
 	if (SEQ_LEQ(cts, rsm->r_tim_lastsent[idx])) {
 		/* Send timestamp is the same or less? can't be ready */
 		return (NULL);
 	}
 	/*
 	 * Timed out per RACK, and we also have evidence of loss
 	 * (enough dup-acks or a SACK that passed this entry).
 	 */
 	if (bbr_is_lost(bbr, rsm, cts) &&
 	    ((rsm->r_dupack >= DUP_ACK_THRESHOLD) ||
 	     (rsm->r_flags & BBR_SACK_PASSED))) {
 		if ((rsm->r_flags & BBR_MARKED_LOST) == 0) {
 			/* Account for the loss only the first time we mark it. */
 			rsm->r_flags |= BBR_MARKED_LOST;
 			bbr->r_ctl.rc_lost += rsm->r_end - rsm->r_start;
 			bbr->r_ctl.rc_lost_bytes += rsm->r_end - rsm->r_start;
 		}
 		bbr_cong_signal(tp, NULL, CC_NDUPACK, rsm);
 #ifdef BBR_INVARIANTS
 		if ((rsm->r_end - rsm->r_start) == 0)
 			panic("tp:%p bbr:%p rsm:%p length is 0?", tp, bbr, rsm);
 #endif
 		return (rsm);
 	}
 	return (NULL);
 }
 
 /*
  * RACK Timer, here we simply do logging and house keeping.
  * the normal bbr_output_wtime() function will call the
  * appropriate thing to check if we need to do a RACK retransmit.
  * We return 1, saying don't proceed with bbr_output_wtime only
  * when all timers have been stopped (destroyed PCB?).
  *
  * Returns 0 in every other case, including when the timer has not
  * yet reached rc_timer_exp (in which case nothing else is done).
  */
 static int
 bbr_timeout_rack(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	/*
 	 * This timer simply provides an internal trigger to send out data.
 	 * The check_recovery_mode call will see if there are needed
 	 * retransmissions, if so we will enter fast-recovery. The output
 	 * call may or may not do the same thing depending on sysctl
 	 * settings.
 	 */
 	uint32_t lost;
 
 	if (bbr->rc_all_timers_stopped) {
 		return (1);
 	}
 	if (TSTMP_LT(cts, bbr->r_ctl.rc_timer_exp)) {
 		/* Its not time yet */
 		return (0);
 	}
 	BBR_STAT_INC(bbr_to_tot);
 	/* Snapshot the loss counter so we can tell if this run added loss. */
 	lost = bbr->r_ctl.rc_lost;
 	/* Re-sync our cached state if the TCP state changed underneath us. */
 	if (bbr->r_state && (bbr->r_state != tp->t_state))
 		bbr_set_state(tp, bbr, 0);
 	bbr_log_to_event(bbr, cts, BBR_TO_FRM_RACK);
 	if (bbr->r_ctl.rc_resend == NULL) {
 		/* Lets do the check here */
 		bbr->r_ctl.rc_resend = bbr_check_recovery_mode(tp, bbr, cts);
 	}
 	/* Optionally feed the "did we lose more" result to the lt-bw sampler. */
 	if (bbr_policer_call_from_rack_to)
 		bbr_lt_bw_sampling(bbr, cts, (bbr->r_ctl.rc_lost > lost));
 	bbr->r_ctl.rc_hpts_flags &= ~PACE_TMR_RACK;
 	return (0);
 }
 
 /*
  * Split the send-map entry rsm at sequence number 'start'.
  *
  * On return nrsm describes [start, old rsm->r_end) and rsm has been
  * truncated to end at 'start'.  The bookkeeping fields and the send
  * timestamps of rsm are copied into nrsm; r_rtr_bytes of nrsm is
  * reset to 0.  BBR_HAS_SYN is cleared on nrsm and BBR_HAS_FIN is
  * cleared on rsm (nrsm keeps whatever FIN flag it copied).
  *
  * Either piece that is no larger than 1/8 of
  * min(maxseg, rc_pace_max_segs) is flagged as a small map and counted
  * in rc_num_small_maps_alloced.
  *
  * This function does not link nrsm into any list; no list operation
  * appears here, so that is left to the caller.
  */
 static __inline void
 bbr_clone_rsm(struct tcp_bbr *bbr, struct bbr_sendmap *nrsm, struct bbr_sendmap *rsm, uint32_t start)
 {
 	int idx;
 
 	nrsm->r_start = start;
 	nrsm->r_end = rsm->r_end;
 	nrsm->r_rtr_cnt = rsm->r_rtr_cnt;
 	nrsm-> r_rtt_not_allowed = rsm->r_rtt_not_allowed;
 	nrsm->r_flags = rsm->r_flags;
 	/* We don't transfer forward the SYN flag */
 	nrsm->r_flags &= ~BBR_HAS_SYN;
 	/* We move forward the FIN flag, not that this should happen */
 	rsm->r_flags &= ~BBR_HAS_FIN;
 	nrsm->r_dupack = rsm->r_dupack;
 	nrsm->r_rtr_bytes = 0;
 	nrsm->r_is_gain = rsm->r_is_gain;
 	nrsm->r_is_drain = rsm->r_is_drain;
 	nrsm->r_delivered = rsm->r_delivered;
 	nrsm->r_ts_valid = rsm->r_ts_valid;
 	nrsm->r_del_ack_ts = rsm->r_del_ack_ts;
 	nrsm->r_del_time = rsm->r_del_time;
 	nrsm->r_app_limited = rsm->r_app_limited;
 	nrsm->r_first_sent_time = rsm->r_first_sent_time;
 	nrsm->r_flight_at_send = rsm->r_flight_at_send;
 	/* We split a piece the lower section looses any just_ret flag. */
 	nrsm->r_bbr_state = rsm->r_bbr_state;
 	/* Carry over the send time of every (re)transmission so far. */
 	for (idx = 0; idx < nrsm->r_rtr_cnt; idx++) {
 		nrsm->r_tim_lastsent[idx] = rsm->r_tim_lastsent[idx];
 	}
 	/* Truncate the original so the two pieces are adjacent. */
 	rsm->r_end = nrsm->r_start;
 	/* From here on idx is reused as the small-map size threshold. */
 	idx = min((bbr->rc_tp->t_maxseg - bbr->rc_last_options), bbr->r_ctl.rc_pace_max_segs);
 	idx /= 8;
 	/* Check if we got too small */
 	if ((rsm->r_is_smallmap == 0) &&
 	    ((rsm->r_end - rsm->r_start) <= idx)) {
 		bbr->r_ctl.rc_num_small_maps_alloced++;
 		rsm->r_is_smallmap = 1;
 	}
 	/* Check the new one as well */
 	if ((nrsm->r_end - nrsm->r_start) <= idx) {
 		bbr->r_ctl.rc_num_small_maps_alloced++;
 		nrsm->r_is_smallmap = 1;
 	}
 }
 
 /*
  * Tell whether the sack block [start, end) could be merged with one of
  * the neighbours of 'at' in the sequence-ordered map.
  *
  * A neighbour qualifies only if it is already in the BBR_ACKED state
  * and the sack block either touches it exactly or straddles its
  * boundary.  Returns 1 when the left or the right neighbour qualifies,
  * 0 otherwise.  'at' must be a valid entry of the map.
  */
 static int
 bbr_sack_mergable(struct bbr_sendmap *at,
 		  uint32_t start, uint32_t end)
 {
 	struct bbr_sendmap *left, *right;
 
 	left = TAILQ_PREV(at, bbr_head, r_next);
 	right = TAILQ_NEXT(at, r_next);
 
 	if ((left != NULL) && (left->r_flags & BBR_ACKED)) {
 		/*
 		 * map blk   |------|
 		 * sack blk         |------|
 		 */
 		if (left->r_end == start)
 			return (1);
 		/*
 		 * map blk   |------|
 		 * sack blk      |------|
 		 */
 		if (SEQ_LT(start, left->r_end) && SEQ_GT(end, left->r_end))
 			return (1);
 	}
 	if ((right != NULL) && (right->r_flags & BBR_ACKED)) {
 		/*
 		 * map blk          |---------|
 		 * sack blk    |----|
 		 */
 		if (right->r_start == end)
 			return (1);
 		/*
 		 * map blk          |---------|
 		 * sack blk    |-------|
 		 */
 		if (SEQ_LT(start, right->r_start) && SEQ_GT(end, right->r_start))
 			return (1);
 	}
 	/* Neither side can take it */
 	return (0);
 }
 
 /*
  * Merge the right-hand entry r_rsm into the left-hand entry l_rsm.
  *
  * l_rsm is extended to cover r_rsm's range and inherits the larger
  * dup-ack count, r_rsm's retransmitted bytes, its app-limited value
  * (when set) and its FIN / TLP / RWND_COLLAPSED flags.  r_rsm is then
  * unlinked from the map (and from the transmit list if it was on it)
  * and released with bbr_free().
  *
  * Returns l_rsm.  r_rsm must not be used by the caller afterwards.
  */
 static struct bbr_sendmap *
 bbr_merge_rsm(struct tcp_bbr *bbr,
 	      struct bbr_sendmap *l_rsm,
 	      struct bbr_sendmap *r_rsm)
 {
 	/*
 	 * We are merging two ack'd RSM's,
 	 * the l_rsm is on the left (lower seq
 	 * values) and the r_rsm is on the right
 	 * (higher seq value). The simplest way
 	 * to merge these is to move the right
 	 * one into the left. I don't think there
 	 * is any reason we need to try to find
 	 * the oldest (or last oldest retransmitted).
 	 */
 	l_rsm->r_end = r_rsm->r_end;
 	/* Keep the higher of the two dup-ack counts. */
 	if (l_rsm->r_dupack < r_rsm->r_dupack)
 		l_rsm->r_dupack = r_rsm->r_dupack;
 	if (r_rsm->r_rtr_bytes)
 		l_rsm->r_rtr_bytes += r_rsm->r_rtr_bytes;
 	if (r_rsm->r_in_tmap) {
 		/* This really should not happen */
 		TAILQ_REMOVE(&bbr->r_ctl.rc_tmap, r_rsm, r_tnext);
 	}
 	if (r_rsm->r_app_limited)
 		l_rsm->r_app_limited = r_rsm->r_app_limited;
 	/* Now the flags */
 	if (r_rsm->r_flags & BBR_HAS_FIN)
 		l_rsm->r_flags |= BBR_HAS_FIN;
 	if (r_rsm->r_flags & BBR_TLP)
 		l_rsm->r_flags |= BBR_TLP;
 	if (r_rsm->r_flags & BBR_RWND_COLLAPSED)
 		l_rsm->r_flags |= BBR_RWND_COLLAPSED;
 	if (r_rsm->r_flags & BBR_MARKED_LOST) {
 		/* This really should not happen */
 		bbr->r_ctl.rc_lost_bytes -= r_rsm->r_end - r_rsm->r_start;
 	}
 	TAILQ_REMOVE(&bbr->r_ctl.rc_map, r_rsm, r_next);
 	if ((r_rsm->r_limit_type == 0) && (l_rsm->r_limit_type != 0)) {
 		/* Transfer the split limit to the map we free */
 		r_rsm->r_limit_type = l_rsm->r_limit_type;
 		l_rsm->r_limit_type = 0;
 	}
 	bbr_free(bbr, r_rsm);
 	return(l_rsm);
 }
 
 /*
  * TLP Timer, here we simply setup what segment we want to
  * have the TLP expire on, the normal bbr_output_wtime() will then
  * send it out.
  *
  * Either new data is selected (rc_tlp_new_data is set and rc_tlp_send
  * is cleared) or an existing map entry is chosen for retransmission
  * and stored in rc_tlp_send; an entry larger than one segment is split
  * so that only its last maxseg bytes are probed.
  *
  * Return values:
  *   1           - all timers have been stopped (destroyed PCB?), do not
  *                 proceed with bbr_output_wtime.
  *   -ETIMEDOUT  - the progress timeout check failed.
  *   0           - everything else, including "not time yet", being in
  *                 persist, and giving up because the segment has hit
  *                 bbr_tlp_max_resend.
  */
 static int
 bbr_timeout_tlp(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	/*
 	 * Tail Loss Probe.
 	 */
 	struct bbr_sendmap *rsm = NULL;
 	struct socket *so;
 	uint32_t amm;
 	uint32_t out, avail;
 	uint32_t maxseg;
 	int collapsed_win = 0;
 
 	if (bbr->rc_all_timers_stopped) {
 		return (1);
 	}
 	if (TSTMP_LT(cts, bbr->r_ctl.rc_timer_exp)) {
 		/* Its not time yet */
 		return (0);
 	}
 	if (ctf_progress_timeout_check(tp, true)) {
 		bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 		return (-ETIMEDOUT);	/* tcp_drop() */
 	}
 	/* Did we somehow get into persists? */
 	if (bbr->rc_in_persist) {
 		return (0);
 	}
 	/* Re-sync our cached state if the TCP state changed underneath us. */
 	if (bbr->r_state && (bbr->r_state != tp->t_state))
 		bbr_set_state(tp, bbr, 0);
 	BBR_STAT_INC(bbr_tlp_tot);
 	maxseg = tp->t_maxseg - bbr->rc_last_options;
 	/*
 	 * A TLP timer has expired. We have been idle for 2 rtts. So we now
 	 * need to figure out how to force a full MSS segment out.
 	 */
 	so = tptosocket(tp);
 	avail = sbavail(&so->so_snd);
 	out = ctf_outstanding(tp);
 	if (out > tp->snd_wnd) {
 		/* special case, we need a retransmission */
 		collapsed_win = 1;
 		goto need_retran;
 	}
 	if (avail > out) {
 		/* New data is available */
 		amm = avail - out;
 		if (amm > maxseg) {
 			amm = maxseg;
 		} else if ((amm < maxseg) && ((tp->t_flags & TF_NODELAY) == 0)) {
 			/* not enough to fill a MTU and no-delay is off */
 			goto need_retran;
 		}
 		/* Set the send-new override */
 		if ((out + amm) <= tp->snd_wnd) {
 			bbr->rc_tlp_new_data = 1;
 		} else {
 			goto need_retran;
 		}
 		bbr->r_ctl.rc_tlp_seg_send_cnt = 0;
 		bbr->r_ctl.rc_last_tlp_seq = tp->snd_max;
 		bbr->r_ctl.rc_tlp_send = NULL;
 		/* cap any slots */
 		BBR_STAT_INC(bbr_tlp_newdata);
 		goto send;
 	}
 need_retran:
 	/*
 	 * Ok we need to arrange the last un-acked segment to be re-sent, or
 	 * optionally the first un-acked segment.
 	 */
 	if (collapsed_win == 0) {
 		rsm = TAILQ_LAST_FAST(&bbr->r_ctl.rc_map, bbr_sendmap, r_next);
 		/*
 		 * Only go hunting backwards when the last entry is
 		 * itself acked or carries the FIN; the flags of the
 		 * entry are what must be tested here, not the bare
 		 * flag constants.
 		 */
 		if (rsm && (rsm->r_flags & (BBR_ACKED | BBR_HAS_FIN))) {
 			rsm = bbr_find_high_nonack(bbr, rsm);
 		}
 		if (rsm == NULL) {
 			goto restore;
 		}
 	} else {
 		/*
 		 * We must find the last segment
 		 * that was acceptable by the client.
 		 */
 		TAILQ_FOREACH_REVERSE(rsm, &bbr->r_ctl.rc_map, bbr_head, r_next) {
 			if ((rsm->r_flags & BBR_RWND_COLLAPSED) == 0) {
 				/* Found one */
 				break;
 			}
 		}
 		if (rsm == NULL) {
 			/* None? if so send the first */
 			rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 			if (rsm == NULL)
 				goto restore;
 		}
 	}
 	if ((rsm->r_end - rsm->r_start) > maxseg) {
 		/*
 		 * We need to split this the last segment in two.
 		 */
 		struct bbr_sendmap *nrsm;
 
 		nrsm = bbr_alloc_full_limit(bbr);
 		if (nrsm == NULL) {
 			/*
 			 * We can't get memory to split, we can either just
 			 * not split it. Or retransmit the whole piece, lets
 			 * do the large send (BTLP :-) ).
 			 */
 			goto go_for_it;
 		}
 		/* nrsm becomes the trailing maxseg bytes of rsm. */
 		bbr_clone_rsm(bbr, nrsm, rsm, (rsm->r_end - maxseg));
 		TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_map, rsm, nrsm, r_next);
 		if (rsm->r_in_tmap) {
 			TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, rsm, nrsm, r_tnext);
 			nrsm->r_in_tmap = 1;
 		}
 		rsm->r_flags &= (~BBR_HAS_FIN);
 		rsm = nrsm;
 	}
 go_for_it:
 	bbr->r_ctl.rc_tlp_send = rsm;
 	bbr->rc_tlp_rtx_out = 1;
 	if (rsm->r_start == bbr->r_ctl.rc_last_tlp_seq) {
 		/* Same segment as the previous probe, count the repeat. */
 		bbr->r_ctl.rc_tlp_seg_send_cnt++;
 		tp->t_rxtshift++;
 	} else {
 		bbr->r_ctl.rc_last_tlp_seq = rsm->r_start;
 		bbr->r_ctl.rc_tlp_seg_send_cnt = 1;
 	}
 send:
 	if (bbr->r_ctl.rc_tlp_seg_send_cnt > bbr_tlp_max_resend) {
 		/*
 		 * Can't [re]/transmit a segment we have retransmitted the
 		 * max times. We need the retransmit timer to take over.
 		 */
 restore:
 		bbr->rc_tlp_new_data = 0;
 		bbr->r_ctl.rc_tlp_send = NULL;
 		if (rsm)
 			rsm->r_flags &= ~BBR_TLP;
 		BBR_STAT_INC(bbr_tlp_retran_fail);
 		return (0);
 	} else if (rsm) {
 		rsm->r_flags |= BBR_TLP;
 	}
 	/*
 	 * The send count is known to be within bbr_tlp_max_resend here
 	 * (the branch above returned otherwise), so no further limit
 	 * check is needed before completing the timeout.
 	 */
 	bbr_log_to_event(bbr, cts, BBR_TO_FRM_TLP);
 	bbr->r_ctl.rc_hpts_flags &= ~PACE_TMR_TLP;
 	return (0);
 }
 
 /*
  * Delayed-ack timer expiry.
  *
  * Replaces the pending delayed ack (TF_DELACK) with a request for an
  * immediate one (TF_ACKNOW); the output routine is then expected to
  * send the ack.
  *
  * Returns 1, meaning "do not proceed", only when all timers have been
  * stopped (destroyed PCB?); otherwise returns 0.
  */
 static int
 bbr_timeout_delack(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	if (bbr->rc_all_timers_stopped)
 		return (1);
 
 	bbr_log_to_event(bbr, cts, BBR_TO_FRM_DELACK);
 	/* Trade the delayed ack for an immediate one. */
 	tp->t_flags = (tp->t_flags & ~TF_DELACK) | TF_ACKNOW;
 	KMOD_TCPSTAT_INC(tcps_delack);
 	/* This timer is no longer pending. */
 	bbr->r_ctl.rc_hpts_flags &= ~PACE_TMR_DELACK;
 	return (0);
 }
 
 /*
  * Here we send a KEEP-ALIVE like probe to the
  * peer, we do not send data.
  *
  * Return values:
  *   1           - all timers are stopped (destroyed PCB?), or the probe
  *                 path ran to completion and the timer was restarted.
  *   0           - we are not in persist, or there was nothing left to
  *                 send and persist mode was exited.
  *   -ETIMEDOUT  - the connection should be dropped (progress timeout,
  *                 or the persist idle limits were exceeded).
  */
 static int
 bbr_timeout_persist(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	struct tcptemp *t_template;
 	int32_t retval = 1;
 
 	if (bbr->rc_all_timers_stopped) {
 		return (1);
 	}
 	if (bbr->rc_in_persist == 0)
 		return (0);
 
 	/*
 	 * Persistence timer into zero window. Force a byte to be output, if
 	 * possible.
 	 */
 	bbr_log_to_event(bbr, cts, BBR_TO_FRM_PERSIST);
 	bbr->r_ctl.rc_hpts_flags &= ~PACE_TMR_PERSIT;
 	KMOD_TCPSTAT_INC(tcps_persisttimeo);
 	/*
 	 * Have we exceeded the user specified progress time?
 	 */
 	if (ctf_progress_timeout_check(tp, true)) {
 		bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 		return (-ETIMEDOUT);	/* tcp_drop() */
 	}
 	/*
 	 * Hack: if the peer is dead/unreachable, we do not time out if the
 	 * window is closed.  After a full backoff, drop the connection if
 	 * the idle time (no responses to probes) reaches the maximum
 	 * backoff that we would use if retransmitting.
 	 */
 	if (tp->t_rxtshift >= V_tcp_retries &&
 	    (ticks - tp->t_rcvtime >= tcp_maxpersistidle ||
 	    ticks - tp->t_rcvtime >= TCP_REXMTVAL(tp) * tcp_totbackoff)) {
 		KMOD_TCPSTAT_INC(tcps_persistdrop);
 		tcp_log_end_status(tp, TCP_EI_STATUS_PERSIST_MAX);
 		return (-ETIMEDOUT);	/* tcp_drop() */
 	}
 	/* Nothing queued and nothing outstanding: no reason to persist. */
 	if ((sbavail(&bbr->rc_inp->inp_socket->so_snd) == 0) &&
 	    tp->snd_una == tp->snd_max) {
 		bbr_exit_persist(tp, bbr, cts, __LINE__);
 		retval = 0;
 		goto out;
 	}
 	/*
 	 * If the user has closed the socket then drop a persisting
 	 * connection after a much reduced timeout.
 	 */
 	if (tp->t_state > TCPS_CLOSE_WAIT &&
 	    (ticks - tp->t_rcvtime) >= TCPTV_PERSMAX) {
 		KMOD_TCPSTAT_INC(tcps_persistdrop);
 		tcp_log_end_status(tp, TCP_EI_STATUS_PERSIST_MAX);
 		return (-ETIMEDOUT);	/* tcp_drop() */
 	}
 	/* Build and send the probe; it is skipped if no template is available. */
 	t_template = tcpip_maketemplate(bbr->rc_inp);
 	if (t_template) {
 		tcp_respond(tp, t_template->tt_ipgen,
 			    &t_template->tt_t, (struct mbuf *)NULL,
 			    tp->rcv_nxt, tp->snd_una - 1, 0);
 		/* This sends an ack */
 		if (tp->t_flags & TF_DELACK)
 			tp->t_flags &= ~TF_DELACK;
 		free(t_template, M_TEMP);
 	}
 	/* Back off, but stop incrementing once V_tcp_retries is reached. */
 	if (tp->t_rxtshift < V_tcp_retries)
 		tp->t_rxtshift++;
 	bbr_start_hpts_timer(bbr, tp, cts, 3, 0, 0);
 out:
 	return (retval);
 }
 
 /*
  * If a keepalive goes off, we had no other timers
  * happening. This routine either drops the connection
  * (returning -ETIMEDOUT) or, possibly after sending a probe
  * with tcp_respond(), restarts the timer and returns 1.
  * It also returns 1 when all timers have been stopped.
  */
 static int
 bbr_timeout_keepalive(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	struct tcptemp *t_template;
 	struct inpcb *inp = tptoinpcb(tp);
 
 	if (bbr->rc_all_timers_stopped) {
 		return (1);
 	}
 	bbr->r_ctl.rc_hpts_flags &= ~PACE_TMR_KEEP;
 	bbr_log_to_event(bbr, cts, BBR_TO_FRM_KEEP);
 	/*
 	 * Keep-alive timer went off; send something or drop connection if
 	 * idle for too long.
 	 */
 	KMOD_TCPSTAT_INC(tcps_keeptimeo);
 	/* A connection that never reached ESTABLISHED is simply dropped. */
 	if (tp->t_state < TCPS_ESTABLISHED)
 		goto dropit;
 	if ((V_tcp_always_keepalive || inp->inp_socket->so_options & SO_KEEPALIVE) &&
 	    tp->t_state <= TCPS_CLOSING) {
 		/* Idle for longer than keep-idle plus max-idle: give up. */
 		if (ticks - tp->t_rcvtime >= TP_KEEPIDLE(tp) + TP_MAXIDLE(tp))
 			goto dropit;
 		/*
 		 * Send a packet designed to force a response if the peer is
 		 * up and reachable: either an ACK if the connection is
 		 * still alive, or an RST if the peer has closed the
 		 * connection due to timeout or reboot. Using sequence
 		 * number tp->snd_una-1 causes the transmitted zero-length
 		 * segment to lie outside the receive window; by the
 		 * protocol spec, this requires the correspondent TCP to
 		 * respond.
 		 */
 		KMOD_TCPSTAT_INC(tcps_keepprobe);
 		t_template = tcpip_maketemplate(inp);
 		if (t_template) {
 			tcp_respond(tp, t_template->tt_ipgen,
 			    &t_template->tt_t, (struct mbuf *)NULL,
 			    tp->rcv_nxt, tp->snd_una - 1, 0);
 			free(t_template, M_TEMP);
 		}
 	}
 	/* Restart the timer whether or not a probe was sent. */
 	bbr_start_hpts_timer(bbr, tp, cts, 4, 0, 0);
 	return (1);
 dropit:
 	KMOD_TCPSTAT_INC(tcps_keepdrops);
 	tcp_log_end_status(tp, TCP_EI_STATUS_KEEP_MAX);
 	return (-ETIMEDOUT);	/* tcp_drop() */
 }
 
 /*
  * Retransmit helper function, clear up all the ack
  * flags and take care of important book keeping.
  *
  * Walks the whole send map.  Entries that were marked acked are
  * un-acked and put back on the transmit list; all other entries are
  * marked lost (and counted in rc_lost / rc_lost_bytes if they were not
  * already).  Afterwards the first map entry is queued for resend, the
  * TLP, pacing-aggregate and sack counters are reset, and the lt-bw
  * sampler is told whether any new loss was recorded.
  */
 static void
 bbr_remxt_tmr(struct tcpcb *tp)
 {
 	/*
 	 * The retransmit timer went off, all sack'd blocks must be
 	 * un-acked.
 	 */
 	struct bbr_sendmap *rsm, *trsm = NULL;
 	struct tcp_bbr *bbr;
 	uint32_t cts, lost;
 
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	cts = tcp_get_usecs(&bbr->rc_tv);
 	/* Snapshot the loss counter so we can tell if this run added loss. */
 	lost = bbr->r_ctl.rc_lost;
 	if (bbr->r_state && (bbr->r_state != tp->t_state))
 		bbr_set_state(tp, bbr, 0);
 
 	/* trsm trails the loop and is the entry processed just before rsm. */
 	TAILQ_FOREACH(rsm, &bbr->r_ctl.rc_map, r_next) {
 		if (rsm->r_flags & BBR_ACKED) {
 			uint32_t old_flags;
 
 			rsm->r_dupack = 0;
 			if (rsm->r_in_tmap == 0) {
 				/* We must re-add it back to the tlist */
 				if (trsm == NULL) {
 					TAILQ_INSERT_HEAD(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 				} else {
 					TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, trsm, rsm, r_tnext);
 				}
 				rsm->r_in_tmap = 1;
 			}
 			/* Keep the pre-clear flags for the log entry. */
 			old_flags = rsm->r_flags;
 			rsm->r_flags |= BBR_RXT_CLEARED;
 			rsm->r_flags &= ~(BBR_ACKED | BBR_SACK_PASSED | BBR_WAS_SACKPASS);
 			bbr_log_type_rsmclear(bbr, cts, rsm, old_flags, __LINE__);
 		} else {
 			if ((tp->t_state < TCPS_ESTABLISHED) &&
 			    (rsm->r_start == tp->snd_una)) {
 				/*
 				 * Special case for TCP FO. Where
 				 * we sent more data beyond the snd_max.
 				 * We don't mark that as lost and stop here.
 				 */
 				break;
 			}
 			/* Count the bytes as lost only once per entry. */
 			if ((rsm->r_flags & BBR_MARKED_LOST) == 0) {
 				bbr->r_ctl.rc_lost += rsm->r_end - rsm->r_start;
 				bbr->r_ctl.rc_lost_bytes += rsm->r_end - rsm->r_start;
 			}
 			if (bbr_marks_rxt_sack_passed) {
 				/*
 				 * With this option, we will rack out
 				 * in 1ms increments the rest of the packets.
 				 */
 				rsm->r_flags |= BBR_SACK_PASSED | BBR_MARKED_LOST;
 				rsm->r_flags &= ~BBR_WAS_SACKPASS;
 			} else {
 				/*
 				 * With this option we only mark them lost
 				 * and remove all sack'd markings. We will run
 				 * another RXT or a TLP. This will cause
 				 * us to eventually send more based on what
 				 * ack's come in.
 				 */
 				rsm->r_flags |= BBR_MARKED_LOST;
 				rsm->r_flags &= ~BBR_WAS_SACKPASS;
 				rsm->r_flags &= ~BBR_SACK_PASSED;
 			}
 		}
 		trsm = rsm;
 	}
 	/* Retransmission starts from the first entry of the map. */
 	bbr->r_ctl.rc_resend = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 	bbr_log_to_event(bbr, cts, BBR_TO_FRM_TMR);
 	bbr->rc_tlp_new_data = 0;
 	bbr->r_ctl.rc_tlp_seg_send_cnt = 0;
 	/* zap the behindness on a rxt */
 	bbr->r_ctl.rc_hptsi_agg_delay = 0;
 	bbr->r_agg_early_set = 0;
 	bbr->r_ctl.rc_agg_early = 0;
 	bbr->rc_tlp_rtx_out = 0;
 	/* Clear the sacked count (we just un-acked them) */
 	bbr->r_ctl.rc_sacked = 0;
 	bbr->r_ctl.rc_sacklast = NULL;
 	bbr->r_timer_override = 1;
 	bbr_lt_bw_sampling(bbr, cts, (bbr->r_ctl.rc_lost > lost));
 }
 
 /*
  * Re-transmit timeout!  Sets the connection up to retransmit the lowest
  * sequence number outstanding.
  *
  * Return values, as produced by the code below:
  *   1        - all timers have been stopped (rc_all_timers_stopped), so
  *              nothing was done.
  *   0        - nothing was outstanding, or the timeout was processed
  *              normally.
  *   negative - -ETIMEDOUT or -t_softerror; these returns are the ones the
  *              in-line comments tag as the tcp_drop() cases.
  */
 static int
 bbr_timeout_rxt(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 	int32_t rexmt;
 	int32_t retval = 0;
 	bool isipv6;
 
 	bbr->r_ctl.rc_hpts_flags &= ~PACE_TMR_RXT;
 	if (bbr->rc_all_timers_stopped) {
 		return (1);
 	}
 	if (TCPS_HAVEESTABLISHED(tp->t_state) &&
 	    (tp->snd_una == tp->snd_max)) {
 		/* Nothing outstanding .. nothing to do */
 		return (0);
 	}
 	/*
 	 * Retransmission timer went off.  Message has not been acked within
 	 * retransmit interval.  Back off to a longer retransmit interval
 	 * and retransmit one segment.
 	 */
 	if (ctf_progress_timeout_check(tp, true)) {
 		/*
 		 * NOTE(review): this passes `tick` while the rest of this
 		 * function uses `ticks` -- confirm which one is intended.
 		 */
 		bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 		return (-ETIMEDOUT);	/* tcp_drop() */
 	}
 	/* Un-ack SACKed data, mark the rest lost and pick rc_resend. */
 	bbr_remxt_tmr(tp);
 	if ((bbr->r_ctl.rc_resend == NULL) ||
 	    ((bbr->r_ctl.rc_resend->r_flags & BBR_RWND_COLLAPSED) == 0)) {
 		/*
 		 * If the rwnd collapsed on
 		 * the one we are retransmitting
 		 * it does not count against the
 		 * rxt count.
 		 */
 		tp->t_rxtshift++;
 	}
 	if (tp->t_rxtshift > V_tcp_retries) {
 		/* Too many retransmits: clamp the shift and give up. */
 		tp->t_rxtshift = V_tcp_retries;
 		KMOD_TCPSTAT_INC(tcps_timeoutdrop);
 		tcp_log_end_status(tp, TCP_EI_STATUS_RETRAN);
 		/* XXXGL: previously t_softerror was casted to uint16_t */
 		MPASS(tp->t_softerror >= 0);
 		retval = tp->t_softerror ? -tp->t_softerror : -ETIMEDOUT;
 		return (retval);	/* tcp_drop() */
 	}
 	if (tp->t_state == TCPS_SYN_SENT) {
 		/*
 		 * If the SYN was retransmitted, indicate CWND to be limited
 		 * to 1 segment in cc_conn_init().
 		 */
 		tp->snd_cwnd = 1;
 	} else if (tp->t_rxtshift == 1) {
 		/*
 		 * first retransmit; record ssthresh and cwnd so they can be
 		 * recovered if this turns out to be a "bad" retransmit. A
 		 * retransmit is considered "bad" if an ACK for this segment
 		 * is received within RTT/2 interval; the assumption here is
 		 * that the ACK was already in flight.  See "On Estimating
 		 * End-to-End Network Path Properties" by Allman and Paxson
 		 * for more details.
 		 */
 		/*
 		 * NOTE(review): cwnd is collapsed to one segment here, before
 		 * snd_cwnd_prev is saved below, so the saved value is the
 		 * collapsed one -- confirm this is intended.
 		 */
 		tp->snd_cwnd = tp->t_maxseg - bbr->rc_last_options;
 		if (!IN_RECOVERY(tp->t_flags)) {
 			tp->snd_cwnd_prev = tp->snd_cwnd;
 			tp->snd_ssthresh_prev = tp->snd_ssthresh;
 			tp->snd_recover_prev = tp->snd_recover;
 			tp->t_badrxtwin = ticks + (tp->t_srtt >> (TCP_RTT_SHIFT + 1));
 			tp->t_flags |= TF_PREVVALID;
 		} else {
 			tp->t_flags &= ~TF_PREVVALID;
 		}
 		/* Same value as assigned at the top of this branch. */
 		tp->snd_cwnd = tp->t_maxseg - bbr->rc_last_options;
 	} else {
 		/* Later retransmits: one segment, no saved state to restore. */
 		tp->snd_cwnd = tp->t_maxseg - bbr->rc_last_options;
 		tp->t_flags &= ~TF_PREVVALID;
 	}
 	KMOD_TCPSTAT_INC(tcps_rexmttimeo);
 	/*
 	 * Back the RTO off by tcp_backoff[t_rxtshift]; during the handshake
 	 * the base is BBR_INITIAL_RTO rather than the measured value.
 	 */
 	if ((tp->t_state == TCPS_SYN_SENT) ||
 	    (tp->t_state == TCPS_SYN_RECEIVED))
 		rexmt = USEC_2_TICKS(BBR_INITIAL_RTO) * tcp_backoff[tp->t_rxtshift];
 	else
 		rexmt = TCP_REXMTVAL(tp) * tcp_backoff[tp->t_rxtshift];
 	/* Clamp between the per-connection minimum and maximum RTO. */
 	TCPT_RANGESET(tp->t_rxtcur, rexmt,
 	    MSEC_2_TICKS(bbr->r_ctl.rc_min_rto_ms),
 	    MSEC_2_TICKS(((uint32_t)bbr->rc_max_rto_sec) * 1000));
 	/*
 	 * We enter the path for PLMTUD if connection is established or, if
 	 * connection is FIN_WAIT_1 status, reason for the last is that if
 	 * amount of data we send is very small, we could send it in couple
 	 * of packets and process straight to FIN. In that case we won't
 	 * catch ESTABLISHED state.
 	 */
 #ifdef INET6
 	isipv6 = (inp->inp_vflag & INP_IPV6) ? true : false;
 #else
 	isipv6 = false;
 #endif
 	/*
 	 * V_tcp_pmtud_blackhole_detect: 1 enables detection for both address
 	 * families, 2 only when !isipv6, 3 only when isipv6.
 	 */
 	if (((V_tcp_pmtud_blackhole_detect == 1) ||
 	    (V_tcp_pmtud_blackhole_detect == 2 && !isipv6) ||
 	    (V_tcp_pmtud_blackhole_detect == 3 && isipv6)) &&
 	    ((tp->t_state == TCPS_ESTABLISHED) ||
 	    (tp->t_state == TCPS_FIN_WAIT_1))) {
 		/*
 		 * Idea here is that at each stage of mtu probe (usually,
 		 * 1448 -> 1188 -> 524) should be given 2 chances to recover
 		 * before further clamping down. 'tp->t_rxtshift % 2 == 0'
 		 * should take care of that.
 		 */
 		if (((tp->t_flags2 & (TF2_PLPMTU_PMTUD | TF2_PLPMTU_MAXSEGSNT)) ==
 		    (TF2_PLPMTU_PMTUD | TF2_PLPMTU_MAXSEGSNT)) &&
 		    (tp->t_rxtshift >= 2 && tp->t_rxtshift < 6 &&
 		    tp->t_rxtshift % 2 == 0)) {
 			/*
 			 * Enter Path MTU Black-hole Detection mechanism: -
 			 * Disable Path MTU Discovery (IP "DF" bit). -
 			 * Reduce MTU to lower value than what we negotiated
 			 * with peer.
 			 */
 			if ((tp->t_flags2 & TF2_PLPMTU_BLACKHOLE) == 0) {
 				/*
 				 * Record that we may have found a black
 				 * hole.
 				 */
 				tp->t_flags2 |= TF2_PLPMTU_BLACKHOLE;
 				/* Keep track of previous MSS. */
 				tp->t_pmtud_saved_maxseg = tp->t_maxseg;
 			}
 			/*
 			 * Reduce the MSS to blackhole value or to the
 			 * default in an attempt to retransmit.
 			 */
 			/*
 			 * The preprocessor blocks below assemble a single
 			 * if / else-if / else chain: the INET6 arms come
 			 * first, and when both INET6 and INET are defined the
 			 * bare "else" glues the INET arms onto them.
 			 */
 #ifdef INET6
 			/* From here on the address family comes from bbr. */
 			isipv6 = bbr->r_is_v6;
 			if (isipv6 &&
 			    tp->t_maxseg > V_tcp_v6pmtud_blackhole_mss) {
 				/* Use the sysctl tuneable blackhole MSS. */
 				tp->t_maxseg = V_tcp_v6pmtud_blackhole_mss;
 				KMOD_TCPSTAT_INC(tcps_pmtud_blackhole_activated);
 			} else if (isipv6) {
 				/* Use the default MSS. */
 				tp->t_maxseg = V_tcp_v6mssdflt;
 				/*
 				 * Disable Path MTU Discovery when we switch
 				 * to minmss.
 				 */
 				tp->t_flags2 &= ~TF2_PLPMTU_PMTUD;
 				KMOD_TCPSTAT_INC(tcps_pmtud_blackhole_activated_min_mss);
 			}
 #endif
 #if defined(INET6) && defined(INET)
 			else
 #endif
 #ifdef INET
 			if (tp->t_maxseg > V_tcp_pmtud_blackhole_mss) {
 				/* Use the sysctl tuneable blackhole MSS. */
 				tp->t_maxseg = V_tcp_pmtud_blackhole_mss;
 				KMOD_TCPSTAT_INC(tcps_pmtud_blackhole_activated);
 			} else {
 				/* Use the default MSS. */
 				tp->t_maxseg = V_tcp_mssdflt;
 				/*
 				 * Disable Path MTU Discovery when we switch
 				 * to minmss.
 				 */
 				tp->t_flags2 &= ~TF2_PLPMTU_PMTUD;
 				KMOD_TCPSTAT_INC(tcps_pmtud_blackhole_activated_min_mss);
 			}
 #endif
 		} else {
 			/*
 			 * If further retransmissions are still unsuccessful
 			 * with a lowered MTU, maybe this isn't a blackhole
 			 * and we restore the previous MSS and blackhole
 			 * detection flags. The limit '6' is determined by
 			 * giving each probe stage (1448, 1188, 524) 2
 			 * chances to recover.
 			 */
 			if ((tp->t_flags2 & TF2_PLPMTU_BLACKHOLE) &&
 			    (tp->t_rxtshift >= 6)) {
 				tp->t_flags2 |= TF2_PLPMTU_PMTUD;
 				tp->t_flags2 &= ~TF2_PLPMTU_BLACKHOLE;
 				tp->t_maxseg = tp->t_pmtud_saved_maxseg;
 				KMOD_TCPSTAT_INC(tcps_pmtud_blackhole_failed);
 			}
 		}
 	}
 	/*
 	 * Disable RFC1323 and SACK if we haven't got any response to our
 	 * third SYN to work-around some broken terminal servers (most of
 	 * which have hopefully been retired) that have bad VJ header
 	 * compression code which trashes TCP segments containing
 	 * unknown-to-them TCP options.
 	 */
 	if (tcp_rexmit_drop_options && (tp->t_state == TCPS_SYN_SENT) &&
 	    (tp->t_rxtshift == 3))
 		tp->t_flags &= ~(TF_REQ_SCALE | TF_REQ_TSTMP | TF_SACK_PERMIT);
 	/*
 	 * If we backed off this far, our srtt estimate is probably bogus.
 	 * Clobber it so we'll take the next rtt measurement as our srtt;
 	 * move the current srtt into rttvar to keep the current retransmit
 	 * times until then.
 	 */
 	if (tp->t_rxtshift > TCP_MAXRXTSHIFT / 4) {
 #ifdef INET6
 		if (bbr->r_is_v6)
 			in6_losing(inp);
 		else
 #endif
 			in_losing(inp);
 		tp->t_rttvar += (tp->t_srtt >> TCP_RTT_SHIFT);
 		tp->t_srtt = 0;
 	}
 	/* Reset SACK filtering and recovery point, and force an ACK out. */
 	sack_filter_clear(&bbr->r_ctl.bbr_sf, tp->snd_una);
 	tp->snd_recover = tp->snd_max;
 	tp->t_flags |= TF_ACKNOW;
 	tp->t_rtttime = 0;
 
 	return (retval);
 }
 
 /*
  * Run whichever pacer timer is pending on this connection.
  *
  * Returns 0 when no timer is pending, when a listener has paced output
  * pending, or when the timer has not expired yet and either output is being
  * paced or we were not called from hpts.  Returns 1 for a listener without
  * paced output, or when the timer fired early and the connection was put
  * back into hpts.  Otherwise returns whatever the timeout handler returned.
  */
 static int
 bbr_process_timers(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts, uint8_t hpts_calling)
 {
 	int32_t pending = (bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK);
 	int32_t rv = 0;
 
 	if (pending == 0)
 		return (0);
 	if (tp->t_state == TCPS_LISTEN) {
 		/* no timers on listen sockets */
 		return ((bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT) ? 0 : 1);
 	}
 	if (TSTMP_LT(cts, bbr->r_ctl.rc_timer_exp)) {
 		uint32_t remaining;
 
 		/* The timer has not expired yet. */
 		if (bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT) {
 			rv = -1;
 			bbr_log_to_processing(bbr, cts, rv, 0, hpts_calling);
 			return (0);
 		}
 		if (hpts_calling == 0) {
 			rv = -2;
 			bbr_log_to_processing(bbr, cts, rv, 0, hpts_calling);
 			return (0);
 		}
 		/*
 		 * Called from hpts with no paced output: a false alarm.
 		 * Sleep for the time that is left.
 		 */
 		remaining = bbr->r_ctl.rc_timer_exp - cts;
 		rv = -3;
 		bbr_log_to_processing(bbr, cts, rv, remaining, hpts_calling);
 		tcp_hpts_insert(tp, HPTS_USEC_TO_SLOTS(remaining));
 		return (1);
 	}
 	bbr->rc_tmr_stopped = 0;
 	bbr->r_ctl.rc_hpts_flags &= ~PACE_TMR_MASK;
 	/* Only the first matching timer, in this priority order, is run. */
 	if (pending & PACE_TMR_DELACK) {
 		rv = bbr_timeout_delack(tp, bbr, cts);
 	} else if (pending & PACE_TMR_PERSIT) {
 		rv = bbr_timeout_persist(tp, bbr, cts);
 	} else if (pending & (PACE_TMR_RACK | PACE_TMR_TLP | PACE_TMR_RXT)) {
 		/* All three loss timers stamp the time they last fired. */
 		bbr->r_ctl.rc_tlp_rxt_last_time = cts;
 		if (pending & PACE_TMR_RACK)
 			rv = bbr_timeout_rack(tp, bbr, cts);
 		else if (pending & PACE_TMR_TLP)
 			rv = bbr_timeout_tlp(tp, bbr, cts);
 		else
 			rv = bbr_timeout_rxt(tp, bbr, cts);
 	} else if (pending & PACE_TMR_KEEP) {
 		rv = bbr_timeout_keepalive(tp, bbr, cts);
 	}
 	bbr_log_to_processing(bbr, cts, rv, pending, hpts_calling);
 	return (rv);
 }
 
 /*
  * Cancel any pending pacer timer.  The cancelled timer bits are remembered
  * in rc_tmr_stopped.  When the timer (rather than paced output) was what
  * had us in hpts, the connection is also removed from hpts and the
  * remaining pacing delay is shortened by the time already waited.
  */
 static void
 bbr_timer_cancel(struct tcp_bbr *bbr, int32_t line, uint32_t cts)
 {
 	uint8_t removed_from_hpts = 0;
 
 	if ((bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK) == 0)
 		return;
 
 	if ((bbr->rc_timer_first == 1) && tcp_in_hpts(bbr->rc_tp)) {
 		/*
 		 * The timer is scheduled ahead of the paced output, so
 		 * cancelling it means leaving hpts as well.
 		 */
 		removed_from_hpts = 1;
 		tcp_hpts_remove(bbr->rc_tp);
 		if (bbr->r_ctl.rc_last_delay_val) {
 			/* Keep the last hptsi delay in step. */
 			uint32_t elapsed;
 
 			elapsed = TSTMP_GT(cts, bbr->rc_pacer_started) ?
 			    (cts - bbr->rc_pacer_started) : 0;
 			if (elapsed < bbr->r_ctl.rc_last_delay_val) {
 				/* Cut down our slot time */
 				bbr->r_ctl.rc_last_delay_val -= elapsed;
 			} else {
 				bbr->r_ctl.rc_last_delay_val = 0;
 			}
 			bbr->rc_pacer_started = cts;
 		}
 	}
 	bbr->rc_timer_first = 0;
 	bbr_log_to_cancel(bbr, line, cts, removed_from_hpts);
 	bbr->rc_tmr_stopped = bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK;
 	bbr->r_ctl.rc_hpts_flags &= ~(PACE_TMR_MASK);
 }
 
 /*
  * Flag the connection so that all of its timers are treated as stopped.
  * Always returns 0.
  */
 static int
 bbr_stopall(struct tcpcb *tp)
 {
 	struct tcp_bbr *bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 
 	bbr->rc_all_timers_stopped = 1;
 	return (0);
 }
 
 /*
  * Return the last-sent time of the entry at the head of the transmit list.
  * If the list is empty, or its head is the caller's own entry (u_rsm),
  * return cts instead.
  */
 static uint32_t
 bbr_get_earliest_send_outstanding(struct tcp_bbr *bbr, struct bbr_sendmap *u_rsm, uint32_t cts)
 {
 	struct bbr_sendmap *oldest = TAILQ_FIRST(&bbr->r_ctl.rc_tmap);
 
 	if ((oldest != NULL) && (oldest != u_rsm))
 		return (oldest->r_tim_lastsent[oldest->r_rtr_cnt - 1]);
 	return (cts);
 }
 
 /*
  * Record a (re)transmission of an existing send-map entry: bump its send
  * count, stamp the send time, refresh the delivery snapshot stored in the
  * entry, and move it to the tail of the transmit-ordered list.
  */
 static void
 bbr_update_rsm(struct tcpcb *tp, struct tcp_bbr *bbr,
      struct bbr_sendmap *rsm, uint32_t cts, uint32_t pacing_time)
 {
 	/* The entry's boundaries are not changed in here. */
 	uint32_t seg_len = rsm->r_end - rsm->r_start;
 
 	rsm->r_dupack = 0;
 	rsm->r_rtr_cnt++;
 	if (rsm->r_rtr_cnt > BBR_NUM_OF_RETRANS) {
 		/* Out of timestamp slots: pin the count and flag it. */
 		rsm->r_flags |= BBR_OVERMAX;
 		rsm->r_rtr_cnt = BBR_NUM_OF_RETRANS;
 	}
 	/*
 	 * Sending it again takes off the collapsed-rwnd marker and the
 	 * marker left by the RXT timer when it cleared the "acked" flag.
 	 */
 	rsm->r_flags &= ~(BBR_RWND_COLLAPSED | BBR_RXT_CLEARED);
 	if (rsm->r_flags & BBR_MARKED_LOST) {
 		/* We have retransmitted, its no longer lost */
 		rsm->r_flags &= ~BBR_MARKED_LOST;
 		bbr->r_ctl.rc_lost_bytes -= seg_len;
 	}
 	if ((rsm->r_rtr_cnt > 1) && ((rsm->r_flags & BBR_TLP) == 0)) {
 		/* A retransmission that is not a tail-loss probe. */
 		bbr->r_ctl.rc_holes_rxt += seg_len;
 		rsm->r_rtr_bytes += seg_len;
 	}
 	rsm->r_tim_lastsent[rsm->r_rtr_cnt - 1] = cts;
 	rsm->r_pacing_delay = pacing_time;
 	rsm->r_delivered = bbr->r_ctl.rc_delivered;
 	rsm->r_ts_valid = bbr->rc_ts_valid;
 	if (bbr->rc_ts_valid)
 		rsm->r_del_ack_ts = bbr->r_ctl.last_inbound_ts;
 	rsm->r_app_limited = (bbr->r_ctl.r_app_limited_until != 0) ? 1 : 0;
 	rsm->r_bbr_state = (bbr->rc_bbr_state == BBR_STATE_PROBE_BW) ?
 	    bbr_state_val(bbr) : 8;
 	if (rsm->r_flags & BBR_ACKED) {
 		/* Probably MTU discovery messing with us */
 		uint32_t flags_before = rsm->r_flags;
 
 		rsm->r_flags &= ~BBR_ACKED;
 		bbr_log_type_rsmclear(bbr, cts, rsm, flags_before, __LINE__);
 		bbr->r_ctl.rc_sacked -= seg_len;
 		if (bbr->r_ctl.rc_sacked == 0)
 			bbr->r_ctl.rc_sacklast = NULL;
 	}
 	/* (Re)queue at the tail of the transmit-ordered list. */
 	if (rsm->r_in_tmap) {
 		TAILQ_REMOVE(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 	}
 	TAILQ_INSERT_TAIL(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 	rsm->r_in_tmap = 1;
 	if (rsm->r_flags & BBR_SACK_PASSED) {
 		/* We have retransmitted due to the SACK pass */
 		rsm->r_flags = (rsm->r_flags & ~BBR_SACK_PASSED) | BBR_WAS_SACKPASS;
 	}
 	/* Must follow the list move above: it looks at the list head. */
 	rsm->r_first_sent_time = bbr_get_earliest_send_outstanding(bbr, rsm, cts);
 	rsm->r_flight_at_send = ctf_flight_size(bbr->rc_tp,
 	    (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 	bbr->r_ctl.rc_next = TAILQ_NEXT(rsm, r_next);
 	/* Note whether the pacing gain was above or below unity. */
 	rsm->r_is_gain = (bbr->r_ctl.rc_bbr_hptsi_gain > BBR_UNIT) ? 1 : 0;
 	rsm->r_is_drain = (bbr->r_ctl.rc_bbr_hptsi_gain < BBR_UNIT) ? 1 : 0;
 	rsm->r_del_time = bbr->r_ctl.rc_del_time; /* TEMP GOOGLE CODE */
 }
 
 /*
  * Account for a (re)transmission that starts at rsm->r_start and covers
  * *lenp bytes.
  *
  * Returns 0 with *lenp set to 0 when the send ended inside or exactly at
  * the end of this entry (or when no entry could be allocated for a split).
  * When the send ran past the end of the entry, returns rsm->r_end and
  * leaves in *lenp the number of bytes that still need to be accounted for.
  */
 static uint32_t
 bbr_update_entry(struct tcpcb *tp, struct tcp_bbr *bbr,
     struct bbr_sendmap *rsm, uint32_t cts, int32_t *lenp, uint32_t pacing_time)
 {
 	struct bbr_sendmap *tail;
 	int32_t sent = *lenp;
 	uint32_t sent_end = rsm->r_start + sent;
 
 	if (!SEQ_GEQ(sent_end, rsm->r_end)) {
 		/*
 		 * Only the front of the entry went out, so it has to be
 		 * split.  The original entry keeps the part that was sent
 		 * and the new one takes the unsent tail.  E.g. for a chunk
 		 * 1, 11 (10 bytes) of which 5 bytes were sent, the original
 		 * shrinks to 1, 6 and the new piece is 6, 11.
 		 */
 		tail = bbr_alloc_full_limit(bbr);
 		if (tail != NULL) {
 			bbr_clone_rsm(bbr, tail, rsm, sent_end);
 			TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_map, rsm, tail, r_next);
 			tail->r_dupack = 0;
 			if (rsm->r_in_tmap) {
 				TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, rsm, tail, r_tnext);
 				tail->r_in_tmap = 1;
 			}
 			/* The front piece no longer carries the FIN flag. */
 			rsm->r_flags &= (~BBR_HAS_FIN);
 			bbr_update_rsm(tp, bbr, rsm, cts, pacing_time);
 		}
 		*lenp = 0;
 		return (0);
 	}
 	/* The whole entry, and possibly more, was sent. */
 	bbr_update_rsm(tp, bbr, rsm, cts, pacing_time);
 	if (sent_end == rsm->r_end) {
 		*lenp = 0;
 		return (0);
 	}
 	/* Hangs over the end: hand back what is left. */
 	*lenp = sent - (int32_t)(rsm->r_end - rsm->r_start);
 	return (rsm->r_end);
 }
 
 static uint64_t
 bbr_get_hardware_rate(struct tcp_bbr *bbr)
 {
 	uint64_t bw;
 
 	bw = bbr_get_bw(bbr);
 	bw *= (uint64_t)bbr_hptsi_gain[BBR_SUB_GAIN];
 	bw /= (uint64_t)BBR_UNIT;
 	return(bw);
 }
 
 /*
  * Called when the hardware granted less than a full gain's worth of rate
  * (act_rate).  Sets skip_gain / gain_is_limited accordingly and, when even
  * the filtered delivery rate is not reachable, pulls that filter down.
  */
 static void
 bbr_setup_less_of_rate(struct tcp_bbr *bbr, uint32_t cts,
 		       uint64_t act_rate, uint64_t rate_wanted)
 {
 	uint64_t excess;
 
 	if (get_filter_value(&bbr->r_ctl.rc_delrate) < act_rate) {
 		/* The real rate fits; only the gain has to be lowered. */
 		bbr->skip_gain = 0;
 		bbr->gain_is_limited = 1;
 		return;
 	}
 	/* we can't even get the real rate */
 	bbr->skip_gain = 1;
 	bbr->gain_is_limited = 0;
 	excess = get_filter_value(&bbr->r_ctl.rc_delrate) - act_rate;
 	if (excess != 0)
 		filter_reduce_by(&bbr->r_ctl.rc_delrate, excess, cts);
 }
 
 /*
  * Ask the hardware rate-limit layer to move this connection to the rate
  * returned by bbr_get_hardware_rate().
  *
  * Does nothing when no hardware rate entry is attached (crte == NULL).  If
  * the route or its interface is gone, or no new rate entry can be obtained,
  * hardware pacing is switched off for this connection and the TSO size is
  * recomputed.  When a different rate entry is returned, the gain-limit
  * flags are updated to reflect whether the granted rate covers the request.
  */
 static void
 bbr_update_hardware_pacing_rate(struct tcp_bbr *bbr, uint32_t cts)
 {
 	const struct tcp_hwrate_limit_table *nrte;
 	/*
 	 * The rate is a 64-bit bytes-per-second value.  Holding it in an int
 	 * truncated large rates and skewed the comparison against
 	 * crte->rate below.
 	 */
 	uint64_t rate;
 	int error = 0;
 
 	if (bbr->r_ctl.crte == NULL)
 		return;
 	if ((bbr->rc_inp->inp_route.ro_nh == NULL) ||
 	    (bbr->rc_inp->inp_route.ro_nh->nh_ifp == NULL)) {
 		/* Lost our routes? */
 		/* Clear the way for a re-attempt */
 		bbr->bbr_attempt_hdwr_pace = 0;
 lost_rate:
 		/* Fall back to software-only pacing. */
 		bbr->gain_is_limited = 0;
 		bbr->skip_gain = 0;
 		bbr->bbr_hdrw_pacing = 0;
 		counter_u64_add(bbr_flows_whdwr_pacing, -1);
 		counter_u64_add(bbr_flows_nohdwr_pacing, 1);
 		tcp_bbr_tso_size_check(bbr, cts);
 		return;
 	}
 	rate = bbr_get_hardware_rate(bbr);
 	nrte = tcp_chg_pacing_rate(bbr->r_ctl.crte,
 				   bbr->rc_tp,
 				   bbr->rc_inp->inp_route.ro_nh->nh_ifp,
 				   rate,
 				   (RS_PACING_GEQ|RS_PACING_SUB_OK),
 				   &error, NULL);
 	if (nrte == NULL) {
 		goto lost_rate;
 	}
 	if (nrte != bbr->r_ctl.crte) {
 		/* nrte is non-NULL here, so crte is too from now on. */
 		bbr->r_ctl.crte = nrte;
 		if (error == 0)  {
 			BBR_STAT_INC(bbr_hdwr_rl_mod_ok);
 			if (bbr->r_ctl.crte->rate < rate) {
 				/* We have a problem */
 				bbr_setup_less_of_rate(bbr, cts,
 						       bbr->r_ctl.crte->rate, rate);
 			} else {
 				/* We are good */
 				bbr->gain_is_limited = 0;
 				bbr->skip_gain = 0;
 			}
 		} else {
 			/* A failure should release the tag */
 			BBR_STAT_INC(bbr_hdwr_rl_mod_fail);
 			bbr->gain_is_limited = 0;
 			bbr->skip_gain = 0;
 			bbr->bbr_hdrw_pacing = 0;
 		}
 		bbr_type_log_hdwr_pacing(bbr,
 					 bbr->r_ctl.crte->ptbl->rs_ifp,
 					 rate,
 					 bbr->r_ctl.crte->rate,
 					 __LINE__,
 					 cts,
 					 error);
 	}
 }
 
 /*
  * When hardware pacing is active, possibly enlarge the TSO burst size
  * (rc_pace_max_segs, in bytes) so that the software pacer hands the
  * hardware bigger bursts.  The burst is never made smaller here and is
  * capped at PACE_MAX_IP_BYTES - maxseg.
  *
  * Nothing is done when hardware pacing is off, the connection is in
  * recovery, no rate entry is attached, hw_pacing_set is still 0, or
  * bbr_hdwr_pace_adjust is 0.
  */
 static void
 bbr_adjust_for_hw_pacing(struct tcp_bbr *bbr, uint32_t cts)
 {
 	const struct tcp_hwrate_limit_table *rlp;
 	uint32_t cur_delay, seg_sz, maxseg, new_tso, delta, hdwr_delay;
 
 	if ((bbr->bbr_hdrw_pacing == 0) ||
 	    (IN_RECOVERY(bbr->rc_tp->t_flags)) ||
 	    (bbr->r_ctl.crte == NULL))
 		return;
 	if (bbr->hw_pacing_set == 0) {
 		/* Not yet by the hdwr pacing count delay */
 		return;
 	}
 	if (bbr_hdwr_pace_adjust == 0) {
 		/* No adjustment */
 		return;
 	}
 	rlp = bbr->r_ctl.crte;
 	/* Payload bytes per segment once the last option length is removed. */
 	if (bbr->rc_tp->t_maxseg > bbr->rc_last_options)
 		maxseg = bbr->rc_tp->t_maxseg - bbr->rc_last_options;
 	else
 		maxseg = BBR_MIN_SEG - bbr->rc_last_options;
 	/*
 	 * So lets first get the
 	 * time we will take between
 	 * TSO sized sends currently without
 	 * hardware help.
 	 */
 	cur_delay = bbr_get_pacing_delay(bbr, BBR_UNIT,
 		        bbr->r_ctl.rc_pace_max_segs, cts, 1);
 	/* Time the hardware takes to pace out the same burst. */
 	hdwr_delay = bbr->r_ctl.rc_pace_max_segs / maxseg;
 	hdwr_delay *= rlp->time_between;
 	if (cur_delay > hdwr_delay)
 		delta = cur_delay - hdwr_delay;
 	else
 		delta = 0;
 	bbr_log_type_tsosize(bbr, cts, delta, cur_delay, hdwr_delay,
 			     (bbr->r_ctl.rc_pace_max_segs / maxseg),
 			     1);
 	if (delta &&
 	    (delta < (max(rlp->time_between,
 			  bbr->r_ctl.bbr_hptsi_segments_delay_tar)))) {
 		/*
 		 * Now lets divide by the pacing
 		 * time between each segment the
 		 * hardware sends rounding up and
 		 * derive a bytes from that. We multiply
 		 * that by bbr_hdwr_pace_adjust to get
 		 * more bang for our buck.
 		 *
 		 * The goal is to have the software pacer
 		 * waiting no more than an additional
 		 * pacing delay if we can (without the
 		 * compensation i.e. x bbr_hdwr_pace_adjust).
 		 */
 		/* seg_sz is a segment count until the final multiply. */
 		seg_sz = max(((cur_delay + rlp->time_between)/rlp->time_between),
 			     (bbr->r_ctl.rc_pace_max_segs/maxseg));
 		seg_sz *= bbr_hdwr_pace_adjust;
 		if (bbr_hdwr_pace_floor &&
 		    (seg_sz < rlp->ptbl->rs_min_seg)) {
 			/* Currently hardware paces
 			 * out rs_min_seg segments at a time.
 			 * We need to make sure we always send at least
 			 * a full burst of bbr_hdwr_pace_floor down.
 			 */
 			seg_sz = rlp->ptbl->rs_min_seg;
 		}
 		seg_sz *= maxseg;
 	} else if (delta == 0) {
 		/*
 		 * The highest pacing rate is
 		 * above our b/w gained. This means
 		 * we probably are going quite fast at
 		 * the hardware highest rate. Lets just multiply
 		 * the calculated TSO size by the
 		 * multiplier factor (its probably
 		 * 4 segments in the default config for
 		 * mlx).
 		 */
 		seg_sz = bbr->r_ctl.rc_pace_max_segs * bbr_hdwr_pace_adjust;
 		/*
 		 * seg_sz is in bytes in this branch, while rs_min_seg is a
 		 * segment count, so the floor is scaled by maxseg before it
 		 * is compared and applied.  Comparing bytes against a
 		 * segment count meant the floor never took effect here.
 		 */
 		if (bbr_hdwr_pace_floor &&
 		    (seg_sz < (rlp->ptbl->rs_min_seg * maxseg))) {
 			/* Currently hardware paces
 			 * out rs_min_seg segments at a time.
 			 * We need to make sure we always send at least
 			 * a full burst of bbr_hdwr_pace_floor down.
 			 */
 			seg_sz = rlp->ptbl->rs_min_seg * maxseg;
 		}
 	} else {
 		/*
 		 * The pacing time difference is so
 		 * big that the hardware will
 		 * pace out more rapidly then we
 		 * really want and then we
 		 * will have a long delay. Lets just keep
 		 * the same TSO size so its as if
 		 * we were not using hdwr pacing (we
 		 * just gain a bit of spacing from the
 		 * hardware if seg_sz > 1).
 		 */
 		seg_sz = bbr->r_ctl.rc_pace_max_segs;
 	}
 	/* Only ever grow the burst, and keep it under the IP size limit. */
 	if (seg_sz > bbr->r_ctl.rc_pace_max_segs)
 		new_tso = seg_sz;
 	else
 		new_tso = bbr->r_ctl.rc_pace_max_segs;
 	if (new_tso >= (PACE_MAX_IP_BYTES-maxseg))
 		new_tso = PACE_MAX_IP_BYTES - maxseg;
 
 	if (new_tso != bbr->r_ctl.rc_pace_max_segs) {
 		bbr_log_type_tsosize(bbr, cts, new_tso, 0, bbr->r_ctl.rc_pace_max_segs, maxseg, 0);
 		bbr->r_ctl.rc_pace_max_segs = new_tso;
 	}
 }
 
 /*
  * Recompute the TSO burst size, rc_pace_max_segs (in bytes), for this
  * connection and then let bbr_adjust_for_hw_pacing() refine it.
  *
  * Before the initial window has been acked (rc_past_init_win == 0) the size
  * is a fixed choice based on the connection's configuration.  After that it
  * is derived from the current bandwidth estimate using the branch chain
  * described in the comment below.
  */
 static void
 tcp_bbr_tso_size_check(struct tcp_bbr *bbr, uint32_t cts)
 {
 	uint64_t bw;
 	uint32_t old_tso = 0, new_tso;
 	uint32_t maxseg, bytes;
 	uint32_t tls_seg=0;
 	/*
 	 * Google/linux uses the following algorithm to determine
 	 * the TSO size based on the b/w of the link (from Neal Cardwell email 9/27/18):
 	 *
 	 *  bytes = bw_in_bytes_per_second / 1000
 	 *  bytes = min(bytes, 64k)
 	 *  tso_segs = bytes / MSS
 	 *  if (bw < 1.2Mbs)
 	 *      min_tso_segs = 1
 	 *  else
 	 *	min_tso_segs = 2
 	 * tso_segs = max(tso_segs, min_tso_segs)
 	 *
 	 * * Note apply a device specific limit (we apply this in the
 	 *   tcp_m_copym).
 	 * Note that before the initial measurement is made google bursts out
 	 * a full iwnd just like new-reno/cubic.
 	 *
 	 * We do not use this algorithm. Instead we
 	 * use a two phased approach:
 	 *
 	 *  if ( bw <= per-tcb-cross-over)
 	 *     goal_tso =  calculate how much with this bw we
 	 *                 can send in goal-time seconds.
 	 *     if (goal_tso > mss)
 	 *         seg = goal_tso / mss
 	 *         tso = seg * mss
 	 *     else
 	 *         tso = mss
 	 *     if (tso > per-tcb-max)
 	 *         tso = per-tcb-max
 	 *  else if ( bw > 512Mbps)
 	 *     tso = max-tso (64k/mss)
 	 *  else
 	 *     goal_tso = bw / per-tcb-divisor
 	 *     seg = (goal_tso + mss-1)/mss
 	 *     tso = seg * mss
 	 *
 	 * if (tso < per-tcb-floor)
 	 *    tso = per-tcb-floor
 	 * if (tso > per-tcb-utter_max)
 	 *    tso = per-tcb-utter_max
 	 *
 	 * Note the default per-tcb-divisor is 1000 (same as google).
 	 * the goal cross over is 30Mbps however. To recreate googles
 	 * algorithm you need to set:
 	 *
 	 * cross-over = 23,168,000 bps
 	 * goal-time = 18000
 	 * per-tcb-max = 2
 	 * per-tcb-divisor = 1000
 	 * per-tcb-floor = 1
 	 *
 	 * This will get you "google bbr" behavior with respect to tso size.
 	 *
 	 * Note we do not set any TSO size until we are past the initial
 	 * window. Before that we generally use either a single MSS
 	 * or we use the full IW size (so we burst a IW at a time)
 	 */
 
 	/* Payload bytes per segment once the last option length is removed. */
 	if (bbr->rc_tp->t_maxseg > bbr->rc_last_options) {
 		maxseg = bbr->rc_tp->t_maxseg - bbr->rc_last_options;
 	} else {
 		maxseg = BBR_MIN_SEG - bbr->rc_last_options;
 	}
 	old_tso = bbr->r_ctl.rc_pace_max_segs;
 	if (bbr->rc_past_init_win == 0) {
 		/*
 		 * Not enough data has been acknowledged to make a
 		 * judgement. Set up the initial TSO based on if we
 		 * are sending a full IW at once or not.
 		 */
 		if (bbr->rc_use_google)
 			bbr->r_ctl.rc_pace_max_segs = ((bbr->rc_tp->t_maxseg - bbr->rc_last_options) * 2);
 		else if (bbr->bbr_init_win_cheat)
 			bbr->r_ctl.rc_pace_max_segs = bbr_initial_cwnd(bbr, bbr->rc_tp);
 		else
 			bbr->r_ctl.rc_pace_max_segs = bbr->rc_tp->t_maxseg - bbr->rc_last_options;
 		if (bbr->r_ctl.rc_pace_min_segs != bbr->rc_tp->t_maxseg)
 			bbr->r_ctl.rc_pace_min_segs = bbr->rc_tp->t_maxseg;
 		if (bbr->r_ctl.rc_pace_max_segs == 0) {
 			bbr->r_ctl.rc_pace_max_segs = maxseg;
 		}
 		bbr_log_type_tsosize(bbr, cts, bbr->r_ctl.rc_pace_max_segs, tls_seg, old_tso, maxseg, 0);
 			/* Despite the extra indent this call is unconditional. */
 			bbr_adjust_for_hw_pacing(bbr, cts);
 		return;
 	}
 	/**
 	 * Now lets set the TSO goal based on our delivery rate in
 	 * bytes per second. Note we only do this if
 	 * we have acked at least the initial cwnd worth of data.
 	 */
 	bw = bbr_get_bw(bbr);
 	if (IN_RECOVERY(bbr->rc_tp->t_flags) &&
 	     (bbr->rc_use_google == 0)) {
 		/* We clamp to one MSS in recovery */
 		new_tso = maxseg;
 	} else if (bbr->rc_use_google) {
 		int min_tso_segs;
 
 		/* Google considers the gain too */
 		if (bbr->r_ctl.rc_bbr_hptsi_gain != BBR_UNIT) {
 			bw *= bbr->r_ctl.rc_bbr_hptsi_gain;
 			bw /= BBR_UNIT;
 		}
 		/*
 		 * NOTE(review): the algorithm description above divides by
 		 * 1000, while the code divides by 1024 -- confirm which is
 		 * meant.
 		 */
 		bytes = bw / 1024;
 		if (bytes > (64 * 1024))
 			bytes = 64 * 1024;
 		new_tso = bytes / maxseg;
 		if (bw < ONE_POINT_TWO_MEG)
 			min_tso_segs = 1;
 		else
 			min_tso_segs = 2;
 		if (new_tso < min_tso_segs)
 			new_tso = min_tso_segs;
 		/* Convert the segment count back to bytes. */
 		new_tso *= maxseg;
 	} else if (bbr->rc_no_pacing) {
 		/* Not pacing: the largest whole number of segments allowed. */
 		new_tso = (PACE_MAX_IP_BYTES / maxseg) * maxseg;
 	} else if (bw <= bbr->r_ctl.bbr_cross_over) {
 		/*
 		 * Calculate the worse case b/w TSO if we are inserting no
 		 * more than a delay_target number of TSO's.
 		 */
 		uint32_t tso_len, min_tso;
 
 		tso_len = bbr_get_pacing_length(bbr, BBR_UNIT, bbr->r_ctl.bbr_hptsi_segments_delay_tar, bw);
 		if (tso_len > maxseg) {
 			/* Whole segments, capped at bbr_hptsi_segments_max. */
 			new_tso = tso_len / maxseg;
 			if (new_tso > bbr->r_ctl.bbr_hptsi_segments_max)
 				new_tso = bbr->r_ctl.bbr_hptsi_segments_max;
 			new_tso *= maxseg;
 		} else {
 			/*
 			 * less than a full sized frame yikes.. long rtt or
 			 * low bw?
 			 */
 			min_tso = bbr_minseg(bbr);
 			if ((tso_len > min_tso) && (bbr_all_get_min == 0))
 				new_tso = rounddown(tso_len, min_tso);
 			else
 				new_tso = min_tso;
 		}
 	} else if (bw > FIVETWELVE_MBPS) {
 		/*
 		 * This guy is so fast b/w wise that we can TSO as large as
 		 * possible of segments that the NIC will allow.
 		 */
 		new_tso = rounddown(PACE_MAX_IP_BYTES, maxseg);
 	} else {
 		/*
 		 * This formula is based on attempting to send a segment or
 		 * more every bbr_hptsi_per_second. The default is 1000
 		 * which means you are targeting what you can send every 1ms
 		 * based on the peers bw.
 		 *
 		 * If the number drops to say 500, then you are looking more
 		 * at 2ms and you will raise how much we send in a single
 		 * TSO thus saving CPU (less bbr_output_wtime() calls). The
 		 * trade off of course is you will send more at once and
 		 * thus tend to clump up the sends into larger "bursts"
 		 * building a queue.
 		 */
 		bw /= bbr->r_ctl.bbr_hptsi_per_second;
 		new_tso = roundup(bw, (uint64_t)maxseg);
 		/*
 		 * Gate the floor to match what our lower than 48Mbps
 		 * algorithm does. The ceiling (bbr_hptsi_segments_max) thus
 		 * becomes the floor for this calculation.
 		 */
 		if (new_tso < (bbr->r_ctl.bbr_hptsi_segments_max * maxseg))
 			new_tso = (bbr->r_ctl.bbr_hptsi_segments_max * maxseg);
 	}
 	/* Apply the configured floor (in segments), when one is set. */
 	if (bbr->r_ctl.bbr_hptsi_segments_floor && (new_tso < (maxseg * bbr->r_ctl.bbr_hptsi_segments_floor)))
 		new_tso = maxseg * bbr->r_ctl.bbr_hptsi_segments_floor;
 	if (new_tso > PACE_MAX_IP_BYTES)
 		new_tso = rounddown(PACE_MAX_IP_BYTES, maxseg);
 	/* Enforce an utter maximum. */
 	if (bbr->r_ctl.bbr_utter_max && (new_tso > (bbr->r_ctl.bbr_utter_max * maxseg))) {
 		new_tso = bbr->r_ctl.bbr_utter_max * maxseg;
 	}
 	if (old_tso != new_tso) {
 		/* Only log changes */
 		bbr_log_type_tsosize(bbr, cts, new_tso, tls_seg, old_tso, maxseg, 0);
 		bbr->r_ctl.rc_pace_max_segs = new_tso;
 	}
 	/* We have hardware pacing! */
 	bbr_adjust_for_hw_pacing(bbr, cts);
 }
 
 static void
 bbr_log_output(struct tcp_bbr *bbr, struct tcpcb *tp, struct tcpopt *to, int32_t len,
     uint32_t seq_out, uint16_t th_flags, int32_t err, uint32_t cts,
     struct mbuf *mb, int32_t * abandon, struct bbr_sendmap *hintrsm, uint32_t delay_calc,
     struct sockbuf *sb)
 {
 
 	struct bbr_sendmap *rsm, *nrsm;
 	register uint32_t snd_max, snd_una;
 	uint32_t pacing_time;
 	/*
 	 * Add to the RACK log of packets in flight or retransmitted. If
 	 * there is a TS option we will use the TS echoed, if not we will
 	 * grab a TS.
 	 *
 	 * Retransmissions will increment the count and move the ts to its
 	 * proper place. Note that if options do not include TS's then we
 	 * won't be able to effectively use the ACK for an RTT on a retran.
 	 *
 	 * Notes about r_start and r_end. Lets consider a send starting at
 	 * sequence 1 for 10 bytes. In such an example the r_start would be
 	 * 1 (starting sequence) but the r_end would be r_start+len i.e. 11.
 	 * This means that r_end is actually the first sequence for the next
 	 * slot (11).
 	 *
 	 */
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	if (err) {
 		/*
 		 * We don't log errors -- we could but snd_max does not
 		 * advance in this case either.
 		 */
 		return;
 	}
 	if (th_flags & TH_RST) {
 		/*
 		 * We don't log resets and we return immediately from
 		 * sending
 		 */
 		*abandon = 1;
 		return;
 	}
 	snd_una = tp->snd_una;
 	if (th_flags & (TH_SYN | TH_FIN) && (hintrsm == NULL)) {
 		/*
 		 * The call to bbr_log_output is made before bumping
 		 * snd_max. This means we can record one extra byte on a SYN
 		 * or FIN if seq_out is adding more on and a FIN is present
 		 * (and we are not resending).
 		 */
 		if ((th_flags & TH_SYN) && (tp->iss == seq_out))
 			len++;
 		if (th_flags & TH_FIN)
 			len++;
 	}
 	if (SEQ_LEQ((seq_out + len), snd_una)) {
 		/* Are sending an old segment to induce an ack (keep-alive)? */
 		return;
 	}
 	if (SEQ_LT(seq_out, snd_una)) {
 		/* huh? should we panic? */
 		uint32_t end;
 
 		end = seq_out + len;
 		seq_out = snd_una;
 		len = end - seq_out;
 	}
 	snd_max = tp->snd_max;
 	if (len == 0) {
 		/* We don't log zero window probes */
 		return;
 	}
 	pacing_time = bbr_get_pacing_delay(bbr, bbr->r_ctl.rc_bbr_hptsi_gain, len, cts, 1);
 	/* First question is it a retransmission? */
 	if (seq_out == snd_max) {
 again:
 		rsm = bbr_alloc(bbr);
 		if (rsm == NULL) {
 			return;
 		}
 		rsm->r_flags = 0;
 		if (th_flags & TH_SYN)
 			rsm->r_flags |= BBR_HAS_SYN;
 		if (th_flags & TH_FIN)
 			rsm->r_flags |= BBR_HAS_FIN;
 		rsm->r_tim_lastsent[0] = cts;
 		rsm->r_rtr_cnt = 1;
 		rsm->r_rtr_bytes = 0;
 		rsm->r_start = seq_out;
 		rsm->r_end = rsm->r_start + len;
 		rsm->r_dupack = 0;
 		rsm->r_delivered = bbr->r_ctl.rc_delivered;
 		rsm->r_pacing_delay = pacing_time;
 		rsm->r_ts_valid = bbr->rc_ts_valid;
 		if (bbr->rc_ts_valid)
 			rsm->r_del_ack_ts = bbr->r_ctl.last_inbound_ts;
 		rsm->r_del_time = bbr->r_ctl.rc_del_time;
 		if (bbr->r_ctl.r_app_limited_until)
 			rsm->r_app_limited = 1;
 		else
 			rsm->r_app_limited = 0;
 		rsm->r_first_sent_time = bbr_get_earliest_send_outstanding(bbr, rsm, cts);
 		rsm->r_flight_at_send = ctf_flight_size(bbr->rc_tp,
 						(bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 		/*
 		 * Here we must also add in this rsm since snd_max
 		 * is updated after we return from a new send.
 		 */
 		rsm->r_flight_at_send += len;
 		TAILQ_INSERT_TAIL(&bbr->r_ctl.rc_map, rsm, r_next);
 		TAILQ_INSERT_TAIL(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 		rsm->r_in_tmap = 1;
 		if (bbr->rc_bbr_state == BBR_STATE_PROBE_BW)
 			rsm->r_bbr_state = bbr_state_val(bbr);
 		else
 			rsm->r_bbr_state = 8;
 		if (bbr->r_ctl.rc_bbr_hptsi_gain > BBR_UNIT) {
 			rsm->r_is_gain = 1;
 			rsm->r_is_drain = 0;
 		} else if (bbr->r_ctl.rc_bbr_hptsi_gain < BBR_UNIT) {
 			rsm->r_is_drain = 1;
 			rsm->r_is_gain = 0;
 		} else {
 			rsm->r_is_drain = 0;
 			rsm->r_is_gain = 0;
 		}
 		return;
 	}
 	/*
 	 * If we reach here its a retransmission and we need to find it.
 	 */
 more:
 	if (hintrsm && (hintrsm->r_start == seq_out)) {
 		rsm = hintrsm;
 		hintrsm = NULL;
 	} else if (bbr->r_ctl.rc_next) {
 		/* We have a hint from a previous run */
 		rsm = bbr->r_ctl.rc_next;
 	} else {
 		/* No hints sorry */
 		rsm = NULL;
 	}
 	if ((rsm) && (rsm->r_start == seq_out)) {
 		/*
 		 * We used rc_next or hintrsm  to retransmit, hopefully the
 		 * likely case.
 		 */
 		seq_out = bbr_update_entry(tp, bbr, rsm, cts, &len, pacing_time);
 		if (len == 0) {
 			return;
 		} else {
 			goto more;
 		}
 	}
 	/* Ok it was not the last pointer go through it the hard way. */
 	TAILQ_FOREACH(rsm, &bbr->r_ctl.rc_map, r_next) {
 		if (rsm->r_start == seq_out) {
 			seq_out = bbr_update_entry(tp, bbr, rsm, cts, &len, pacing_time);
 			bbr->r_ctl.rc_next = TAILQ_NEXT(rsm, r_next);
 			if (len == 0) {
 				return;
 			} else {
 				continue;
 			}
 		}
 		if (SEQ_GEQ(seq_out, rsm->r_start) && SEQ_LT(seq_out, rsm->r_end)) {
 			/* Transmitted within this piece */
 			/*
 			 * Ok we must split off the front and then let the
 			 * update do the rest
 			 */
 			nrsm = bbr_alloc_full_limit(bbr);
 			if (nrsm == NULL) {
 				bbr_update_rsm(tp, bbr, rsm, cts, pacing_time);
 				return;
 			}
 			/*
 			 * copy rsm to nrsm and then trim the front of rsm
 			 * to not include this part.
 			 */
 			bbr_clone_rsm(bbr, nrsm, rsm, seq_out);
 			TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_map, rsm, nrsm, r_next);
 			if (rsm->r_in_tmap) {
 				TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, rsm, nrsm, r_tnext);
 				nrsm->r_in_tmap = 1;
 			}
 			rsm->r_flags &= (~BBR_HAS_FIN);
 			seq_out = bbr_update_entry(tp, bbr, nrsm, cts, &len, pacing_time);
 			if (len == 0) {
 				return;
 			}
 		}
 	}
 	/*
 	 * Hmm not found in map did they retransmit both old and on into the
 	 * new?
 	 */
 	if (seq_out == tp->snd_max) {
 		goto again;
 	} else if (SEQ_LT(seq_out, tp->snd_max)) {
 #ifdef BBR_INVARIANTS
 		printf("seq_out:%u len:%d snd_una:%u snd_max:%u -- but rsm not found?\n",
 		    seq_out, len, tp->snd_una, tp->snd_max);
 		printf("Starting Dump of all rack entries\n");
 		TAILQ_FOREACH(rsm, &bbr->r_ctl.rc_map, r_next) {
 			printf("rsm:%p start:%u end:%u\n",
 			    rsm, rsm->r_start, rsm->r_end);
 		}
 		printf("Dump complete\n");
 		panic("seq_out not found rack:%p tp:%p",
 		    bbr, tp);
 #endif
 	} else {
 #ifdef BBR_INVARIANTS
 		/*
 		 * Hmm beyond sndmax? (only if we are using the new rtt-pack
 		 * flag)
 		 */
 		panic("seq_out:%u(%d) is beyond snd_max:%u tp:%p",
 		    seq_out, len, tp->snd_max, tp);
 #endif
 	}
 }
 
 /*
  * The cum-ack moved, so collapse the timeout back: zero t_rxtshift and
  * clear t_softerror on the tcpcb.  Neither bbr nor rtt is consulted.
  */
 static void
 bbr_collapse_rtt(struct tcpcb *tp, struct tcp_bbr *bbr, int32_t rtt)
 {
 	tp->t_softerror = 0;
 	tp->t_rxtshift = 0;
 }
 
 /*
  * Stash a pending RTT sample in the bbr control block and flag it as
  * valid (rtt_valid) so that tcp_bbr_xmit_timer_commit() will pick it up.
  *
  * rtt_usecs and tsin are always recorded.  A zero rsm_send_time leaves
  * the previously stored cur_rtt_send_time untouched.  r_start is accepted
  * but not used here.
  */
 static void
 tcp_bbr_xmit_timer(struct tcp_bbr *bbr, uint32_t rtt_usecs, uint32_t rsm_send_time, uint32_t r_start, uint32_t tsin)
 {
 	if (rsm_send_time != 0)
 		bbr->r_ctl.cur_rtt_send_time = rsm_send_time;
 	bbr->r_ctl.ts_in = tsin;
 	bbr->r_ctl.cur_rtt = rtt_usecs;
 	bbr->rtt_valid = 1;
 }
 
 static void
 bbr_make_timestamp_determination(struct tcp_bbr *bbr)
 {
 	/**
 	 * Work out which unit the peer's TCP timestamp clock ticks in,
 	 * expressed as a multiple of our own usec clock.
 	 *
 	 * Inputs, all read from the bbr control block:
 	 * 1) bbr_ts_check_tstmp   - peer timestamp when we started observing cum-acks.
 	 * 2) bbr_ts_check_our_cts - our send time recorded at that same point.
 	 * 3) last_inbound_ts      - the peer timestamp that just came in.
 	 * 4) cur_rtt_send_time    - when the packet that generated this ack was sent.
 	 *
 	 * From those we form:
 	 *
 	 *   delta      = cur_rtt_send_time - bbr_ts_check_our_cts   (our send spacing)
 	 *   peer_delta = last_inbound_ts   - bbr_ts_check_tstmp     (peer's spacing)
 	 *
 	 * We expect delta > peer_delta, because our clock is in usec and the
 	 * peer's is most likely coarser.  The multiplier that brings peer_delta
 	 * up to delta (within a tolerance derived from bbr_delta_percent) is
 	 * stored in bbr_peer_tsratio: 1 for a usec peer, 10, 100, 1000 for a
 	 * msec peer, 10000 for a 10 msec peer.
 	 *
 	 * Timestamps are declared unusable (rc_ts_cant_be_used) when the
 	 * peer's clock runs faster than ours by more than the tolerance, or
 	 * when even the 10 msec multiplier cannot reach delta.  The latter
 	 * also covers a batching middle box that hands out time-slices of the
 	 * real b/w: we may have paced data out over 10ms while the peer saw
 	 * only 1ms between the packets, so its timestamps cannot be relied on.
 	 *
 	 * Nothing is decided until both deltas have reached their minimum
 	 * spread (bbr_min_usec_delta / bbr_min_peer_delta).
 	 */
 	static const uint32_t logged_ratios[] = { 1, 10, 100, 1000 };
 	uint64_t delta, peer_delta, scaled, slack;
 	unsigned int idx;
 	int usec_peer;
 
 	delta = bbr->r_ctl.cur_rtt_send_time - bbr->r_ctl.bbr_ts_check_our_cts;
 	if (delta < bbr_min_usec_delta) {
 		/* Our own send times are not yet far enough apart. */
 		return;
 	}
 	peer_delta = bbr->r_ctl.last_inbound_ts - bbr->r_ctl.bbr_ts_check_tstmp;
 	if (peer_delta < bbr_min_peer_delta) {
 		/*
 		 * Our spread is large enough but the peer's value has
 		 * barely moved (coarse tick, or some form of compression
 		 * on the path).  Wait for a larger spread.
 		 */
 		return;
 	}
 	if (peer_delta > delta) {
 		/*
 		 * Very unlikely: without any compensation the peer saw
 		 * the two sends further apart than we did in usec.
 		 * Within the tolerance we call it a usec clock, beyond
 		 * it the timestamps are unusable.
 		 */
 		slack = (delta * (uint64_t)1000) / (uint64_t)bbr_delta_percent;
 		usec_peer = (peer_delta < (delta + slack));
 		bbr->rc_ts_clock_set = 1;
 		if (usec_peer)
 			bbr->r_ctl.bbr_peer_tsratio = 1;
 		else
 			bbr->rc_ts_cant_be_used = 1;
 		return;
 	}
 	/* From here on the peer's spread is no larger than ours. */
 	bbr->rc_ts_clock_set = 1;
 	/*
 	 * Try usec, 10 usec, 100 usec and 1 msec (the most likely one) in
 	 * that order; the first multiplier that lifts peer_delta, plus its
 	 * tolerance, up to delta wins.
 	 */
 	for (idx = 0; idx < (sizeof(logged_ratios) / sizeof(logged_ratios[0])); idx++) {
 		scaled = peer_delta * logged_ratios[idx];
 		slack = (scaled * 1000) / (uint64_t)bbr_delta_percent;
 		if ((scaled + slack) >= delta) {
 			bbr->r_ctl.bbr_peer_tsratio = logged_ratios[idx];
 			bbr_log_tstmp_validation(bbr, peer_delta, delta);
 			return;
 		}
 	}
 	/* Last candidate is a 10 msec tick; this outcome is not logged. */
 	scaled = peer_delta * 10000;
 	slack = (scaled * 1000) / (uint64_t)bbr_delta_percent;
 	if ((scaled + slack) >= delta) {
 		bbr->r_ctl.bbr_peer_tsratio = 10000;
 		return;
 	}
 	/* The peer's clock ticks so slowly that we can't use it. */
 	bbr->rc_ts_cant_be_used = 1;
 	bbr->r_ctl.bbr_peer_tsratio = 0;
 	bbr_log_tstmp_validation(bbr, peer_delta, delta);
 }
 
 /*
  * Commit the RTT sample previously stashed by tcp_bbr_xmit_timer():
  * collect the new round-trip time estimate and update the averages
  * (t_srtt, t_rttvar) and the current retransmit timeout (t_rxtcur).
  *
  * bbr - BBR control block holding the pending sample (cur_rtt, ts_in).
  * tp  - the tcpcb whose smoothed RTT state is updated.
  * cts - current timestamp, passed to the rttProp filter helpers.
  *
  * Does nothing when no sample is pending (rtt_valid == 0).
  */
 static void
 tcp_bbr_xmit_timer_commit(struct tcp_bbr *bbr, struct tcpcb *tp, uint32_t cts)
 {
 	int32_t delta;
 	uint32_t rtt, tsin;
 	int32_t rtt_ticks;
 
 	if (bbr->rtt_valid == 0)
 		/* No valid sample */
 		return;
 
 	rtt = bbr->r_ctl.cur_rtt;
 	tsin = bbr->r_ctl.ts_in;
 	if (bbr->rc_prtt_set_ts) {
 		/*
 		 * We are to force feed the rttProp filter due
 		 * to an entry into PROBE_RTT. This assures
 		 * that the times are sync'd between when we
 		 * go into PROBE_RTT and the filter expiration.
 		 *
 		 * Google does not use a true filter, so they do
 		 * this implicitly since they only keep one value
 		 * and when they enter probe-rtt they update the
 		 * value to the newest rtt.
 		 *
 		 * The flag is one-shot: it is cleared here. A sample
 		 * above the current filter value raises the filter by
 		 * the difference; otherwise the sample is applied as a
 		 * new minimum.
 		 */
 		uint32_t rtt_prop;
 
 		bbr->rc_prtt_set_ts = 0;
 		rtt_prop = get_filter_value_small(&bbr->r_ctl.rc_rttprop);
 		if (rtt > rtt_prop)
 			filter_increase_by_small(&bbr->r_ctl.rc_rttprop, (rtt - rtt_prop), cts);
 		else
 			apply_filter_min_small(&bbr->r_ctl.rc_rttprop, rtt, cts);
 	}
 #ifdef STATS
 	stats_voi_update_abs_u32(tp->t_stats, VOI_TCP_PATHRTT, imax(0, rtt));
 #endif
 	/* Add the recorded ack delay to the sample when the ack was delayed. */
 	if (bbr->rc_ack_was_delayed)
 		rtt += bbr->r_ctl.rc_ack_hdwr_delay;
 
 	/* Track the lowest (delay-adjusted) sample seen. */
 	if (rtt < bbr->r_ctl.rc_lowest_rtt)
 		bbr->r_ctl.rc_lowest_rtt = rtt;
 	bbr_log_rtt_sample(bbr, rtt, tsin);
 	if (bbr->r_init_rtt) {
 		/*
 		 * The initial rtt is not-trusted, nuke it and lets get
 		 * our first valid measurement in. Zeroing t_srtt makes
 		 * the code below take the "no measurement yet" branch.
 		 */
 		bbr->r_init_rtt = 0;
 		tp->t_srtt = 0;
 	}
 	if ((bbr->rc_ts_clock_set == 0) && bbr->rc_ts_valid) {
 		/*
 		 * So we have not yet figured out
 		 * what the peers TSTMP value is
 		 * in (most likely ms). We need a
 		 * series of cum-ack's to determine
 		 * this reliably.
 		 */
 		if (bbr->rc_ack_is_cumack) {
 			if (bbr->rc_ts_data_set) {
 				/* Lets attempt to determine the timestamp granularity. */
 				bbr_make_timestamp_determination(bbr);
 			} else {
 				/*
 				 * First cum-ack of the series: record the
 				 * reference pair (peer timestamp, our send
 				 * time) that later samples are compared to.
 				 */
 				bbr->rc_ts_data_set = 1;
 				bbr->r_ctl.bbr_ts_check_tstmp = bbr->r_ctl.last_inbound_ts;
 				bbr->r_ctl.bbr_ts_check_our_cts = bbr->r_ctl.cur_rtt_send_time;
 			}
 		} else {
 			/*
 			 * We have to have consecutive acks
 			 * reset any "filled" state to none.
 			 */
 			bbr->rc_ts_data_set = 0;
 		}
 	}
 	/*
 	 * Round it up: bias the usec sample by (USECS_IN_MSEC - 1) before
 	 * converting to ticks, and never let the result be zero ticks.
 	 */
 	rtt_ticks = USEC_2_TICKS((rtt + (USECS_IN_MSEC - 1)));
 	if (rtt_ticks == 0)
 		rtt_ticks = 1;
 	if (tp->t_srtt != 0) {
 		/*
 		 * srtt is stored as fixed point scaled by 2^TCP_RTT_SHIFT
 		 * (see the initial assignment in the else branch below).
 		 * The following magic is equivalent to the smoothing
 		 * algorithm in rfc793 with an alpha of .875
 		 * (srtt = rtt/8 + srtt*7/8 in fixed point).
 		 * Adjust rtt to origin 0.
 		 *
 		 * NOTE(review): this comment used to read "5 bits after the
 		 * binary point (i.e., scaled by 8)", which contradicts
 		 * itself (5 bits is a scale of 32) -- confirm the intended
 		 * wording against the definition of TCP_RTT_SHIFT.
 		 */
 
 		delta = ((rtt_ticks - 1) << TCP_DELTA_SHIFT)
 		    - (tp->t_srtt >> (TCP_RTT_SHIFT - TCP_DELTA_SHIFT));
 
 		tp->t_srtt += delta;
 		if (tp->t_srtt <= 0)
 			tp->t_srtt = 1;
 
 		/*
 		 * We accumulate a smoothed rtt variance (actually, a
 		 * smoothed mean difference), then set the retransmit timer
 		 * to smoothed rtt + 4 times the smoothed variance. rttvar
 		 * is stored as fixed point with 4 bits after the binary
 		 * point (scaled by 16).  The following is equivalent to
 		 * rfc793 smoothing with an alpha of .75 (rttvar =
 		 * rttvar*3/4 + |delta| / 4).  This replaces rfc793's
 		 * wired-in beta.
 		 */
 		if (delta < 0)
 			delta = -delta;
 		delta -= tp->t_rttvar >> (TCP_RTTVAR_SHIFT - TCP_DELTA_SHIFT);
 		tp->t_rttvar += delta;
 		if (tp->t_rttvar <= 0)
 			tp->t_rttvar = 1;
 	} else {
 		/*
 		 * No rtt measurement yet - use the unsmoothed rtt. Set the
 		 * variance to half the rtt (so our first retransmit happens
 		 * at 3*rtt).
 		 */
 		tp->t_srtt = rtt_ticks << TCP_RTT_SHIFT;
 		tp->t_rttvar = rtt_ticks << (TCP_RTTVAR_SHIFT - 1);
 	}
 	KMOD_TCPSTAT_INC(tcps_rttupdated);
 	/* t_rttupdated saturates at UCHAR_MAX instead of wrapping. */
 	if (tp->t_rttupdated < UCHAR_MAX)
 		tp->t_rttupdated++;
 #ifdef STATS
 	stats_voi_update_abs_u32(tp->t_stats, VOI_TCP_RTT, imax(0, rtt_ticks));
 #endif
 	/*
 	 * the retransmit should happen at rtt + 4 * rttvar. Because of the
 	 * way we do the smoothing, srtt and rttvar will each average +1/2
 	 * tick of bias.  When we compute the retransmit timer, we want 1/2
 	 * tick of rounding and 1 extra tick because of +-1/2 tick
 	 * uncertainty in the firing of the timer.  The bias will give us
 	 * exactly the 1.5 tick we need.  But, because the bias is
 	 * statistical, we have to test that we don't drop below the minimum
 	 * feasible timer (which is 2 ticks).
 	 *
 	 * The lower bound passed below is the larger of the configured
 	 * minimum RTO (rc_min_rto_ms) and rtt_ticks + 2; the upper bound
 	 * is rc_max_rto_sec converted to ticks.
 	 */
 	TCPT_RANGESET(tp->t_rxtcur, TCP_REXMTVAL(tp),
 	    max(MSEC_2_TICKS(bbr->r_ctl.rc_min_rto_ms), rtt_ticks + 2),
 	    MSEC_2_TICKS(((uint32_t)bbr->rc_max_rto_sec) * 1000));
 
 	/*
 	 * We received an ack for a packet that wasn't retransmitted; it is
 	 * probably safe to discard any error indications we've received
 	 * recently.  This isn't quite right, but close enough for now (a
 	 * route might have failed after we sent a segment, and the return
 	 * path might not be symmetrical).
 	 */
 	tp->t_softerror = 0;
 	/*
 	 * Reuse rtt for the new smoothed value converted back to usec, and
 	 * remember the smallest srtt seen in the current state.
 	 */
 	rtt = (TICKS_2_USEC(bbr->rc_tp->t_srtt) >> TCP_RTT_SHIFT);
 	if (bbr->r_ctl.bbr_smallest_srtt_this_state > rtt)
 		bbr->r_ctl.bbr_smallest_srtt_this_state = rtt;
 }
 
 /*
  * Note that the RTT just shrank (rc_rtt_shrinks = cts) and decide what to
  * do about PROBE_RTT.  When forcing is enabled (bbr_can_force_probertt)
  * and more than rc_probertt_int has passed since last_in_probertt we
  * enter probe-rtt right away; in every other case the regular probe-rtt
  * limit check runs.
  *
  * The line argument is accepted but not used; this function's own
  * __LINE__ is what gets passed to bbr_enter_probe_rtt().
  */
 static void
 bbr_set_reduced_rtt(struct tcp_bbr *bbr, uint32_t cts, uint32_t line)
 {
 	bbr->r_ctl.rc_rtt_shrinks = cts;
 	if (!bbr_can_force_probertt ||
 	    !(TSTMP_GT(cts, bbr->r_ctl.last_in_probertt)) ||
 	    ((cts - bbr->r_ctl.last_in_probertt) <= bbr->r_ctl.rc_probertt_int)) {
 		/* Not forced, or not overdue: just run the limit check. */
 		bbr_check_probe_rtt_limits(bbr, cts);
 		return;
 	}
 	/* It has been too long since we were last in probe-rtt. */
 	bbr_enter_probe_rtt(bbr, cts, __LINE__);
 }
 
 /*
  * Feed the current delivery-rate measurement (rc_bbr_cur_del_rate) into
  * the rc_delrate max filter and react when the filter value moves.
  *
  * A zero measurement is logged (code 20) and otherwise ignored.  For a
  * non-zero measurement r_measurement_count is bumped (saturating at
  * 0xffffffff), the filter is updated and the before/after values are
  * logged (code 21).  If the filter went from zero to non-zero only the
  * TSO size is re-checked; if it changed from one non-zero value to
  * another the hardware pacing rate (when in use), the state target, the
  * TSO size and, during recovery, the reduced b/w are refreshed as well.
  */
 static void
 tcp_bbr_commit_bw(struct tcp_bbr *bbr, uint32_t cts)
 {
 	uint64_t prev_bw;
 
 	if (bbr->r_ctl.rc_bbr_cur_del_rate == 0) {
 		/* We never apply a zero measurement */
 		bbr_log_type_bbrupd(bbr, 20, cts, 0, 0,
 				    0, 0, 0, 0, 0, 0);
 		return;
 	}
 	if (bbr->r_ctl.r_measurement_count < 0xffffffff)
 		bbr->r_ctl.r_measurement_count++;
 	prev_bw = get_filter_value(&bbr->r_ctl.rc_delrate);
 	apply_filter_max(&bbr->r_ctl.rc_delrate, bbr->r_ctl.rc_bbr_cur_del_rate, bbr->r_ctl.rc_pkt_epoch);
 	bbr_log_type_bbrupd(bbr, 21, cts, (uint32_t)prev_bw,
 			    (uint32_t)get_filter_value(&bbr->r_ctl.rc_delrate),
 			    0, 0, 0, 0, 0, 0);
 	if (prev_bw == 0) {
 		/* First usable estimate: only the TSO size depends on it. */
 		if (get_filter_value(&bbr->r_ctl.rc_delrate))
 			tcp_bbr_tso_size_check(bbr, cts);
 		return;
 	}
 	if (prev_bw == get_filter_value(&bbr->r_ctl.rc_delrate)) {
 		/* The filter did not move, nothing to refresh. */
 		return;
 	}
 	if (bbr->bbr_hdrw_pacing) {
 		/*
 		 * Apply a new rate to the hardware
 		 * possibly.
 		 */
 		bbr_update_hardware_pacing_rate(bbr, cts);
 	}
 	bbr_set_state_target(bbr, __LINE__);
 	tcp_bbr_tso_size_check(bbr, cts);
 	if (bbr->r_recovery_bw)  {
 		bbr_setup_red_bw(bbr, cts);
 		bbr_log_type_bw_reduce(bbr, BBR_RED_BW_USELRBW);
 	}
 }
 
 /*
  * Non-google delivery-rate measurement for an acked sendmap entry.
  *
  * The rate is bytes delivered since rsm was sent, scaled to bytes per
  * second over the delivery-time span.  It may then be replaced by a rate
  * computed from the peer's timestamps (when those are usable and
  * rc_use_ts_limit is set) and is finally capped by the rate we were
  * actually sending at.  The result is stored in rc_bbr_cur_del_rate and
  * committed to the filter unless the entry was app-limited and the rate
  * does not exceed the current filter value.
  *
  * Nothing happens while in persist, or when the computed rate is zero.
  */
 static void
 bbr_nf_measurement(struct tcp_bbr *bbr, struct bbr_sendmap *rsm, uint32_t rtt, uint32_t cts)
 {
 	uint64_t elapsed, rate, peer_span, peer_rate;
 	uint32_t delivered;
 	int ts_reason;
 
 	if (bbr->rc_in_persist != 0) {
 		/* We log only when not in persist */
 		return;
 	}
 	/* Delivery-time span; falls back to 1 when time did not advance. */
 	elapsed = 1;
 	if (TSTMP_GT(bbr->r_ctl.rc_del_time, rsm->r_del_time))
 		elapsed = (uint64_t)(bbr->r_ctl.rc_del_time - rsm->r_del_time);
 	/* Translate to a Bytes Per Second */
 	delivered = (bbr->r_ctl.rc_delivered - rsm->r_delivered);
 	rate = ((uint64_t)delivered * (uint64_t)USECS_IN_SECOND) / elapsed;
 	if (rate == 0) {
 		/* We must have a calculatable amount */
 		return;
 	}
 	if (rsm->r_ts_valid &&
 	    bbr->rc_ts_valid &&
 	    bbr->rc_ts_clock_set &&
 	    (bbr->rc_ts_cant_be_used == 0) &&
 	    bbr->rc_use_ts_limit) {
 		/*
 		 * Span as seen by the peer: timestamp difference (at
 		 * least 1) widened to 64 bits and then scaled by the
 		 * peer's tick ratio.
 		 */
 		peer_span = max((bbr->r_ctl.last_inbound_ts - rsm->r_del_ack_ts), 1);
 		peer_span *= bbr->r_ctl.bbr_peer_tsratio;
 		if ((delivered != 0) && (rtt >= 1000)) {
 			peer_rate = ((uint64_t)delivered * (uint64_t)USECS_IN_SECOND) / peer_span;
 			bbr_log_type_bbrupd(bbr, 62, cts,
 					    (peer_rate >> 32),
 					    (peer_rate & 0xffffffff), 0, 0,
 					    0, 0, peer_span, delivered);
 			/*
 			 * Log code 8: the timestamp rate raises ours (only
 			 * if ts_can_raise).  Log code 7: a non-zero
 			 * timestamp rate lowers ours.  0: keep ours.
 			 */
 			ts_reason = 0;
 			if ((bbr->ts_can_raise) && (peer_rate > rate))
 				ts_reason = 8;
 			else if (peer_rate && (peer_rate < rate))
 				ts_reason = 7;
 			if (ts_reason != 0) {
 				bbr_log_type_bbrupd(bbr, ts_reason, cts,
 						    delivered,
 						    peer_span,
 						    (rate >> 32),
 						    (rate & 0x00000000ffffffff),
 						    0, 0, 0, 0);
 				rate = peer_rate;
 			}
 		} else {
 			/* Can't use the ts */
 			bbr_log_type_bbrupd(bbr, 61, cts,
 					    peer_span,
 					    bbr->r_ctl.last_inbound_ts,
 					    rsm->r_del_ack_ts, 0,
 					    0, 0, 0, delivered);
 		}
 	}
 	if (rsm->r_first_sent_time &&
 	    TSTMP_GT(rsm->r_tim_lastsent[(rsm->r_rtr_cnt -1)],rsm->r_first_sent_time)) {
 		uint64_t send_rate, send_span;
 		/*
 		 * Sending rate: what was in flight at the time of this
 		 * send (including this send), over the time from the
 		 * first outstanding send until this send plus this
 		 * send's pacing time.  We can not have delivered faster
 		 * than we sent.
 		 */
 		send_span = rsm->r_tim_lastsent[(rsm->r_rtr_cnt -1)] - rsm->r_first_sent_time;
 		send_span += rsm->r_pacing_delay;
 		send_rate = ((uint64_t)(rsm->r_flight_at_send) * (uint64_t)USECS_IN_SECOND) / send_span;
 		if (send_rate < rate) {
 			bbr_log_type_bbrupd(bbr, 6, cts,
 					    delivered,
 					    (uint32_t)send_span,
 					    (rate >> 32),
 					    (uint32_t)rate,
 					    rsm->r_first_sent_time, 0, (send_rate >> 32),
 					    (uint32_t)send_rate);
 			rate = send_rate;
 		}
 	}
 	/* Use the google algorithm for b/w measurements */
 	bbr->r_ctl.rc_bbr_cur_del_rate = rate;
 	if ((rsm->r_app_limited != 0) &&
 	    !(rate > get_filter_value(&bbr->r_ctl.rc_delrate))) {
 		/* App-limited and no better than what we have: skip. */
 		return;
 	}
 	tcp_bbr_commit_bw(bbr, cts);
 	bbr_log_type_bbrupd(bbr, 10, cts, (uint32_t)elapsed, delivered,
 			    0, 0, 0, 0,  bbr->r_ctl.rc_del_time,  rsm->r_del_time);
 }
 
 /*
  * Google-mode delivery-rate measurement for an acked sendmap entry.
  *
  * Computes bytes delivered since rsm was sent, scaled to bytes per second
  * over the delivery-time span, caps that by the rate we were sending at,
  * stores the result in rc_bbr_cur_del_rate and commits it to the filter
  * unless the sample is gated off (no_apply) or the entry was app-limited
  * and the rate does not exceed the current filter value.
  *
  * Nothing happens while in persist.  The rtt argument is not used here.
  */
 static void
 bbr_google_measurement(struct tcp_bbr *bbr, struct bbr_sendmap *rsm, uint32_t rtt, uint32_t cts)
 {
 	if (bbr->rc_in_persist == 0) {
 		/* We log only when not in persist */
 		/* Translate to a Bytes Per Second */
 		uint64_t tim, bw;
 		uint32_t delivered;
 		int no_apply = 0;
 
 		/* Delivery-time span; falls back to 1 when time did not advance. */
 		if (TSTMP_GT(bbr->r_ctl.rc_del_time, rsm->r_del_time))
 			tim = (uint64_t)(bbr->r_ctl.rc_del_time - rsm->r_del_time);
 		else
 			tim = 1;
 		/*
 		 * Now that we have processed the tim (skipping the sample
 		 * or possibly updating the time, go ahead and
 		 * calculate the cdr.
 		 */
 		delivered = (bbr->r_ctl.rc_delivered - rsm->r_delivered);
 		bw = (uint64_t)delivered;
 		bw *= (uint64_t)USECS_IN_SECOND;
 		bw /= tim;
 		/*
 		 * A span shorter than the lowest rtt we have seen is
 		 * logged (code 99) and provisionally marked as not to be
 		 * applied.
 		 */
 		if (tim < bbr->r_ctl.rc_lowest_rtt) {
 			bbr_log_type_bbrupd(bbr, 99, cts, (uint32_t)tim, delivered,
 					    tim, bbr->r_ctl.rc_lowest_rtt, 0, 0, 0, 0);
 
 			no_apply = 1;
 		}
 		/*
 		 * If we are using this b/w shove it in now so we
 		 * can see in the trace viewer if it gets over-ridden.
 		 */
 		bbr->r_ctl.rc_bbr_cur_del_rate = bw;
 		/* Gate by the sending rate */
 		if (rsm->r_first_sent_time &&
 		    TSTMP_GT(rsm->r_tim_lastsent[(rsm->r_rtr_cnt -1)],rsm->r_first_sent_time)) {
 			uint64_t sbw, sti;
 			/*
 			 * We use what was in flight at the time of our
 			 * send  and the size of this send to figure
 			 * out what we have been sending at (amount).
 			 * For the time we take from the time of
 			 * the send of the first send outstanding
 			 * until this send plus this sends pacing
 			 * time. This gives us a good calculation
 			 * as to the rate we have been sending at.
 			 */
 
 			sbw = (uint64_t)(rsm->r_flight_at_send);
 			sbw *= (uint64_t)USECS_IN_SECOND;
 			/*
 			 * The timestamp difference is taken first and only
 			 * then widened and extended by the pacing delay.
 			 */
 			sti = rsm->r_tim_lastsent[(rsm->r_rtr_cnt -1)] - rsm->r_first_sent_time;
 			sti += rsm->r_pacing_delay;
 			sbw /= sti;
 			/* We can not have delivered faster than we sent. */
 			if (sbw < bw) {
 				bbr_log_type_bbrupd(bbr, 6, cts,
 						    delivered,
 						    (uint32_t)sti,
 						    (bw >> 32),
 						    (uint32_t)bw,
 						    rsm->r_first_sent_time, 0, (sbw >> 32),
 						    (uint32_t)sbw);
 				bw = sbw;
 			}
 			/*
 			 * NOTE(review): the else arm below clears no_apply
 			 * even when it was set by the tim < rc_lowest_rtt
 			 * test above, so whenever this send-rate gate is
 			 * entered the earlier decision is discarded.
 			 * Confirm that this override is intended.
 			 */
 			if ((sti > tim) &&
 			    (sti < bbr->r_ctl.rc_lowest_rtt)) {
 				bbr_log_type_bbrupd(bbr, 99, cts, (uint32_t)tim, delivered,
 						    (uint32_t)sti, bbr->r_ctl.rc_lowest_rtt, 0, 0, 0, 0);
 				no_apply = 1;
 			} else
 				no_apply = 0;
 		}
 		/* Store again: bw may have been lowered by the gate above. */
 		bbr->r_ctl.rc_bbr_cur_del_rate = bw;
 		if ((no_apply == 0) &&
 		    ((rsm->r_app_limited == 0) ||
 		     (bw > get_filter_value(&bbr->r_ctl.rc_delrate)))) {
 			tcp_bbr_commit_bw(bbr, cts);
 			bbr_log_type_bbrupd(bbr, 10, cts, (uint32_t)tim, delivered,
 					    0, 0, 0, 0, bbr->r_ctl.rc_del_time,  rsm->r_del_time);
 		}
 	}
 }
 
 /*
  * Account for a newly acked sendmap entry and, when the RTT sample can be
  * trusted, feed it to the RTT and bandwidth machinery.
  *
  * bbr           - BBR control block.
  * rsm           - the acked sendmap entry; must not be NULL, it is
  *                 dereferenced unconditionally.
  * rtt           - RTT sample in usec; 0 means "from a retransmit, do not
  *                 use" and only the delivery accounting is done.
  * cts           - current timestamp.
  * tsin          - echoed peer timestamp, stored with the sample.
  * uts           - converted timestamp, used for logging only.
  * match         - how the sample was attributed (BBR_RTT_BY_*).
  * rsm_send_time - send time of the transmission the sample refers to.
  * ack_type      - BBR_CUM_ACKED for a cumulative ack, anything else
  *                 otherwise.
  * to            - TCP options of the ack; not used here.
  *
  * Samples whose match is neither BBR_RTT_BY_EXACTMATCH nor
  * BBR_RTT_BY_TIMESTAMP are ignored outside google mode, and in google
  * mode too when bbr_no_retran is set.
  */
 static void
 bbr_update_bbr_info(struct tcp_bbr *bbr, struct bbr_sendmap *rsm, uint32_t rtt, uint32_t cts, uint32_t tsin,
     uint32_t uts, int32_t match, uint32_t rsm_send_time, int32_t ack_type, struct tcpopt *to)
 {
 	uint64_t old_rttprop;
 
 	/* Update our delivery time and amount */
 	bbr->r_ctl.rc_delivered += (rsm->r_end - rsm->r_start);
 	bbr->r_ctl.rc_del_time = cts;
 	if (rtt == 0) {
 		/*
 		 * 0 means its a retransmit, for now we don't use these for
 		 * the rest of BBR.
 		 */
 		return;
 	}
 	if ((bbr->rc_use_google == 0) &&
 	    (match != BBR_RTT_BY_EXACTMATCH) &&
 	    (match != BBR_RTT_BY_TIMESTAMP)){
 		/*
 		 * We get a lot of rtt updates, lets not pay attention to
 		 * any that are not an exact match. That way we don't have
 		 * to worry about timestamps and the whole nonsense of
 		 * unsure if its a retransmission etc (if we ever had the
 		 * timestamp fixed to always have the last thing sent this
 		 * would not be a issue).
 		 */
 		return;
 	}
 	if ((bbr_no_retran && bbr->rc_use_google) &&
 	    (match != BBR_RTT_BY_EXACTMATCH) &&
 	    (match != BBR_RTT_BY_TIMESTAMP)){
 		/*
 		 * We only do measurements in google mode
 		 * with bbr_no_retran on for sure things.
 		 */
 		return;
 	}
 	/* Only update srtt if we know by exact match */
 	tcp_bbr_xmit_timer(bbr, rtt, rsm_send_time, rsm->r_start, tsin);
 	if (ack_type == BBR_CUM_ACKED)
 		bbr->rc_ack_is_cumack = 1;
 	else
 		bbr->rc_ack_is_cumack = 0;
 	old_rttprop = bbr_get_rtt(bbr, BBR_RTT_PROP);
 	/*
 	 * Note the following code differs to the original
 	 * BBR spec. It calls for <= not <. However after a
 	 * long discussion in email with Neal, he acknowledged
 	 * that it should be < than so that we will have flows
 	 * going into probe-rtt (we were seeing cases where that
 	 * did not happen and caused ugly things to occur). We
 	 * have added this agreed upon fix to our code base.
 	 */
 	if (rtt < old_rttprop) {
 		/* Update when we last saw a rtt drop */
 		bbr_log_rtt_shrinks(bbr, cts, 0, rtt, __LINE__, BBR_RTTS_NEWRTT, 0);
 		bbr_set_reduced_rtt(bbr, cts, __LINE__);
 	}
 	/*
 	 * rsm has been dereferenced since the top of this function, so it
 	 * is passed straight through here; a NULL test at this point could
 	 * never take its "NULL" arm.
 	 */
 	bbr_log_type_bbrrttprop(bbr, rtt, rsm->r_end, uts, cts,
 	    match, rsm->r_start, rsm->r_flags);
 	apply_filter_min_small(&bbr->r_ctl.rc_rttprop, rtt, cts);
 	if (old_rttprop != bbr_get_rtt(bbr, BBR_RTT_PROP)) {
 		/*
 		 * The RTT-prop moved, reset the target (may be a
 		 * nop for some states).
 		 */
 		bbr_set_state_target(bbr, __LINE__);
 		if (bbr->rc_bbr_state == BBR_STATE_PROBE_RTT)
 			bbr_log_rtt_shrinks(bbr, cts, 0, 0,
 					    __LINE__, BBR_RTTS_NEW_TARGET, 0);
 		else if (old_rttprop < bbr_get_rtt(bbr, BBR_RTT_PROP))
 			/* It went up */
 			bbr_check_probe_rtt_limits(bbr, cts);
 	}
 	if ((bbr->rc_use_google == 0) &&
 	    (match == BBR_RTT_BY_TIMESTAMP)) {
 		/*
 		 * We don't do b/w update with
 		 * these since they are not really
 		 * reliable.
 		 */
 		return;
 	}
 	if (bbr->r_ctl.r_app_limited_until &&
 	    (bbr->r_ctl.rc_delivered >= bbr->r_ctl.r_app_limited_until)) {
 		/* We are no longer app-limited */
 		bbr->r_ctl.r_app_limited_until = 0;
 	}
 	/* Hand the sample to the measurement routine for the active mode. */
 	if (bbr->rc_use_google) {
 		bbr_google_measurement(bbr, rsm, rtt, cts);
 	} else {
 		bbr_nf_measurement(bbr, rsm, rtt, cts);
 	}
 }
 
 /*
  * Convert a timestamp that the main stack
  * uses (milliseconds) into one that bbr uses
  * (microseconds). Return that converted timestamp.
  *
  * The value is split into a quotient and a remainder by MS_IN_USEC; the
  * quotient is scaled by USECS_IN_SECOND and the remainder by MS_IN_USEC.
  * All arithmetic is 32-bit and wraps.
  */
 static uint32_t
 bbr_ts_convert(uint32_t cts)
 {
 	uint32_t whole, rem;
 
 	whole = cts / MS_IN_USEC;
 	rem = cts % MS_IN_USEC;
 	return ((whole * USECS_IN_SECOND) + (rem * MS_IN_USEC));
 }
 
 /*
  * Derive an RTT sample for an acked sendmap entry and pass it, together
  * with how it was attributed, to bbr_update_bbr_info().
  *
  * Return 1 when the ack was attributed to the only transmission, to the
  * echoed timestamp (google mode with bbr_can_use_ts_for_rtt), to the
  * last transmission by timestamp matching, or when the time since the
  * last transmission is at least rc_lowest_rtt.
  *
  * Return 0 when the entry was already processed or may not produce an
  * RTT, when the ack was attributed to an earlier transmission, or when
  * we could not tell which transmission was acked.
  */
 static int
 bbr_update_rtt(struct tcpcb *tp, struct tcp_bbr *bbr,
     struct bbr_sendmap *rsm, struct tcpopt *to, uint32_t cts, int32_t ack_type, uint32_t th_ack)
 {
 	int32_t i;
 	uint32_t t, uts = 0;
 
 	if ((rsm->r_flags & BBR_ACKED) ||
 	    (rsm->r_flags & BBR_WAS_RENEGED) ||
 	    (rsm->r_flags & BBR_RXT_CLEARED)) {
 		/* Already done */
 		return (0);
 	}
 	if (rsm->r_rtt_not_allowed) {
 		/* Not allowed */
 		return (0);
 	}
 	if (rsm->r_rtr_cnt == 1) {
 		/*
 		 * Only one transmit. Hopefully the normal case.
 		 * The sample is clamped to at least 1.
 		 */
 		if (TSTMP_GT(cts, rsm->r_tim_lastsent[0]))
 			t = cts - rsm->r_tim_lastsent[0];
 		else
 			t = 1;
 		if ((int)t <= 0)
 			t = 1;
 		bbr->r_ctl.rc_last_rtt = t;
 		bbr_update_bbr_info(bbr, rsm, t, cts, to->to_tsecr, 0,
 				    BBR_RTT_BY_EXACTMATCH, rsm->r_tim_lastsent[0], ack_type, to);
 		return (1);
 	}
 	/*
 	 * More than one transmission. In google mode, when allowed, a
 	 * cum-ack carrying a timestamp echo gives the RTT directly from
 	 * the echoed value; the result is converted to usecs.
 	 */
 	if ((bbr_can_use_ts_for_rtt == 1) &&
 	    (bbr->rc_use_google == 1) &&
 	    (ack_type == BBR_CUM_ACKED) &&
 	    (to->to_flags & TOF_TS) &&
 	    (to->to_tsecr != 0)) {
 		/*
 		 * NOTE(review): t is unsigned, so "t < 1" only catches a
 		 * difference of exactly zero; an echo ahead of our clock
 		 * wraps to a very large value. The other paths in this
 		 * function test "(int)t <= 0" -- confirm which is meant.
 		 */
 		t = tcp_tv_to_mssectick(&bbr->rc_tv) - to->to_tsecr;
 		if (t < 1)
 			t = 1;
 		t *= MS_IN_USEC;
 		bbr_update_bbr_info(bbr, rsm, t, cts, to->to_tsecr, 0,
 				    BBR_RTT_BY_TIMESTAMP,
 				    rsm->r_tim_lastsent[(rsm->r_rtr_cnt-1)],
 				    ack_type, to);
 		return (1);
 	}
 	/* Converted before TOF_TS is tested; only used when it is set or for logging. */
 	uts = bbr_ts_convert(to->to_tsecr);
 	if ((to->to_flags & TOF_TS) &&
 	    (to->to_tsecr != 0) &&
 	    (ack_type == BBR_CUM_ACKED) &&
 	    ((rsm->r_flags & BBR_OVERMAX) == 0)) {
 		/*
 		 * Now which timestamp does it match? In this block the ACK
 		 * may be coming from a previous transmission.
 		 */
 		uint32_t fudge;
 
 		fudge = BBR_TIMER_FUDGE;
 		for (i = 0; i < rsm->r_rtr_cnt; i++) {
 			/* Match when uts is within +/- fudge of this send time. */
 			if ((SEQ_GEQ(uts, (rsm->r_tim_lastsent[i] - fudge))) &&
 			    (SEQ_LEQ(uts, (rsm->r_tim_lastsent[i] + fudge)))) {
 				if (TSTMP_GT(cts, rsm->r_tim_lastsent[i]))
 					t = cts - rsm->r_tim_lastsent[i];
 				else
 					t = 1;
 				if ((int)t <= 0)
 					t = 1;
 				bbr->r_ctl.rc_last_rtt = t;
 				bbr_update_bbr_info(bbr, rsm, t, cts, to->to_tsecr, uts, BBR_RTT_BY_TSMATCHING,
 						    rsm->r_tim_lastsent[i], ack_type, to);
 				if ((i + 1) < rsm->r_rtr_cnt) {
 					/* Likely: an earlier transmission was matched */
 					return (0);
 				} else if (rsm->r_flags & BBR_TLP) {
 					bbr->rc_tlp_rtx_out = 0;
 				}
 				return (1);
 			}
 		}
 		/* Fall through if we can't find a matching timestamp */
 	}
 	/*
 	 * Ok its a SACK block that we retransmitted, or a windows
 	 * machine without timestamps. We can tell nothing from the
 	 * time-stamp since its not there or the time the peer last
 	 * received a segment that moved forward its cum-ack point.
 	 *
 	 * Lets look at the last retransmit and see what we can tell
 	 * (with BBR for space we only keep 2 note we have to keep
 	 * at least 2 so the map can not be condensed more).
 	 */
 	i = rsm->r_rtr_cnt - 1;
 	if (TSTMP_GT(cts, rsm->r_tim_lastsent[i]))
 		t = cts - rsm->r_tim_lastsent[i];
 	else
 		goto not_sure;
 	if (t < bbr->r_ctl.rc_lowest_rtt) {
 		/*
 		 * We retransmitted and the ack came back in less
 		 * than the smallest rtt we have observed in the
 		 * windowed rtt. We most likely did an improper
 		 * retransmit as outlined in 4.2 Step 3 point 2 in
 		 * the rack-draft.
 		 *
 		 * Use the prior transmission to update all the
 		 * information as long as there is only one prior
 		 * transmission.
 		 */
 		if ((rsm->r_flags & BBR_OVERMAX) == 0) {
 #ifdef BBR_INVARIANTS
 			if (rsm->r_rtr_cnt == 1)
 				panic("rsm:%p bbr:%p rsm has overmax and only 1 retranmit flags:%x?", rsm, bbr, rsm->r_flags);
 #endif
 			/* Measure against the transmission before the last one. */
 			i = rsm->r_rtr_cnt - 2;
 			if (TSTMP_GT(cts, rsm->r_tim_lastsent[i]))
 				t = cts - rsm->r_tim_lastsent[i];
 			else
 				t = 1;
 			bbr_update_bbr_info(bbr, rsm, t, cts, to->to_tsecr, uts, BBR_RTT_BY_EARLIER_RET,
 					    rsm->r_tim_lastsent[i], ack_type, to);
 			return (0);
 		} else {
 			/*
 			 * Too many prior transmissions, just
 			 * updated BBR delivered. The not_sure label is
 			 * also the target of the goto above, taken when
 			 * cts is not later than the last send time. An
 			 * rtt of 0 makes bbr_update_bbr_info() do the
 			 * delivery accounting only.
 			 */
 not_sure:
 			bbr_update_bbr_info(bbr, rsm, 0, cts, to->to_tsecr, uts,
 					    BBR_RTT_BY_SOME_RETRAN, 0, ack_type, to);
 		}
 	} else {
 		/*
 		 * We retransmitted it and the retransmit did the
 		 * job. With BBR_OVERMAX set the sample itself is not
 		 * used (rtt is passed as 0).
 		 */
 		if (rsm->r_flags & BBR_TLP)
 			bbr->rc_tlp_rtx_out = 0;
 		if ((rsm->r_flags & BBR_OVERMAX) == 0)
 			bbr_update_bbr_info(bbr, rsm, t, cts, to->to_tsecr, uts,
 					    BBR_RTT_BY_THIS_RETRAN, 0, ack_type, to);
 		else
 			bbr_update_bbr_info(bbr, rsm, 0, cts, to->to_tsecr, uts,
 					    BBR_RTT_BY_SOME_RETRAN, 0, ack_type, to);
 		return (1);
 	}
 	return (0);
 }
 
 /*
  * Mark the SACK_PASSED flag on all entries prior to rsm send wise.
  *
  * Walks rc_tmap backwards starting at rsm.  rsm itself and entries that
  * are already acked are skipped, and the walk stops at the first entry
  * that already carries BBR_SACK_PASSED (everything before it was marked
  * on an earlier pass).  Each newly marked entry that is not yet marked
  * lost and that bbr_is_lost() reports as lost is added to the lost
  * counters and flagged BBR_MARKED_LOST.  BBR_WAS_SACKPASS is cleared on
  * every entry that gets marked.  The tp argument is not used.
  */
 static void
 bbr_log_sack_passed(struct tcpcb *tp,
     struct tcp_bbr *bbr, struct bbr_sendmap *rsm)
 {
 	struct bbr_sendmap *prev;
 
 	prev = rsm;
 	TAILQ_FOREACH_REVERSE_FROM(prev, &bbr->r_ctl.rc_tmap,
 	    bbr_head, r_tnext) {
 		if ((prev == rsm) || (prev->r_flags & BBR_ACKED)) {
 			/* Skip the segment being acked and ack'd segments */
 			continue;
 		}
 		if (prev->r_flags & BBR_SACK_PASSED) {
 			/* Been here before, the rest is already marked */
 			break;
 		}
 		BBR_STAT_INC(bbr_sack_passed);
 		prev->r_flags |= BBR_SACK_PASSED;
 		if ((prev->r_flags & BBR_MARKED_LOST) == 0) {
 			if (bbr_is_lost(bbr, prev, bbr->r_ctl.rc_rcvtime)) {
 				bbr->r_ctl.rc_lost += prev->r_end - prev->r_start;
 				bbr->r_ctl.rc_lost_bytes += prev->r_end - prev->r_start;
 				prev->r_flags |= BBR_MARKED_LOST;
 			}
 		}
 		prev->r_flags &= ~BBR_WAS_SACKPASS;
 	}
 }
 
 /*
  * Apply one SACK block to the send map and return the number of bytes
  * that were newly ack'd by it.
  *
  * tp   - connection; only t_flags (TF_SENTFIN) and snd_max are read here.
  * bbr  - BBR state holding the send map (rc_map) and the transmit-ordered
  *        map (rc_tmap).
  * sack - block to process; start/end are used as given.
  * to   - TCP options, passed through to bbr_update_rtt().
  * prsm - in: entry to begin the search from (NULL means search the whole
  *        map); out: the entry processing finished on, possibly NULL.
  * cts  - current timestamp, handed to the RTT/epoch helpers and stored in
  *        rc_reorder_ts when reordering is detected.
  *
  * Side effects: entries may be split, flagged BBR_ACKED, removed from
  * rc_tmap and merged with BBR_ACKED neighbours; rc_sacked, rc_lost,
  * rc_lost_bytes, rc_lt_lost, rc_reorder_ts and rc_sacklast are updated.
  * When a needed split cannot be allocated the block is passed to
  * sack_filter_reject() and otherwise ignored.
  */
 static uint32_t
 bbr_proc_sack_blk(struct tcpcb *tp, struct tcp_bbr *bbr, struct sackblk *sack,
     struct tcpopt *to, struct bbr_sendmap **prsm, uint32_t cts)
 {
 	/* Number of times the search has been restarted from the map head. */
 	int32_t times = 0;
 	uint32_t start, end, changed = 0;
 	struct bbr_sendmap *rsm, *nrsm;
 	/* Non-zero when the caller supplied a starting hint (stats only). */
 	int32_t used_ref = 1;
 	/* Search direction bookkeeping (stats only). */
 	uint8_t went_back = 0, went_fwd = 0;
 
 	start = sack->start;
 	end = sack->end;
 	rsm = *prsm;
 	if (rsm == NULL)
 		used_ref = 0;
 
 	/* Do we locate the block behind where we last were? */
 	if (rsm && SEQ_LT(start, rsm->r_start)) {
 		went_back = 1;
 		TAILQ_FOREACH_REVERSE_FROM(rsm, &bbr->r_ctl.rc_map, bbr_head, r_next) {
 			if (SEQ_GEQ(start, rsm->r_start) &&
 			    SEQ_LT(start, rsm->r_end)) {
 				goto do_rest_ofb;
 			}
 		}
 		/* Not found going backwards: rsm is NULL, fall into forward scan. */
 	}
 start_at_beginning:
 	went_fwd = 1;
 	/*
 	 * Ok lets locate the block where this guy is fwd from rsm (if its
 	 * set)
 	 */
 	TAILQ_FOREACH_FROM(rsm, &bbr->r_ctl.rc_map, r_next) {
 		if (SEQ_GEQ(start, rsm->r_start) &&
 		    SEQ_LT(start, rsm->r_end)) {
 			break;
 		}
 	}
 do_rest_ofb:
 	if (rsm == NULL) {
 		/*
 		 * This happens when we get duplicate sack blocks with the
 		 * same end. For example SACK 4: 100 SACK 3: 100 The sort
 		 * will not change their location so we would just start at
 		 * the end of the first one and get lost.
 		 */
 		if (tp->t_flags & TF_SENTFIN) {
 			/*
 			 * Check to see if we have not logged the FIN that
 			 * went out.
 			 */
 			nrsm = TAILQ_LAST_FAST(&bbr->r_ctl.rc_map, bbr_sendmap, r_next);
 			if (nrsm && (nrsm->r_end + 1) == tp->snd_max) {
 				/*
 				 * Ok we did not get the FIN logged.
 				 * Extend the last entry by one sequence
 				 * number and continue with it.
 				 */
 				nrsm->r_end++;
 				rsm = nrsm;
 				goto do_rest_ofb;
 			}
 		}
 		/* A full scan from the head already failed once: give up. */
 		if (times == 1) {
 #ifdef BBR_INVARIANTS
 			panic("tp:%p bbr:%p sack:%p to:%p prsm:%p",
 			    tp, bbr, sack, to, prsm);
 #else
 			goto out;
 #endif
 		}
 		times++;
 		BBR_STAT_INC(bbr_sack_proc_restart);
 		rsm = NULL;
 		goto start_at_beginning;
 	}
 	/* Ok we have an ACK for some piece of rsm */
 	if (rsm->r_start != start) {
 		/*
 		 * Need to split this in two pieces the before and after.
 		 */
 		if (bbr_sack_mergable(rsm, start, end))
 			nrsm = bbr_alloc_full_limit(bbr);
 		else
 			nrsm = bbr_alloc_limit(bbr, BBR_LIMIT_TYPE_SPLIT);
 		if (nrsm == NULL) {
 			/* We could not allocate ignore the sack */
 			struct sackblk blk;
 
 			blk.start = start;
 			blk.end = end;
 			sack_filter_reject(&bbr->r_ctl.bbr_sf, &blk);
 			goto out;
 		}
 		bbr_clone_rsm(bbr, nrsm, rsm, start);
 		TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_map, rsm, nrsm, r_next);
 		if (rsm->r_in_tmap) {
 			TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, rsm, nrsm, r_tnext);
 			nrsm->r_in_tmap = 1;
 		}
 		/* The front piece no longer reaches the end of the original. */
 		rsm->r_flags &= (~BBR_HAS_FIN);
 		/* Continue with the piece that begins at 'start'. */
 		rsm = nrsm;
 	}
 	if (SEQ_GEQ(end, rsm->r_end)) {
 		/*
 		 * The end of this block is either beyond this guy or right
 		 * at this guy.
 		 */
 		if ((rsm->r_flags & BBR_ACKED) == 0) {
 			bbr_update_rtt(tp, bbr, rsm, to, cts, BBR_SACKED, 0);
 			changed += (rsm->r_end - rsm->r_start);
 			bbr->r_ctl.rc_sacked += (rsm->r_end - rsm->r_start);
 			bbr_log_sack_passed(tp, bbr, rsm);
 			if (rsm->r_flags & BBR_MARKED_LOST) {
 				bbr->r_ctl.rc_lost_bytes -= rsm->r_end - rsm->r_start;
 			}
 			/* Is Reordering occurring? */
 			if (rsm->r_flags & BBR_SACK_PASSED) {
 				BBR_STAT_INC(bbr_reorder_seen);
 				bbr->r_ctl.rc_reorder_ts = cts;
 				if (rsm->r_flags & BBR_MARKED_LOST) {
 					bbr->r_ctl.rc_lost -= rsm->r_end - rsm->r_start;
 					if (SEQ_GT(bbr->r_ctl.rc_lt_lost, bbr->r_ctl.rc_lost))
 						/* LT sampling also needs adjustment */
 						bbr->r_ctl.rc_lt_lost = bbr->r_ctl.rc_lost;
 				}
 			}
 			rsm->r_flags |= BBR_ACKED;
 			rsm->r_flags &= ~(BBR_TLP|BBR_WAS_RENEGED|BBR_RXT_CLEARED|BBR_MARKED_LOST);
 			if (rsm->r_in_tmap) {
 				TAILQ_REMOVE(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 				rsm->r_in_tmap = 0;
 			}
 		}
 		bbr_isit_a_pkt_epoch(bbr, cts, rsm, __LINE__, BBR_SACKED);
 		if (end == rsm->r_end) {
 			/* This block only - done */
 			goto out;
 		}
 		/* There is more not covered by this rsm move on */
 		start = rsm->r_end;
 		nrsm = TAILQ_NEXT(rsm, r_next);
 		rsm = nrsm;
 		/* Progress was made, so allow one more restart if needed. */
 		times = 0;
 		goto do_rest_ofb;
 	}
 	if (rsm->r_flags & BBR_ACKED) {
 		/* Been here done that */
 		goto out;
 	}
 	/* Ok we need to split off this one at the tail */
 	if (bbr_sack_mergable(rsm, start, end))
 		nrsm = bbr_alloc_full_limit(bbr);
 	else
 		nrsm = bbr_alloc_limit(bbr, BBR_LIMIT_TYPE_SPLIT);
 	if (nrsm == NULL) {
 		/* failed XXXrrs what can we do but lose the sack info? */
 		struct sackblk blk;
 
 		blk.start = start;
 		blk.end = end;
 		sack_filter_reject(&bbr->r_ctl.bbr_sf, &blk);
 		goto out;
 	}
 	/* Clone it */
 	bbr_clone_rsm(bbr, nrsm, rsm, end);
 	/* The sack block does not cover this guy fully */
 	rsm->r_flags &= (~BBR_HAS_FIN);
 	TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_map, rsm, nrsm, r_next);
 	if (rsm->r_in_tmap) {
 		TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, rsm, nrsm, r_tnext);
 		nrsm->r_in_tmap = 1;
 	}
 	/* The un-sacked tail starts with a fresh dup-ack count. */
 	nrsm->r_dupack = 0;
 	bbr_update_rtt(tp, bbr, rsm, to, cts, BBR_SACKED, 0);
 	bbr_isit_a_pkt_epoch(bbr, cts, rsm, __LINE__, BBR_SACKED);
 	changed += (rsm->r_end - rsm->r_start);
 	bbr->r_ctl.rc_sacked += (rsm->r_end - rsm->r_start);
 	bbr_log_sack_passed(tp, bbr, rsm);
 	/* Undo the lost-byte accounting for the piece that is now sacked. */
 	if (rsm->r_flags & BBR_MARKED_LOST) {
 		bbr->r_ctl.rc_lost_bytes -= rsm->r_end - rsm->r_start;
 	}
 	/* Is Reordering occurring? */
 	if (rsm->r_flags & BBR_SACK_PASSED) {
 		BBR_STAT_INC(bbr_reorder_seen);
 		bbr->r_ctl.rc_reorder_ts = cts;
 		if (rsm->r_flags & BBR_MARKED_LOST) {
 			bbr->r_ctl.rc_lost -= rsm->r_end - rsm->r_start;
 			if (SEQ_GT(bbr->r_ctl.rc_lt_lost, bbr->r_ctl.rc_lost))
 				/* LT sampling also needs adjustment */
 				bbr->r_ctl.rc_lt_lost = bbr->r_ctl.rc_lost;
 		}
 	}
 	rsm->r_flags &= ~(BBR_TLP|BBR_WAS_RENEGED|BBR_RXT_CLEARED|BBR_MARKED_LOST);
 	rsm->r_flags |= BBR_ACKED;
 	if (rsm->r_in_tmap) {
 		TAILQ_REMOVE(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 		rsm->r_in_tmap = 0;
 	}
 out:
 	if (rsm && (rsm->r_flags & BBR_ACKED)) {
 		/*
 		 * Now can we merge this newly acked
 		 * block with either the previous or
 		 * next block?
 		 */
 		nrsm = TAILQ_NEXT(rsm, r_next);
 		if (nrsm &&
 		    (nrsm->r_flags & BBR_ACKED)) {
 			/* yep this and next can be merged */
 			rsm = bbr_merge_rsm(bbr, rsm, nrsm);
 		}
 		/* Now what about the previous? */
 		nrsm = TAILQ_PREV(rsm, bbr_head, r_next);
 		if (nrsm &&
 		    (nrsm->r_flags & BBR_ACKED)) {
 			/* yep the previous and this can be merged */
 			rsm = bbr_merge_rsm(bbr, nrsm, rsm);
 		}
 	}
 	/* Statistics: was a starting hint used, and which way did we search? */
 	if (used_ref == 0) {
 		BBR_STAT_INC(bbr_sack_proc_all);
 	} else {
 		BBR_STAT_INC(bbr_sack_proc_short);
 	}
 	if (went_fwd && went_back) {
 		BBR_STAT_INC(bbr_sack_search_both);
 	} else if (went_fwd) {
 		BBR_STAT_INC(bbr_sack_search_fwd);
 	} else if (went_back) {
 		BBR_STAT_INC(bbr_sack_search_back);
 	}
 	/* Save off where the next seq is */
 	if (rsm)
 		bbr->r_ctl.rc_sacklast = TAILQ_NEXT(rsm, r_next);
 	else
 		bbr->r_ctl.rc_sacklast = NULL;
 	/* Hand the finishing position back as the next call's hint. */
 	*prsm = rsm;
 	return (changed);
 }
 
 /*
  * Undo the SACK markings on the run of BBR_ACKED entries that starts at
  * rsm, because the peer has gone back on data it previously sacked.
  *
  * For every entry in the run: rc_sacked (and, if it was marked lost, the
  * lost counters) are reduced by its length, the ACKED / SACK_PASSED /
  * WAS_SACKPASS / MARKED_LOST flags are cleared, BBR_WAS_RENEGED and
  * BBR_RXT_CLEARED are set, and the entry is re-inserted at the front of
  * rc_tmap in map order.  Finally the sack filter is cleared up to th_ack.
  */
 static void inline
 bbr_peer_reneges(struct tcp_bbr *bbr, struct bbr_sendmap *rsm, tcp_seq th_ack)
 {
 	struct bbr_sendmap *last_put = NULL;
 	uint32_t oflags;
 
 	BBR_STAT_INC(bbr_reneges_seen);
 	for (; (rsm != NULL) && (rsm->r_flags & BBR_ACKED);
 	    rsm = TAILQ_NEXT(rsm, r_next)) {
 		/* It is no longer sacked; take it out of the sacked total. */
 		bbr->r_ctl.rc_sacked -= (rsm->r_end - rsm->r_start);
 #ifdef BBR_INVARIANTS
 		if (rsm->r_in_tmap) {
 			panic("bbr:%p rsm:%p flags:0x%x in tmap?",
 			    bbr, rsm, rsm->r_flags);
 		}
 #endif
 		/* Remember the flags as they were, for the log record below. */
 		oflags = rsm->r_flags;
 		if (oflags & BBR_MARKED_LOST) {
 			bbr->r_ctl.rc_lost -= rsm->r_end - rsm->r_start;
 			bbr->r_ctl.rc_lost_bytes -= rsm->r_end - rsm->r_start;
 			/* Keep the LT sample from exceeding the new total. */
 			if (SEQ_GT(bbr->r_ctl.rc_lt_lost, bbr->r_ctl.rc_lost))
 				bbr->r_ctl.rc_lt_lost = bbr->r_ctl.rc_lost;
 		}
 		rsm->r_flags &= ~(BBR_ACKED | BBR_SACK_PASSED | BBR_WAS_SACKPASS | BBR_MARKED_LOST);
 		rsm->r_flags |= BBR_WAS_RENEGED;
 		rsm->r_flags |= BBR_RXT_CLEARED;
 		bbr_log_type_rsmclear(bbr, bbr->r_ctl.rc_rcvtime, rsm, oflags, __LINE__);
 
 		/*
 		 * Rebuild it into the tmap: the first entry goes to the head,
 		 * each later one directly behind the one placed before it.
 		 */
 		if (last_put != NULL)
 			TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, last_put, rsm, r_tnext);
 		else
 			TAILQ_INSERT_HEAD(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 		last_put = rsm;
 		last_put->r_in_tmap = 1;
 		/*
 		 * XXXrrs Delivered? Should we do anything here?
 		 *
 		 * A retransmit timeout does not adjust it either, so for
 		 * now nothing is done.
 		 */
 	}
 	/*
 	 * Possibly clear the sack filter so that sacks covering this area
 	 * are recognized again.
 	 */
 	sack_filter_clear(&bbr->r_ctl.bbr_sf, th_ack);
 }
 
 /*
  * Account for the SYN at the head of the send map.
  *
  * If the first map entry carries BBR_HAS_SYN and spans at most one
  * sequence number it is removed from rc_map (and rc_tmap), an RTT sample
  * is taken when 'to' is non-NULL, and the entry is freed.  If it spans
  * more, only the SYN is stripped: the flag is cleared and r_start is
  * advanced by one.  Nothing happens when the head entry has no SYN.
  */
 static void
 bbr_log_syn(struct tcpcb *tp, struct tcpopt *to)
 {
 	struct tcp_bbr *bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	uint32_t cts = bbr->r_ctl.rc_rcvtime;
 	struct bbr_sendmap *head = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 
 	if ((head == NULL) || ((head->r_flags & BBR_HAS_SYN) == 0))
 		return;
 
 	if ((head->r_end - head->r_start) > 1) {
 		/* There is more (Fast open)? strip out SYN. */
 		head->r_flags &= ~BBR_HAS_SYN;
 		head->r_start++;
 		return;
 	}
 
 	/* Log out the SYN completely */
 	bbr->r_ctl.rc_holes_rxt -= head->r_rtr_bytes;
 	head->r_rtr_bytes = 0;
 	TAILQ_REMOVE(&bbr->r_ctl.rc_map, head, r_next);
 	if (head->r_in_tmap) {
 		TAILQ_REMOVE(&bbr->r_ctl.rc_tmap, head, r_tnext);
 		head->r_in_tmap = 0;
 	}
 	/* Move the rc_next marker off the entry that is about to be freed. */
 	if (bbr->r_ctl.rc_next == head)
 		bbr->r_ctl.rc_next = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 	if (to != NULL)
 		bbr_update_rtt(tp, bbr, head, to, cts, BBR_CUM_ACKED, 0);
 	bbr_free(bbr, head);
 }
 
 /*
  * Process the cumulative ACK and any SACK blocks of an incoming segment
  * against the send map.
  *
  * tp         - connection being processed (inpcb write lock is asserted).
  * to         - parsed TCP options; to_flags, to_tsecr, to_nsacks and
  *              to_sacks are read.
  * th         - TCP header; segments with TH_RST are ignored.
  * prev_acked - out: number of bytes covered by this cumulative ACK that
  *              had already been marked BBR_ACKED via SACK.
  *
  * Returns the number of bytes that were newly acknowledged by SACK
  * blocks.
  *
  * Side effects: fully cum-acked map entries are removed and freed, a
  * partially acked head entry is trimmed, reneging by the peer is
  * detected and undone, D-SACK blocks are recorded, and rc_resend may be
  * set when recovery should (re)transmit something.
  */
 
 static uint32_t
 bbr_log_ack(struct tcpcb *tp, struct tcpopt *to, struct tcphdr *th,
     uint32_t *prev_acked)
 {
 	uint32_t changed, last_seq, entered_recovery = 0;
 	struct tcp_bbr *bbr;
 	struct bbr_sendmap *rsm;
 	struct sackblk sack, sack_blocks[TCP_MAX_SACK + 1];
 	uint32_t th_ack;
 	int32_t i, j, k, new_sb, num_sack_blks = 0;
 	uint32_t cts, acked, ack_point, sack_changed = 0;
 	uint32_t p_maxseg, maxseg, p_acked = 0;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	if (tcp_get_flags(th) & TH_RST) {
 		/* We don't log resets */
 		return (0);
 	}
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	cts = bbr->r_ctl.rc_rcvtime;
 
 	rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 	changed = 0;
 	maxseg = tp->t_maxseg - bbr->rc_last_options;
 	p_maxseg = min(bbr->r_ctl.rc_pace_max_segs, maxseg);
 	th_ack = th->th_ack;
 	if (SEQ_GT(th_ack, tp->snd_una)) {
 		acked = th_ack - tp->snd_una;
 		bbr_log_progress_event(bbr, tp, ticks, PROGRESS_UPDATE, __LINE__);
 		bbr->rc_tp->t_acktime = ticks;
 	} else
 		acked = 0;
 	if (SEQ_LEQ(th_ack, tp->snd_una)) {
 		/* Only sent here for sack processing */
 		goto proc_sack;
 	}
 	if (rsm && SEQ_GT(th_ack, rsm->r_start)) {
 		changed = th_ack - rsm->r_start;
 	} else if ((rsm == NULL) && ((th_ack - 1) == tp->iss)) {
 		/*
 		 * For the SYN incoming case we will not have called
 		 * tcp_output for the sending of the SYN, so there will be
 		 * no map. All other cases should probably be a panic.
 		 */
 		if ((to->to_flags & TOF_TS) && (to->to_tsecr != 0)) {
 			/*
 			 * We have a timestamp that can be used to generate
 			 * an initial RTT.
 			 */
 			uint32_t ts, now, rtt;
 
 			ts = bbr_ts_convert(to->to_tsecr);
 			now = bbr_ts_convert(tcp_tv_to_mssectick(&bbr->rc_tv));
 			rtt = now - ts;
 			/* Never feed a zero RTT into the filter. */
 			if (rtt < 1)
 				rtt = 1;
 			bbr_log_type_bbrrttprop(bbr, rtt,
 						tp->iss, 0, cts,
 						BBR_RTT_BY_TIMESTAMP, tp->iss, 0);
 			apply_filter_min_small(&bbr->r_ctl.rc_rttprop, rtt, cts);
 			changed = 1;
 			bbr->r_wanted_output = 1;
 			goto out;
 		}
 		goto proc_sack;
 	} else if (rsm == NULL) {
 		goto out;
 	}
 	if (changed) {
 		/*
 		 * The ACK point is advancing to th_ack, we must drop off
 		 * the packets in the rack log and calculate any eligible
 		 * RTT's.
 		 */
 		bbr->r_wanted_output = 1;
 more:
 		/* Re-entered once per fully consumed map entry. */
 		if (rsm == NULL) {
 			if (tp->t_flags & TF_SENTFIN) {
 				/* if we sent a FIN we will not have a map */
 				goto proc_sack;
 			}
 #ifdef BBR_INVARIANTS
 			panic("No rack map tp:%p for th:%p state:%d bbr:%p snd_una:%u snd_max:%u chg:%d\n",
 			    tp,
 			    th, tp->t_state, bbr,
 			    tp->snd_una, tp->snd_max, changed);
 #endif
 			goto proc_sack;
 		}
 	}
 	if (SEQ_LT(th_ack, rsm->r_start)) {
 		/* Huh map is missing this */
 #ifdef BBR_INVARIANTS
 		printf("Rack map starts at r_start:%u for th_ack:%u huh? ts:%d rs:%d bbr:%p\n",
 		    rsm->r_start,
 		    th_ack, tp->t_state,
 		    bbr->r_state, bbr);
 		panic("th-ack is bad bbr:%p tp:%p", bbr, tp);
 #endif
 		goto proc_sack;
 	} else if (th_ack == rsm->r_start) {
 		/* None here to ack */
 		goto proc_sack;
 	}
 	/*
 	 * Clear the dup ack counter, it will
 	 * either be freed or if there is some
 	 * remaining we need to start it at zero.
 	 */
 	rsm->r_dupack = 0;
 	/* Now do we consume the whole thing? */
 	if (SEQ_GEQ(th_ack, rsm->r_end)) {
 		/* Its all consumed. */
 		uint32_t left;
 
 		if (rsm->r_flags & BBR_ACKED) {
 			/*
 			 * It was acked on the scoreboard -- remove it from
 			 * total
 			 */
 			p_acked += (rsm->r_end - rsm->r_start);
 			bbr->r_ctl.rc_sacked -= (rsm->r_end - rsm->r_start);
 			if (bbr->r_ctl.rc_sacked == 0)
 				bbr->r_ctl.rc_sacklast = NULL;
 		} else {
 			bbr_update_rtt(tp, bbr, rsm, to, cts, BBR_CUM_ACKED, th_ack);
 			if (rsm->r_flags & BBR_MARKED_LOST) {
 				bbr->r_ctl.rc_lost_bytes -= rsm->r_end - rsm->r_start;
 			}
 			if (rsm->r_flags & BBR_SACK_PASSED) {
 				/*
 				 * There are acked segments ACKED on the
 				 * scoreboard further up. We are seeing
 				 * reordering.
 				 */
 				BBR_STAT_INC(bbr_reorder_seen);
 				bbr->r_ctl.rc_reorder_ts = cts;
 				if (rsm->r_flags & BBR_MARKED_LOST) {
 					bbr->r_ctl.rc_lost -= rsm->r_end - rsm->r_start;
 					if (SEQ_GT(bbr->r_ctl.rc_lt_lost, bbr->r_ctl.rc_lost))
 						/* LT sampling also needs adjustment */
 						bbr->r_ctl.rc_lt_lost = bbr->r_ctl.rc_lost;
 				}
 			}
 			rsm->r_flags &= ~BBR_MARKED_LOST;
 		}
 		bbr->r_ctl.rc_holes_rxt -= rsm->r_rtr_bytes;
 		rsm->r_rtr_bytes = 0;
 		TAILQ_REMOVE(&bbr->r_ctl.rc_map, rsm, r_next);
 		if (rsm->r_in_tmap) {
 			TAILQ_REMOVE(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 			rsm->r_in_tmap = 0;
 		}
 		if (bbr->r_ctl.rc_next == rsm) {
 			/* scoot along the marker */
 			bbr->r_ctl.rc_next = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 		}
 		bbr_isit_a_pkt_epoch(bbr, cts, rsm, __LINE__, BBR_CUM_ACKED);
 		/* How much of the ACK reaches past this entry? */
 		left = th_ack - rsm->r_end;
 		/* Free back to zone */
 		bbr_free(bbr, rsm);
 		if (left) {
 			rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 			goto more;
 		}
 		goto proc_sack;
 	}
 	if (rsm->r_flags & BBR_ACKED) {
 		/*
 		 * It was acked on the scoreboard -- remove it from total
 		 * for the part being cum-acked.  Only that part is reported
 		 * as previously acked too, so that p_acked stays in step
 		 * with the rc_sacked adjustment; the remainder stays in
 		 * the map.
 		 */
 		p_acked += (th_ack - rsm->r_start);
 		bbr->r_ctl.rc_sacked -= (th_ack - rsm->r_start);
 		if (bbr->r_ctl.rc_sacked == 0)
 			bbr->r_ctl.rc_sacklast = NULL;
 	} else {
 		/*
 		 * It was acked up to th_ack point for the first time.
 		 * Use a trimmed local copy so the RTT update only sees
 		 * the acknowledged part.
 		 */
 		struct bbr_sendmap lrsm;
 
 		memcpy(&lrsm, rsm, sizeof(struct bbr_sendmap));
 		lrsm.r_end = th_ack;
 		bbr_update_rtt(tp, bbr, &lrsm, to, cts, BBR_CUM_ACKED, th_ack);
 	}
 	if ((rsm->r_flags & BBR_MARKED_LOST) &&
 	    ((rsm->r_flags & BBR_ACKED) == 0)) {
 		/*
 		 * It was marked lost and partly ack'd now
 		 * for the first time. We lower the rc_lost_bytes
 		 * and still leave it MARKED.
 		 */
 		bbr->r_ctl.rc_lost_bytes -= th_ack - rsm->r_start;
 	}
 	bbr_isit_a_pkt_epoch(bbr, cts, rsm, __LINE__, BBR_CUM_ACKED);
 	bbr->r_ctl.rc_holes_rxt -= rsm->r_rtr_bytes;
 	rsm->r_rtr_bytes = 0;
 	/* Trim the acknowledged front off the entry. */
 	rsm->r_start = th_ack;
 proc_sack:
 	/* Check for reneging */
 	rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 	if (rsm && (rsm->r_flags & BBR_ACKED) && (th_ack == rsm->r_start)) {
 		/*
 		 * The peer has moved snd_una up to the edge of this send,
 		 * i.e. one that it had previously acked. The only way that
 		 * can be true is if the peer threw away data (space issues)
 		 * that it had previously sacked (else it would have given
 		 * us snd_una up to rsm->r_end). We need to undo the acked
 		 * markings here.
 		 *
 		 * Note we have to look to make sure th_ack is our
 		 * rsm->r_start in case we get an old ack where th_ack is
 		 * behind snd_una.
 		 */
 		bbr_peer_reneges(bbr, rsm, th->th_ack);
 	}
 	if ((to->to_flags & TOF_SACK) == 0) {
 		/* We are done nothing left to log */
 		goto out;
 	}
 	rsm = TAILQ_LAST_FAST(&bbr->r_ctl.rc_map, bbr_sendmap, r_next);
 	if (rsm) {
 		last_seq = rsm->r_end;
 	} else {
 		last_seq = tp->snd_max;
 	}
 	/* Sack block processing */
 	if (SEQ_GT(th_ack, tp->snd_una))
 		ack_point = th_ack;
 	else
 		ack_point = tp->snd_una;
 	for (i = 0; i < to->to_nsacks; i++) {
 		bcopy((to->to_sacks + i * TCPOLEN_SACK),
 		    &sack, sizeof(sack));
 		sack.start = ntohl(sack.start);
 		sack.end = ntohl(sack.end);
 		/* Keep only blocks lying between the ack point and snd_max. */
 		if (SEQ_GT(sack.end, sack.start) &&
 		    SEQ_GT(sack.start, ack_point) &&
 		    SEQ_LT(sack.start, tp->snd_max) &&
 		    SEQ_GT(sack.end, ack_point) &&
 		    SEQ_LEQ(sack.end, tp->snd_max)) {
 			if ((bbr->r_ctl.rc_num_small_maps_alloced > bbr_sack_block_limit) &&
 			    (SEQ_LT(sack.end, last_seq)) &&
 			    ((sack.end - sack.start) < (p_maxseg / 8))) {
 				/*
 				 * Not the last piece and its smaller than
 				 * 1/8th of a p_maxseg. We ignore this.
 				 */
 				BBR_STAT_INC(bbr_runt_sacks);
 				continue;
 			}
 			sack_blocks[num_sack_blks] = sack;
 			num_sack_blks++;
 		} else if (SEQ_LEQ(sack.start, th_ack) &&
 		    SEQ_LEQ(sack.end, th_ack)) {
 			/*
 			 * Its a D-SACK block.
 			 */
 			tcp_record_dsack(tp, sack.start, sack.end, 0);
 		}
 	}
 	if (num_sack_blks == 0)
 		goto out;
 	/*
 	 * Run the blocks through the sack filter, then sort what is left
 	 * so the scoreboard can be updated in just one pass.
 	 */
 	new_sb = sack_filter_blks(&bbr->r_ctl.bbr_sf, sack_blocks,
 				  num_sack_blks, th->th_ack);
 	ctf_log_sack_filter(bbr->rc_tp, new_sb, sack_blocks);
 	BBR_STAT_ADD(bbr_sack_blocks, num_sack_blks);
 	BBR_STAT_ADD(bbr_sack_blocks_skip, (num_sack_blks - new_sb));
 	num_sack_blks = new_sb;
 	if (num_sack_blks < 2) {
 		goto do_sack_work;
 	}
 	/* Sort the sacks by ascending end sequence */
 	for (i = 0; i < num_sack_blks; i++) {
 		for (j = i + 1; j < num_sack_blks; j++) {
 			if (SEQ_GT(sack_blocks[i].end, sack_blocks[j].end)) {
 				sack = sack_blocks[i];
 				sack_blocks[i] = sack_blocks[j];
 				sack_blocks[j] = sack;
 			}
 		}
 	}
 	/*
 	 * Now are any of the sack block ends the same (yes some
 	 * implementations send these)?
 	 */
 again:
 	if (num_sack_blks > 1) {
 		for (i = 0; i < num_sack_blks; i++) {
 			for (j = i + 1; j < num_sack_blks; j++) {
 				if (sack_blocks[i].end == sack_blocks[j].end) {
 					/*
 					 * Ok these two have the same end we
 					 * want the smallest start and then
 					 * throw away the other and start
 					 * again.
 					 */
 					if (SEQ_LT(sack_blocks[j].start, sack_blocks[i].start)) {
 						/*
 						 * The second block covers
 						 * more area use that
 						 */
 						sack_blocks[i].start = sack_blocks[j].start;
 					}
 					/*
 					 * Now collapse out the dup-sack and
 					 * lower the count
 					 */
 					for (k = (j + 1); k < num_sack_blks; k++) {
 						sack_blocks[j].start = sack_blocks[k].start;
 						sack_blocks[j].end = sack_blocks[k].end;
 						j++;
 					}
 					num_sack_blks--;
 					goto again;
 				}
 			}
 		}
 	}
 do_sack_work:
 	/* Start from where the previous SACK processing left off. */
 	rsm = bbr->r_ctl.rc_sacklast;
 	for (i = 0; i < num_sack_blks; i++) {
 		acked = bbr_proc_sack_blk(tp, bbr, &sack_blocks[i], to, &rsm, cts);
 		if (acked) {
 			bbr->r_wanted_output = 1;
 			changed += acked;
 			sack_changed += acked;
 		}
 	}
 out:
 	*prev_acked = p_acked;
 	if ((sack_changed) && (!IN_RECOVERY(tp->t_flags))) {
 		/*
 		 * Ok we have a high probability that we need to go in to
 		 * recovery since we have data sack'd
 		 */
 		rsm = bbr_check_recovery_mode(tp, bbr, cts);
 		if (rsm) {
 			/* Enter recovery */
 			entered_recovery = 1;
 			bbr->r_wanted_output = 1;
 			/*
 			 * When we enter recovery we need to assure we send
 			 * one packet.
 			 */
 			if (bbr->r_ctl.rc_resend == NULL) {
 				bbr->r_ctl.rc_resend = rsm;
 			}
 		}
 	}
 	if (IN_RECOVERY(tp->t_flags) && (entered_recovery == 0)) {
 		/*
 		 * See if we need to rack-retransmit anything if so set it
 		 * up as the thing to resend assuming something else is not
 		 * already in that position.
 		 */
 		if (bbr->r_ctl.rc_resend == NULL) {
 			bbr->r_ctl.rc_resend = bbr_check_recovery_mode(tp, bbr, cts);
 		}
 	}
 	/*
 	 * We return the amount that changed via sack, this is used by the
 	 * ack-received code to augment what was changed between th_ack <->
 	 * snd_una.
 	 */
 	return (sack_changed);
 }
 
 static void
 bbr_strike_dupack(struct tcp_bbr *bbr)
 {
 	struct bbr_sendmap *rsm;
 
 	rsm = TAILQ_FIRST(&bbr->r_ctl.rc_tmap);
 	if (rsm && (rsm->r_dupack < 0xff)) {
 		rsm->r_dupack++;
 		if (rsm->r_dupack >= DUP_ACK_THRESHOLD)
 			bbr->r_wanted_output = 1;
 	}
 }
 
 /*
  * Process the acknowledgment carried by an incoming segment.
  *
  * m       - the received mbuf; lro_nsegs is read for statistics and the
  *           mbuf is handed to the drop helpers on the error paths.
  * th      - TCP header of the segment.
  * so      - socket; its send buffer is trimmed by the acked amount.
  * tp      - connection control block.
  * to      - parsed TCP options (SACK blocks, timestamps).
  * tiwin   - window from the segment, compared with snd_wnd to detect a
  *           pure duplicate ACK.
  * tlen    - data length, passed to the drop helpers.
  * ofia    - out (may be NULL): set to 1 when everything including our FIN
  *           has been acked, else 0.  Not written on the early-return paths.
  * thflags - TCP flags, passed to ctf_do_dropafterack().
  * ret_val - out: written by ctf_do_dropafterack(), or set to 1 when the
  *           connection is closed here.
  *
  * Return value of 1, we do not need to call bbr_process_data().
  * return value of 0, bbr_process_data can be called.
  * For ret_val if its 0 the TCB is locked and valid, if its non-zero
  * its unlocked and probably unsafe to touch the TCB.
  */
 static int
 bbr_process_ack(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to,
     uint32_t tiwin, int32_t tlen,
     int32_t * ofia, int32_t thflags, int32_t * ret_val)
 {
 	int32_t ourfinisacked = 0;
 	int32_t acked_amount;
 	uint16_t nsegs;
 	int32_t acked;
 	uint32_t lost, sack_changed = 0;
 	struct mbuf *mfree;
 	struct tcp_bbr *bbr;
 	uint32_t prev_acked = 0;
 
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	/* Snapshot rc_lost so growth during this ACK can be detected below. */
 	lost = bbr->r_ctl.rc_lost;
 	nsegs = max(1, m->m_pkthdr.lro_nsegs);
 	/* An ACK for data we never sent: drop it. */
 	if (SEQ_GT(th->th_ack, tp->snd_max)) {
 		ctf_do_dropafterack(m, tp, th, thflags, tlen, ret_val);
 		bbr->r_wanted_output = 1;
 		return (1);
 	}
 	if (SEQ_GEQ(th->th_ack, tp->snd_una) || to->to_nsacks) {
 		/* Process the ack */
 		if (bbr->rc_in_persist)
 			tp->t_rxtshift = 0;
 		/* Same ack point and same window: count it as a dup-ack. */
 		if ((th->th_ack == tp->snd_una) && (tiwin == tp->snd_wnd))
 			bbr_strike_dupack(bbr);
 		sack_changed = bbr_log_ack(tp, to, th, &prev_acked);
 	}
 	bbr_lt_bw_sampling(bbr, bbr->r_ctl.rc_rcvtime, (bbr->r_ctl.rc_lost > lost));
 	if (__predict_false(SEQ_LEQ(th->th_ack, tp->snd_una))) {
 		/*
 		 * Old ack, behind the last one rcv'd or a duplicate ack
 		 * with SACK info.
 		 */
 		if (th->th_ack == tp->snd_una) {
 			bbr_ack_received(tp, bbr, th, 0, sack_changed, prev_acked, __LINE__, 0);
 			if (bbr->r_state == TCPS_SYN_SENT) {
 				/*
 				 * Special case on where we sent SYN. When
 				 * the SYN-ACK is processed in syn_sent
 				 * state it bumps the snd_una. This causes
 				 * us to hit here even though we did ack 1
 				 * byte.
 				 *
 				 * Go through the nothing left case so we
 				 * send data.
 				 */
 				goto nothing_left;
 			}
 		}
 		return (0);
 	}
 	/*
 	 * If we reach this point, ACK is not a duplicate, i.e., it ACKs
 	 * something we sent.
 	 */
 	if (tp->t_flags & TF_NEEDSYN) {
 		/*
 		 * T/TCP: Connection was half-synchronized, and our SYN has
 		 * been ACK'd (so connection is now fully synchronized).  Go
 		 * to non-starred state, increment snd_una for ACK of SYN,
 		 * and check if we can do window scaling.
 		 */
 		tp->t_flags &= ~TF_NEEDSYN;
 		tp->snd_una++;
 		/* Do window scaling? */
 		if ((tp->t_flags & (TF_RCVD_SCALE | TF_REQ_SCALE)) ==
 		    (TF_RCVD_SCALE | TF_REQ_SCALE)) {
 			tp->rcv_scale = tp->request_r_scale;
 			/* Send window already scaled. */
 		}
 	}
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	acked = BYTES_THIS_ACK(tp, th);
 	KMOD_TCPSTAT_ADD(tcps_rcvackpack, (int)nsegs);
 	KMOD_TCPSTAT_ADD(tcps_rcvackbyte, acked);
 
 	/*
 	 * If we just performed our first retransmit, and the ACK arrives
 	 * within our recovery window, then it was a mistake to do the
 	 * retransmit in the first place.  Recover our original cwnd and
 	 * ssthresh, and proceed to transmit where we left off.
 	 */
 	if (tp->t_flags & TF_PREVVALID) {
 		tp->t_flags &= ~TF_PREVVALID;
 		if (tp->t_rxtshift == 1 &&
 		    (int)(ticks - tp->t_badrxtwin) < 0)
 			bbr_cong_signal(tp, th, CC_RTO_ERR, NULL);
 	}
 	/* Drop the acked bytes from the send buffer under its lock. */
 	SOCKBUF_LOCK(&so->so_snd);
 	/* Never cut more than the buffer actually holds. */
 	acked_amount = min(acked, (int)sbavail(&so->so_snd));
 	tp->snd_wnd -= acked_amount;
 	mfree = sbcut_locked(&so->so_snd, acked_amount);
 	/* NB: sowwakeup_locked() does an implicit unlock. */
 	sowwakeup_locked(so);
 	/* Free the cut chain only after the lock has been released. */
 	m_freem(mfree);
 	if (SEQ_GT(th->th_ack, tp->snd_una)) {
 		bbr_collapse_rtt(tp, bbr, TCP_REXMTVAL(tp));
 	}
 	tp->snd_una = th->th_ack;
 	bbr_ack_received(tp, bbr, th, acked, sack_changed, prev_acked, __LINE__, (bbr->r_ctl.rc_lost - lost));
 	if (IN_RECOVERY(tp->t_flags)) {
 		/* Still short of the recovery point: partial ack, else leave recovery. */
 		if (SEQ_LT(th->th_ack, tp->snd_recover) &&
 		    (SEQ_LT(th->th_ack, tp->snd_max))) {
 			tcp_bbr_partialack(tp);
 		} else {
 			bbr_post_recovery(tp);
 		}
 	}
 	/* Keep snd_recover and snd_nxt from falling behind. */
 	if (SEQ_GT(tp->snd_una, tp->snd_recover)) {
 		tp->snd_recover = tp->snd_una;
 	}
 	if (SEQ_LT(tp->snd_nxt, tp->snd_max)) {
 		tp->snd_nxt = tp->snd_max;
 	}
 	if (tp->snd_una == tp->snd_max) {
 		/* Nothing left outstanding */
 nothing_left:
 		bbr_log_progress_event(bbr, tp, ticks, PROGRESS_CLEAR, __LINE__);
 		if (sbavail(&so->so_snd) == 0)
 			bbr->rc_tp->t_acktime = 0;
 		if ((sbused(&so->so_snd) == 0) &&
 		    (tp->t_flags & TF_SENTFIN)) {
 			ourfinisacked = 1;
 		}
 		bbr_timer_cancel(bbr, __LINE__, bbr->r_ctl.rc_rcvtime);
 		if (bbr->rc_in_persist == 0) {
 			bbr->r_ctl.rc_went_idle_time = bbr->r_ctl.rc_rcvtime;
 		}
 		sack_filter_clear(&bbr->r_ctl.bbr_sf, tp->snd_una);
 		bbr_log_ack_clear(bbr, bbr->r_ctl.rc_rcvtime);
 		/*
 		 * We invalidate the last ack here since we
 		 * don't want to transfer forward the time
 		 * for our sum's calculations.
 		 */
 		if ((tp->t_state >= TCPS_FIN_WAIT_1) &&
 		    (sbavail(&so->so_snd) == 0) &&
 		    (tp->t_flags2 & TF2_DROP_AF_DATA)) {
 			/*
 			 * The socket was gone and the peer sent data, time
 			 * to reset him.
 			 */
 			*ret_val = 1;
 			tcp_log_end_status(tp, TCP_EI_STATUS_DATA_A_CLOSE);
 			/* tcp_close will kill the inp pre-log the Reset */
 			tcp_log_end_status(tp, TCP_EI_STATUS_SERVER_RST);
 			/* From here on tp is whatever tcp_close() returned. */
 			tp = tcp_close(tp);
 			ctf_do_dropwithreset(m, tp, th, BANDLIM_UNLIMITED, tlen);
 			BBR_STAT_INC(bbr_dropped_af_data);
 			return (1);
 		}
 		/* Set need output so persist might get set */
 		bbr->r_wanted_output = 1;
 	}
 	if (ofia)
 		*ofia = ourfinisacked;
 	return (0);
 }
 
 /*
  * Put the connection into persist mode, if it is not in it already.
  *
  * Cancels the running timer, resets the retransmit shift and the last
  * delay value, records cts as the time the connection went idle, and
  * closes out the time accounting for the current BBR state.  'line' is
  * only forwarded to the persist log record.
  */
 static void
 bbr_enter_persist(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts, int32_t line)
 {
 	if (bbr->rc_in_persist != 0)
 		return;
 
 	bbr_timer_cancel(bbr, __LINE__, cts);
 	bbr->r_ctl.rc_last_delay_val = 0;
 	tp->t_rxtshift = 0;
 	bbr->rc_in_persist = 1;
 	bbr->r_ctl.rc_went_idle_time = cts;
 	bbr_log_type_pesist(bbr, cts, 0, line, 1);
 
 	/* Time freezes for the state, so do the accounting now */
 	if (SEQ_GT(cts, bbr->r_ctl.rc_bbr_state_time)) {
 		uint32_t time_in = cts - bbr->r_ctl.rc_bbr_state_time;
 		int32_t slot;
 
 		/* PROBE_BW is accounted per sub-state, in slots from 5 up. */
 		if (bbr->rc_bbr_state == BBR_STATE_PROBE_BW)
 			slot = bbr_state_val(bbr) + 5;
 		else
 			slot = bbr->rc_bbr_state;
 		counter_u64_add(bbr_state_time[slot], time_in);
 	}
 	bbr->r_ctl.rc_bbr_state_time = cts;
 }
 
 /*
  * Decide how to resume after an idle period of idle_time.
  *
  * Below bbr_idle_restart_threshold nothing is done and the state
  * transitions that were in progress simply continue.  At or above it,
  * the connection either moves to BBR_STATE_IDLE_EXIT (when
  * rc_use_idle_restart is set) or, if it is in PROBE_BW, changes
  * sub-state.
  */
 static void
 bbr_restart_after_idle(struct tcp_bbr *bbr, uint32_t cts, uint32_t idle_time)
 {
 	if (idle_time < bbr_idle_restart_threshold)
 		return;
 
 	if (!bbr->rc_use_idle_restart) {
 		if (bbr->rc_bbr_state == BBR_STATE_PROBE_BW)
 			bbr_substate_change(bbr, cts, __LINE__, 1);
 		return;
 	}
 
 	bbr->rc_bbr_state = BBR_STATE_IDLE_EXIT;
 	/*
 	 * The target is computed with both gains at BBR_UNIT, so the
 	 * ramp-up stops once the pipe is full again for the current
 	 * b/w estimate.
 	 */
 	bbr->r_ctl.rc_bbr_hptsi_gain = BBR_UNIT;
 	bbr->r_ctl.rc_bbr_cwnd_gain = BBR_UNIT;
 	bbr_set_state_target(bbr, __LINE__);
 	/* With the target fixed, switch to the startup gains to ramp up. */
 	bbr->r_ctl.rc_bbr_hptsi_gain = bbr->r_ctl.rc_startup_pg;
 	bbr->r_ctl.rc_bbr_cwnd_gain = bbr->r_ctl.rc_startup_pg;
 	bbr_log_type_statechange(bbr, cts, __LINE__);
 }
 
 /*
  * Take the connection out of persist mode; a no-op when it is not in it.
  *
  * Computes how long the connection was idle, removes it from the hpts
  * wheel (clearing the pacing bookkeeping) if it is queued there, forces
  * a new time based epoch, restarts the state-time and lost accounting
  * at cts, and for PROBE_BW / PROBE_RTT lets bbr_restart_after_idle()
  * decide whether a fast restart is needed.  'line' is only forwarded to
  * the persist log record.
  */
 static void
 bbr_exit_persist(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts, int32_t line)
 {
 	uint32_t idle_time;
 
 	if (!bbr->rc_in_persist)
 		return;
 
 	idle_time = bbr_calc_time(cts, bbr->r_ctl.rc_went_idle_time);
 	bbr->rc_in_persist = 0;
 	bbr->rc_hit_state_1 = 0;
 	bbr->r_ctl.rc_del_time = cts;
 
 	/* Pull the connection off the pacer and forget pending pacing state. */
 	if (tcp_in_hpts(bbr->rc_tp)) {
 		tcp_hpts_remove(bbr->rc_tp);
 		bbr->rc_timer_first = 0;
 		bbr->r_ctl.rc_hpts_flags = 0;
 		bbr->r_ctl.rc_last_delay_val = 0;
 		bbr->r_ctl.rc_hptsi_agg_delay = 0;
 		bbr->r_agg_early_set = 0;
 		bbr->r_ctl.rc_agg_early = 0;
 	}
 	bbr_log_type_pesist(bbr, cts, idle_time, line, 0);
 
 	if (idle_time >= bbr_rtt_probe_time) {
 		/*
 		 * Outstanding data dropped to nothing and we waited at
 		 * least bbr_rtt_probe_time, so this counts as an RTT_PROBE
 		 * session.
 		 */
 		bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_PERSIST, 0);
 		bbr->r_ctl.rc_rtt_shrinks = cts;
 		bbr->r_ctl.last_in_probertt = bbr->r_ctl.rc_rtt_shrinks;
 	}
 	tp->t_rxtshift = 0;
 
 	/* Force a time based epoch */
 	bbr_set_epoch(bbr, cts, __LINE__);
 	/*
 	 * Re-base the lost count so nothing lost while stuck in persist is
 	 * charged to the state we resume in.
 	 */
 	bbr->r_ctl.bbr_lost_at_state = bbr->r_ctl.rc_lost;
 	/* Time un-freezes for the state */
 	bbr->r_ctl.rc_bbr_state_time = cts;
 
 	switch (bbr->rc_bbr_state) {
 	case BBR_STATE_PROBE_BW:
 	case BBR_STATE_PROBE_RTT:
 		/* Going back to probe-bw or probe_rtt may need a fast restart. */
 		bbr_restart_after_idle(bbr, cts, idle_time);
 		break;
 	default:
 		break;
 	}
 }
 
 /*
  * Mark every send map entry that lies beyond the peer's (shrunken)
  * window edge, snd_una + snd_wnd, as BBR_RWND_COLLAPSED.
  *
  * The entry straddling the edge is split at the edge when that is
  * allowed; otherwise the whole straddling entry is marked.
  */
 static void
 bbr_collapsed_window(struct tcp_bbr *bbr)
 {
 	/*
 	 * The stranded entries cannot cause us to abort the connection and
 	 * are really "unsent".  Simply pretending they were never sent will
 	 * not work though: a buggy client may have kept some of the data,
 	 * i.e. collapsed the window without acking, and ack it once the
 	 * window opens again, which would leave us in an ack war.  So the
 	 * map is walked and the stranded part is split off and flagged.
 	 */
 	struct bbr_sendmap *rsm, *first;
 	tcp_seq max_seq;
 	uint32_t maxseg;
 	int marked = 0;
 
 	maxseg = bbr->rc_tp->t_maxseg - bbr->rc_last_options;
 	max_seq = bbr->rc_tp->snd_una + bbr->rc_tp->snd_wnd;
 	bbr_log_type_rwnd_collapse(bbr, max_seq, 1, 0);
 
 	/*
 	 * Clear stale marks while looking for the entry containing (or
 	 * touching) max_seq; rsm ends up NULL when there is none.
 	 */
 	TAILQ_FOREACH(rsm, &bbr->r_ctl.rc_map, r_next) {
 		if (rsm->r_flags & BBR_RWND_COLLAPSED)
 			rsm->r_flags &= ~BBR_RWND_COLLAPSED;
 		if (SEQ_GEQ(max_seq, rsm->r_start) &&
 		    SEQ_GEQ(rsm->r_end, max_seq))
 			break;
 	}
 	bbr->rc_has_collapsed = 0;
 	if (rsm == NULL) {
 		/* Nothing to do strange */
 		return;
 	}
 
 	if (max_seq == rsm->r_start) {
 		/* The edge is at the front of this entry: start marking here. */
 		first = rsm;
 	} else if (max_seq == rsm->r_end) {
 		/* The edge is at the back of this entry: start with the next. */
 		first = TAILQ_NEXT(rsm, r_next);
 		if (first == NULL) {
 			/* Huh? */
 			return;
 		}
 	} else {
 		/*
 		 * The edge falls inside this entry.  Splitting is refused
 		 * when it would create a small piece (under 1/8 of maxseg)
 		 * while the small-map limit is already reached, so that an
 		 * attacker cannot fragment the send map and run us out of
 		 * memory.
 		 */
 		int before, after;
 		int can_split = 0;
 
 		before = max_seq - rsm->r_start;
 		after = rsm->r_end - max_seq;
 		if ((before >= (maxseg/8)) &&
 		    (after >= (maxseg/8)))
 			can_split = 1;
 		else if (bbr->r_ctl.rc_num_small_maps_alloced < bbr_sack_block_limit)
 			can_split = 1;
 
 		/* Default: no split, mark the whole straddling entry. */
 		first = rsm;
 		if (can_split && SEQ_LT(max_seq, rsm->r_end)) {
 			struct bbr_sendmap *tail;
 
 			tail = bbr_alloc_limit(bbr, BBR_LIMIT_TYPE_SPLIT);
 			if (tail != NULL) {
 				/* Clone it and link the tail in behind rsm. */
 				bbr_log_type_rwnd_collapse(bbr, max_seq, 3, 0);
 				bbr_clone_rsm(bbr, tail, rsm, max_seq);
 				TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_map, rsm, tail, r_next);
 				if (rsm->r_in_tmap) {
 					TAILQ_INSERT_AFTER(&bbr->r_ctl.rc_tmap, rsm, tail, r_tnext);
 					tail->r_in_tmap = 1;
 				}
 				first = tail;
 			}
 		}
 	}
 
 	BBR_STAT_INC(bbr_collapsed_win);
 	/* Flag everything from 'first' to the end of the map. */
 	TAILQ_FOREACH_FROM(first, &bbr->r_ctl.rc_map, r_next) {
 		first->r_flags |= BBR_RWND_COLLAPSED;
 		marked++;
 		bbr->rc_has_collapsed = 1;
 	}
 	bbr_log_type_rwnd_collapse(bbr, max_seq, 4, marked);
 }
 
 static void
 bbr_un_collapse_window(struct tcp_bbr *bbr)
 {
 	struct bbr_sendmap *rsm;
 	int cleared = 0;
 
 	TAILQ_FOREACH_REVERSE(rsm, &bbr->r_ctl.rc_map, bbr_head, r_next) {
 		if (rsm->r_flags & BBR_RWND_COLLAPSED) {
 			/* Clear the flag */
 			rsm->r_flags &= ~BBR_RWND_COLLAPSED;
 			cleared++;
 		} else
 			break;
 	}
 	bbr_log_type_rwnd_collapse(bbr,
 				   (bbr->rc_tp->snd_una + bbr->rc_tp->snd_wnd), 0, cleared);
 	bbr->rc_has_collapsed = 0;
 }
 
 /*
  * Finish input processing for a segment: apply any send-window update
  * it carries, track whether the peer collapsed (or re-opened) its
  * window, move in or out of persist mode, hand the payload to the
  * socket (in-order fast path or tcp_reass()) and process a FIN.
  *
  * The mbuf "m" is always consumed: it is either appended to the
  * receive buffer, passed to tcp_reass() or freed.
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_process_data(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt)
 {
 	/*
 	 * Update window information. Don't look at window if no ACK: TAC's
 	 * send garbage on first SYN.
 	 */
 	uint16_t nsegs;
 	int32_t tfo_syn;
 	struct tcp_bbr *bbr;
 
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	/* Always account for at least one segment, even if lro_nsegs is 0 */
 	nsegs = max(1, m->m_pkthdr.lro_nsegs);
 	/*
 	 * Take the advertised window when the segment is newer than the
 	 * one that last updated it (by sequence, then by ack), or when
 	 * seq and ack are unchanged but the window grew.
 	 */
 	if ((thflags & TH_ACK) &&
 	    (SEQ_LT(tp->snd_wl1, th->th_seq) ||
 	    (tp->snd_wl1 == th->th_seq && (SEQ_LT(tp->snd_wl2, th->th_ack) ||
 	    (tp->snd_wl2 == th->th_ack && tiwin > tp->snd_wnd))))) {
 		/* keep track of pure window updates */
 		if (tlen == 0 &&
 		    tp->snd_wl2 == th->th_ack && tiwin > tp->snd_wnd)
 			KMOD_TCPSTAT_INC(tcps_rcvwinupd);
 		tp->snd_wnd = tiwin;
 		tp->snd_wl1 = th->th_seq;
 		tp->snd_wl2 = th->th_ack;
 		if (tp->snd_wnd > tp->max_sndwnd)
 			tp->max_sndwnd = tp->snd_wnd;
 		bbr->r_wanted_output = 1;
 	} else if (thflags & TH_ACK) {
 		/* Same ack point but a smaller window: accept the shrink too */
 		if ((tp->snd_wl2 == th->th_ack) && (tiwin < tp->snd_wnd)) {
 			tp->snd_wnd = tiwin;
 			tp->snd_wl1 = th->th_seq;
 			tp->snd_wl2 = th->th_ack;
 		}
 	}
 	if (tp->snd_wnd < ctf_outstanding(tp))
 		/* The peer collapsed its window on us */
 		bbr_collapsed_window(bbr);
  	else if (bbr->rc_has_collapsed)
 		bbr_un_collapse_window(bbr);
 	/* Was persist timer active and now we have window space? */
 	if ((bbr->rc_in_persist != 0) &&
 	    (tp->snd_wnd >= min((bbr->r_ctl.rc_high_rwnd/2),
 				bbr_minseg(bbr)))) {
 		/*
 		 * Make the rate persist at end of persist mode if idle long
 		 * enough
 		 */
 		bbr_exit_persist(tp, bbr, bbr->r_ctl.rc_rcvtime, __LINE__);
 
 		/* Make sure we output to start the timer */
 		bbr->r_wanted_output = 1;
 	}
 	/*
 	 * Do we need to enter persist? Only when nothing is outstanding
 	 * (snd_max == snd_una), the window is below the threshold and the
 	 * send buffer holds more than the window allows.
 	 */
 	if ((bbr->rc_in_persist == 0) &&
 	    (tp->snd_wnd < min((bbr->r_ctl.rc_high_rwnd/2), bbr_minseg(bbr))) &&
 	    TCPS_HAVEESTABLISHED(tp->t_state) &&
 	    (tp->snd_max == tp->snd_una) &&
 	    sbavail(&so->so_snd) &&
 	    (sbavail(&so->so_snd) > tp->snd_wnd)) {
 		/* No send window.. we must enter persist */
 		bbr_enter_persist(tp, bbr, bbr->r_ctl.rc_rcvtime, __LINE__);
 	}
 	/* TF2_DROP_AF_DATA set: discard the segment, TCB stays locked */
 	if (tp->t_flags2 & TF2_DROP_AF_DATA) {
 		m_freem(m);
 		return (0);
 	}
 	/*
 	 * We don't support urgent data but
 	 * drag along the up just to make sure
 	 * if there is a stack switch no one
 	 * is surprised.
 	 */
 	tp->rcv_up = tp->rcv_nxt;
 
 	/*
 	 * Process the segment text, merging it into the TCP sequencing
 	 * queue, and arranging for acknowledgment of receipt if necessary.
 	 * This process logically involves adjusting tp->rcv_wnd as data is
 	 * presented to the user (this happens in tcp_usrreq.c, case
 	 * PRU_RCVD).  If a FIN has already been received on this connection
 	 * then we just ignore the text.
 	 */
 	tfo_syn = ((tp->t_state == TCPS_SYN_RECEIVED) &&
 		   IS_FASTOPEN(tp->t_flags));
 	/*
 	 * NOTE(review): the (tfo_syn && tlen > 0) term looks subsumed by
 	 * the plain tlen test in the same condition -- confirm.
 	 */
 	if ((tlen || (thflags & TH_FIN) || (tfo_syn && tlen > 0)) &&
 	    TCPS_HAVERCVDFIN(tp->t_state) == 0) {
 		/* Snapshot values needed for the SACK/DSACK bookkeeping below */
 		tcp_seq save_start = th->th_seq;
 		tcp_seq save_rnxt  = tp->rcv_nxt;
 		int     save_tlen  = tlen;
 
 		m_adj(m, drop_hdrlen);	/* delayed header drop */
 		/*
 		 * Insert segment which includes th into TCP reassembly
 		 * queue with control block tp.  Set thflags to whether
 		 * reassembly now includes a segment with FIN.  This handles
 		 * the common case inline (segment is the next to be
 		 * received on an established connection, and the queue is
 		 * empty), avoiding linkage into and removal from the queue
 		 * and repetition of various conversions. Set DELACK for
 		 * segments received in order, but ack immediately when
 		 * segments are out of order (so fast retransmit can work).
 		 */
 		if (th->th_seq == tp->rcv_nxt &&
 		    SEGQ_EMPTY(tp) &&
 		    (TCPS_HAVEESTABLISHED(tp->t_state) ||
 		    tfo_syn)) {
 #ifdef NETFLIX_SB_LIMITS
 			u_int mcnt, appended;
 
 			/*
 			 * Reserve the mbuf's memory count against the
 			 * shared limit; on failure the segment is dropped.
 			 */
 			if (so->so_rcv.sb_shlim) {
 				mcnt = m_memcnt(m);
 				appended = 0;
 				if (counter_fo_get(so->so_rcv.sb_shlim, mcnt,
 				    CFO_NOSLEEP, NULL) == false) {
 					counter_u64_add(tcp_sb_shlim_fails, 1);
 					m_freem(m);
 					return (0);
 				}
 			}
 
 #endif
 			if (DELAY_ACK(tp, bbr, nsegs) || tfo_syn) {
 				bbr->bbr_segs_rcvd += max(1, nsegs);
 				tp->t_flags |= TF_DELACK;
 				bbr_timer_cancel(bbr, __LINE__, bbr->r_ctl.rc_rcvtime);
 			} else {
 				bbr->r_wanted_output = 1;
 				tp->t_flags |= TF_ACKNOW;
 			}
 			tp->rcv_nxt += tlen;
 			/*
 			 * Stamp the tick of the first inbound data byte once;
 			 * 0 means "unset" so a tick value of 0 is stored as 1.
 			 */
 			if (tlen &&
 			    ((tp->t_flags2 & TF2_FBYTES_COMPLETE) == 0) &&
 			    (tp->t_fbyte_in == 0)) {
 				tp->t_fbyte_in = ticks;
 				if (tp->t_fbyte_in == 0)
 					tp->t_fbyte_in = 1;
 				if (tp->t_fbyte_out && tp->t_fbyte_in)
 					tp->t_flags2 |= TF2_FBYTES_COMPLETE;
 			}
 			/* From here on thflags only carries the FIN bit */
 			thflags = tcp_get_flags(th) & TH_FIN;
 			KMOD_TCPSTAT_ADD(tcps_rcvpack, (int)nsegs);
 			KMOD_TCPSTAT_ADD(tcps_rcvbyte, tlen);
 			SOCKBUF_LOCK(&so->so_rcv);
 			if (so->so_rcv.sb_state & SBS_CANTRCVMORE)
 				m_freem(m);
 			else
 #ifdef NETFLIX_SB_LIMITS
 				appended =
 #endif
 					sbappendstream_locked(&so->so_rcv, m, 0);
 			/* NB: sorwakeup_locked() does an implicit unlock. */
 			sorwakeup_locked(so);
 #ifdef NETFLIX_SB_LIMITS
 			/* Hand back whatever part of the reservation was not used */
 			if (so->so_rcv.sb_shlim && appended != mcnt)
 				counter_fo_release(so->so_rcv.sb_shlim,
 				    mcnt - appended);
 #endif
 
 		} else {
 			/*
 			 * XXX: Due to the header drop above "th" is
 			 * theoretically invalid by now.  Fortunately
 			 * m_adj() doesn't actually free any mbufs when
 			 * trimming from the head.
 			 */
 			tcp_seq temp = save_start;
 
 			/* Out of order (or queue not empty): reassemble, ack now */
 			thflags = tcp_reass(tp, th, &temp, &tlen, m);
 			tp->t_flags |= TF_ACKNOW;
 			if (tp->t_flags & TF_WAKESOR) {
 				tp->t_flags &= ~TF_WAKESOR;
 				/* NB: sorwakeup_locked() does an implicit unlock. */
 				sorwakeup_locked(so);
 			}
 		}
 		/*
 		 * Update the receiver SACK/DSACK blocks using the values
 		 * saved before the segment was consumed.
 		 */
 		if ((tp->t_flags & TF_SACK_PERMIT) &&
 		    (save_tlen > 0) &&
 		    TCPS_HAVEESTABLISHED(tp->t_state)) {
 			if ((tlen == 0) && (SEQ_LT(save_start, save_rnxt))) {
 				/*
 				 * DSACK actually handled in the fastpath
 				 * above.
 				 */
 				tcp_update_sack_list(tp, save_start,
 				    save_start + save_tlen);
 			} else if ((tlen > 0) && SEQ_GT(tp->rcv_nxt, save_rnxt)) {
 				if ((tp->rcv_numsacks >= 1) &&
 				    (tp->sackblks[0].end == save_start)) {
 					/*
 					 * Partial overlap, recorded at todrop
 					 * above.
 					 */
 					tcp_update_sack_list(tp,
 					    tp->sackblks[0].start,
 					    tp->sackblks[0].end);
 				} else {
 					tcp_update_dsack_list(tp, save_start,
 					    save_start + save_tlen);
 				}
 			} else if (tlen >= save_tlen) {
 				/* Update of sackblks. */
 				tcp_update_dsack_list(tp, save_start,
 				    save_start + save_tlen);
 			} else if (tlen > 0) {
 				tcp_update_dsack_list(tp, save_start,
 				    save_start + tlen);
 			}
 		}
 	} else {
 		/* No usable text (or FIN already received): drop, ignore FIN */
 		m_freem(m);
 		thflags &= ~TH_FIN;
 	}
 
 	/*
 	 * If FIN is received ACK the FIN and let the user know that the
 	 * connection is closing.
 	 */
 	if (thflags & TH_FIN) {
 		if (TCPS_HAVERCVDFIN(tp->t_state) == 0) {
 			/* The socket upcall is handled by socantrcvmore. */
 			socantrcvmore(so);
 			/*
 			 * If connection is half-synchronized (ie NEEDSYN
 			 * flag on) then delay ACK, so it may be piggybacked
 			 * when SYN is sent. Otherwise, since we received a
 			 * FIN then no more input can be expected, send ACK
 			 * now.
 			 */
 			if (tp->t_flags & TF_NEEDSYN) {
 				tp->t_flags |= TF_DELACK;
 				bbr_timer_cancel(bbr,
 				    __LINE__, bbr->r_ctl.rc_rcvtime);
 			} else {
 				tp->t_flags |= TF_ACKNOW;
 			}
 			/* The FIN occupies one sequence number */
 			tp->rcv_nxt++;
 		}
 		switch (tp->t_state) {
 			/*
 			 * In SYN_RECEIVED and ESTABLISHED STATES enter the
 			 * CLOSE_WAIT state.
 			 */
 		case TCPS_SYN_RECEIVED:
 			tp->t_starttime = ticks;
 			/* FALLTHROUGH */
 		case TCPS_ESTABLISHED:
 			tcp_state_change(tp, TCPS_CLOSE_WAIT);
 			break;
 
 			/*
 			 * If still in FIN_WAIT_1 STATE FIN has not been
 			 * acked so enter the CLOSING state.
 			 */
 		case TCPS_FIN_WAIT_1:
 			tcp_state_change(tp, TCPS_CLOSING);
 			break;
 
 			/*
 			 * In FIN_WAIT_2 state enter the TIME_WAIT state,
 			 * starting the time-wait timer, turning off the
 			 * other standard timers.
 			 */
 		case TCPS_FIN_WAIT_2:
 			bbr->rc_timer_first = 1;
 			bbr_timer_cancel(bbr,
 			    __LINE__, bbr->r_ctl.rc_rcvtime);
 			tcp_twstart(tp);
 			/* This is the only path that reports the TCB as gone */
 			return (1);
 		}
 	}
 	/*
 	 * Return any desired output.
 	 */
 	if ((tp->t_flags & TF_ACKNOW) ||
 	    (sbavail(&so->so_snd) > ctf_outstanding(tp))) {
 		bbr->r_wanted_output = 1;
 	}
 	return (0);
 }
 
 /*
  * Fast path for a pure, in-sequence data segment. Nothing here is
  * really faster; the data path is simply broken out the same way the
  * fast-ack path is.
  *
  * Returns 1 when the segment was fully handled here (the mbuf has been
  * consumed), 0 when the caller must take the slow path instead.
  */
 static int
 bbr_do_fastnewdata(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t nxt_pkt)
 {
 	struct tcp_bbr *bbr;
 	int32_t grow_to;	/* automatic sockbuf scaling */
 	uint16_t seg_cnt;
 #ifdef NETFLIX_SB_LIMITS
 	u_int charged, queued;
 #endif
 
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 
 	/*
 	 * Eligibility checks. Any one of these sends the segment to the
 	 * slow path untouched.
 	 */
 	if (bbr->r_ctl.rc_resend != NULL) {
 		/* A retransmission is pending */
 		return (0);
 	}
 	if (tiwin != 0 && tiwin != tp->snd_wnd) {
 		/* The segment also changes the send window */
 		return (0);
 	}
 	if (__predict_false((tp->t_flags & (TF_NEEDSYN | TF_NEEDFIN)) != 0)) {
 		/* We still owe the peer a SYN or a FIN */
 		return (0);
 	}
 	if (__predict_false((to->to_flags & TOF_TS) != 0 &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent))) {
 		/* Timestamp is older than the one we hold */
 		return (0);
 	}
 	if (__predict_false(th->th_ack != tp->snd_una)) {
 		/* It acknowledges something, not a pure data segment */
 		return (0);
 	}
 	if (__predict_false(tlen > sbspace(&so->so_rcv))) {
 		/* The receive buffer cannot hold it */
 		return (0);
 	}
 
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * the timestamp. NOTE that the test is modified according to the
 	 * latest proposal of the tcplw@cray.com list (Braden 1993/04/26).
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent)) {
 		tp->ts_recent = to->to_tsval;
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 	}
 
 	/*
 	 * From here on we own the segment: it is in-sequence data with
 	 * nothing queued for reassembly and room in the socket buffer.
 	 */
 	seg_cnt = max(1, m->m_pkthdr.lro_nsegs);
 
 #ifdef NETFLIX_SB_LIMITS
 	if (so->so_rcv.sb_shlim) {
 		/* Reserve against the shared limit, drop on failure */
 		charged = m_memcnt(m);
 		queued = 0;
 		if (counter_fo_get(so->so_rcv.sb_shlim, charged,
 		    CFO_NOSLEEP, NULL) == false) {
 			counter_u64_add(tcp_sb_shlim_fails, 1);
 			m_freem(m);
 			return (1);
 		}
 	}
 #endif
 	/* A SACK report we were sending is no longer needed */
 	if (tp->rcv_numsacks)
 		tcp_clean_sackreport(tp);
 	KMOD_TCPSTAT_INC(tcps_preddat);
 	tp->rcv_nxt += tlen;
 	/* Remember when the first inbound byte arrived (0 means unset) */
 	if (tlen &&
 	    (tp->t_fbyte_in == 0) &&
 	    ((tp->t_flags2 & TF2_FBYTES_COMPLETE) == 0)) {
 		tp->t_fbyte_in = ticks;
 		if (tp->t_fbyte_in == 0)
 			tp->t_fbyte_in = 1;
 		if (tp->t_fbyte_out && tp->t_fbyte_in)
 			tp->t_flags2 |= TF2_FBYTES_COMPLETE;
 	}
 	/* Keep snd_wl1 from wrapping relative to th_seq */
 	tp->snd_wl1 = th->th_seq;
 	/* Keep rcv_up from wrapping relative to rcv_nxt */
 	tp->rcv_up = tp->rcv_nxt;
 	KMOD_TCPSTAT_ADD(tcps_rcvpack, (int)seg_cnt);
 	KMOD_TCPSTAT_ADD(tcps_rcvbyte, tlen);
 	grow_to = tcp_autorcvbuf(m, th, so, tp, tlen);
 
 	/* Queue the payload on the receive buffer */
 	SOCKBUF_LOCK(&so->so_rcv);
 	if (so->so_rcv.sb_state & SBS_CANTRCVMORE) {
 		/* The receive side is shut, discard the data */
 		m_freem(m);
 	} else {
 		/*
 		 * Apply the new buffer size if one was suggested; stop
 		 * auto-sizing once the reservation is refused.
 		 */
 		if (grow_to) {
 			if (!sbreserve_locked(so, SO_RCV, grow_to, NULL))
 				so->so_rcv.sb_flags &= ~SB_AUTOSIZE;
 		}
 		m_adj(m, drop_hdrlen);	/* delayed header drop */
 
 #ifdef NETFLIX_SB_LIMITS
 		queued =
 #endif
 			sbappendstream_locked(&so->so_rcv, m, 0);
 		ctf_calc_rwin(so, tp);
 	}
 	/* NB: sorwakeup_locked() does an implicit unlock. */
 	sorwakeup_locked(so);
 #ifdef NETFLIX_SB_LIMITS
 	/* Give back the part of the reservation that was not consumed */
 	if (so->so_rcv.sb_shlim && charged != queued)
 		counter_fo_release(so->so_rcv.sb_shlim, charged - queued);
 #endif
 	/* Either delay the ack or ask for output right away */
 	if (DELAY_ACK(tp, bbr, seg_cnt)) {
 		bbr->bbr_segs_rcvd += max(1, seg_cnt);
 		tp->t_flags |= TF_DELACK;
 		bbr_timer_cancel(bbr, __LINE__, bbr->r_ctl.rc_rcvtime);
 	} else {
 		tp->t_flags |= TF_ACKNOW;
 		bbr->r_wanted_output = 1;
 	}
 	return (1);
 }
 
 /*
  * This subfunction is used to try to highly optimize the
  * fast path. We again allow window updates that are
  * in sequence to remain in the fast-path. We also add
  * in the __predict's to attempt to help the compiler.
  *
  * The segment qualifies only when it is a new ack within what we have
  * sent, carries a non-zero window, and the connection is not waiting
  * on a SYN/FIN, not in recovery, not retransmitting, not in persist
  * and has nothing SACKed on the scoreboard.
  *
  * Note that if we return a 0, then we can *not* process
  * it and the caller should push the packet into the
  * slow-path (the mbuf is untouched). If we return 1, then all is
  * well and the packet is fully processed (the mbuf has been freed).
  */
 static int
 bbr_fastack(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t nxt_pkt, uint8_t iptos)
 {
 	int32_t acked;
 	uint16_t nsegs;
 	uint32_t sack_changed;
 	uint32_t prev_acked = 0;
 	struct tcp_bbr *bbr;
 
 	if (__predict_false(SEQ_LEQ(th->th_ack, tp->snd_una))) {
 		/* Old ack, behind (or duplicate to) the last one rcv'd */
 		return (0);
 	}
 	if (__predict_false(SEQ_GT(th->th_ack, tp->snd_max))) {
 		/* Above what we have sent? */
 		return (0);
 	}
 	if (__predict_false(tiwin == 0)) {
 		/* zero window */
 		return (0);
 	}
 	if (__predict_false(tp->t_flags & (TF_NEEDSYN | TF_NEEDFIN))) {
 		/* We need a SYN or a FIN, unlikely.. */
 		return (0);
 	}
 	if ((to->to_flags & TOF_TS) && __predict_false(TSTMP_LT(to->to_tsval, tp->ts_recent))) {
 		/* Timestamp is behind .. old ack with seq wrap? */
 		return (0);
 	}
 	if (__predict_false(IN_RECOVERY(tp->t_flags))) {
 		/* Still recovering */
 		return (0);
 	}
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	if (__predict_false(bbr->r_ctl.rc_resend != NULL)) {
 		/* We are retransmitting */
 		return (0);
 	}
 	if (__predict_false(bbr->rc_in_persist != 0)) {
 		/* In persist mode */
 		return (0);
 	}
 	if (bbr->r_ctl.rc_sacked) {
 		/* We have sack holes on our scoreboard */
 		return (0);
 	}
 	/* Ok if we reach here, we can process a fast-ack */
 	nsegs = max(1, m->m_pkthdr.lro_nsegs);
 	sack_changed = bbr_log_ack(tp, to, th, &prev_acked);
 	/*
 	 * We never detect loss in fast ack [we can't
 	 * have a sack and can't be in recovery so
 	 * we always pass 0 (nothing detected)].
 	 */
 	bbr_lt_bw_sampling(bbr, bbr->r_ctl.rc_rcvtime, 0);
 	/* Did the window get updated? */
 	if (tiwin != tp->snd_wnd) {
 		tp->snd_wnd = tiwin;
 		tp->snd_wl1 = th->th_seq;
 		if (tp->snd_wnd > tp->max_sndwnd)
 			tp->max_sndwnd = tp->snd_wnd;
 	}
 	/*
 	 * Do we need to exit persists?
 	 * NOTE(review): rc_in_persist was already required to be 0 to get
 	 * this far, so this only fires if the ack logging above changed
 	 * it -- confirm whether the check is still needed.
 	 */
 	if ((bbr->rc_in_persist != 0) &&
 	    (tp->snd_wnd >= min((bbr->r_ctl.rc_high_rwnd/2),
 			       bbr_minseg(bbr)))) {
 		bbr_exit_persist(tp, bbr, bbr->r_ctl.rc_rcvtime, __LINE__);
 		bbr->r_wanted_output = 1;
 	}
 	/* Do we need to enter persists? */
 	if ((bbr->rc_in_persist == 0) &&
 	    (tp->snd_wnd < min((bbr->r_ctl.rc_high_rwnd/2), bbr_minseg(bbr))) &&
 	    TCPS_HAVEESTABLISHED(tp->t_state) &&
 	    (tp->snd_max == tp->snd_una) &&
 	    sbavail(&so->so_snd) &&
 	    (sbavail(&so->so_snd) > tp->snd_wnd)) {
 		/* No send window.. we must enter persist */
 		bbr_enter_persist(tp, bbr, bbr->r_ctl.rc_rcvtime, __LINE__);
 	}
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * the timestamp. NOTE that the test is modified according to the
 	 * latest proposal of the tcplw@cray.com list (Braden 1993/04/26).
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent)) {
 		/*
 		 * Stamp the age from the arrival timeval in millisecond
 		 * ticks, the same way the other input paths in this file
 		 * set ts_recent_age, so the field is always kept in one
 		 * time base.
 		 */
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	/*
 	 * This is a pure ack for outstanding data.
 	 */
 	KMOD_TCPSTAT_INC(tcps_predack);
 
 	/*
 	 * "bad retransmit" recovery.
 	 */
 	if (tp->t_flags & TF_PREVVALID) {
 		tp->t_flags &= ~TF_PREVVALID;
 		if (tp->t_rxtshift == 1 &&
 		    (int)(ticks - tp->t_badrxtwin) < 0)
 			bbr_cong_signal(tp, th, CC_RTO_ERR, NULL);
 	}
 	/*
 	 * Recalculate the transmit timer / rtt.
 	 *
 	 * Some boxes send broken timestamp replies during the SYN+ACK
 	 * phase, ignore timestamps of 0 or we could calculate a huge RTT
 	 * and blow up the retransmit timer.
 	 */
 	acked = BYTES_THIS_ACK(tp, th);
 
 #ifdef TCP_HHOOK
 	/* Run HHOOK_TCP_ESTABLISHED_IN helper hooks. */
 	hhook_run_tcp_est_in(tp, th, to);
 #endif
 
 	KMOD_TCPSTAT_ADD(tcps_rcvackpack, (int)nsegs);
 	KMOD_TCPSTAT_ADD(tcps_rcvackbyte, acked);
 	/* Release the acknowledged bytes from the send buffer */
 	sbdrop(&so->so_snd, acked);
 
 	if (SEQ_GT(th->th_ack, tp->snd_una))
 		bbr_collapse_rtt(tp, bbr, TCP_REXMTVAL(tp));
 	tp->snd_una = th->th_ack;
 	/* With snd_una advanced, re-evaluate the peer's window state */
 	if (tp->snd_wnd < ctf_outstanding(tp))
 		/* The peer collapsed its window on us */
 		bbr_collapsed_window(bbr);
 	else if (bbr->rc_has_collapsed)
 		bbr_un_collapse_window(bbr);
 
 	if (SEQ_GT(tp->snd_una, tp->snd_recover)) {
 		tp->snd_recover = tp->snd_una;
 	}
 	bbr_ack_received(tp, bbr, th, acked, sack_changed, prev_acked, __LINE__, 0);
 	/*
 	 * Pull snd_wl2 up to prevent seq wrap relative to th_ack.
 	 */
 	tp->snd_wl2 = th->th_ack;
 	m_freem(m);
 	/*
 	 * If all outstanding data are acked, stop retransmit timer,
 	 * otherwise restart timer using current (possibly backed-off)
 	 * value. If process is waiting for space, wakeup/selwakeup/signal.
 	 * If data are ready to send, let tcp_output decide between more
 	 * output or persist.
 	 * Wake up the socket if we have room to write more.
 	 */
 	sowwakeup(so);
 	if (tp->snd_una == tp->snd_max) {
 		/* Nothing left outstanding */
 		bbr_log_progress_event(bbr, tp, ticks, PROGRESS_CLEAR, __LINE__);
 		if (sbavail(&so->so_snd) == 0)
 			bbr->rc_tp->t_acktime = 0;
 		bbr_timer_cancel(bbr, __LINE__, bbr->r_ctl.rc_rcvtime);
 		if (bbr->rc_in_persist == 0) {
 			/* Remember when the connection went idle */
 			bbr->r_ctl.rc_went_idle_time = bbr->r_ctl.rc_rcvtime;
 		}
 		sack_filter_clear(&bbr->r_ctl.bbr_sf, tp->snd_una);
 		bbr_log_ack_clear(bbr, bbr->r_ctl.rc_rcvtime);
 		/*
 		 * We invalidate the last ack here since we
 		 * don't want to transfer forward the time
 		 * for our sum's calculations.
 		 */
 		bbr->r_wanted_output = 1;
 	}
 	/* More data is waiting to go out */
 	if (sbavail(&so->so_snd)) {
 		bbr->r_wanted_output = 1;
 	}
 	return (1);
 }
 
 /*
  * Input handler for a connection in the SYN_SENT state. Validates the
  * segment, completes the active open (SYN|ACK -> ESTABLISHED or
  * FIN_WAIT_1) or switches to SYN_RECEIVED on a simultaneous open, then
  * hands ack and data processing to bbr_process_ack() and
  * bbr_process_data().
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_syn_sent(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	int32_t todrop;
 	int32_t ourfinisacked = 0;
 	struct tcp_bbr *bbr;
 	int32_t ret_val = 0;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	ctf_calc_rwin(so, tp);
 	/*
 	 * If the state is SYN_SENT: if seg contains an ACK, but not for our
 	 * SYN, drop the input. if seg contains a RST, then drop the
 	 * connection. if seg does not contain SYN, then drop it. Otherwise
 	 * this is an acceptable SYN segment initialize tp->rcv_nxt and
 	 * tp->irs if seg contains ack then advance tp->snd_una. BBR does
 	 * not support ECN so we will not say we are capable. if SYN has
 	 * been acked change to ESTABLISHED else SYN_RCVD state arrange for
 	 * segment to be acked (eventually) continue processing rest of
 	 * data/controls, beginning with URG
 	 */
 	/* An ACK outside (iss, snd_max] does not belong to our SYN: reset */
 	if ((thflags & TH_ACK) &&
 	    (SEQ_LEQ(th->th_ack, tp->iss) ||
 	    SEQ_GT(th->th_ack, tp->snd_max))) {
 		tcp_log_end_status(tp, TCP_EI_STATUS_RST_IN_FRONT);
 		ctf_do_dropwithreset(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 		return (1);
 	}
 	/* An acceptable ACK together with RST: the connection was refused */
 	if ((thflags & (TH_ACK | TH_RST)) == (TH_ACK | TH_RST)) {
 		TCP_PROBE5(connect__refused, NULL, tp,
 		    mtod(m, const char *), tp, th);
 		tp = tcp_drop(tp, ECONNREFUSED);
 		ctf_do_drop(m, tp);
 		return (1);
 	}
 	/* A RST without an ACK is dropped */
 	if (thflags & TH_RST) {
 		ctf_do_drop(m, tp);
 		return (1);
 	}
 	/* Anything that is not a SYN is dropped as well */
 	if (!(thflags & TH_SYN)) {
 		ctf_do_drop(m, tp);
 		return (1);
 	}
 	/* Acceptable SYN: record the peer's initial sequence number */
 	tp->irs = th->th_seq;
 	tcp_rcvseqinit(tp);
 	if (thflags & TH_ACK) {
 		/* Set when part of the data sent with a TFO SYN is still unacked */
 		int tfo_partial = 0;
 
 		KMOD_TCPSTAT_INC(tcps_connects);
 		soisconnected(so);
 #ifdef MAC
 		mac_socketpeer_set_from_mbuf(m, so);
 #endif
 		/* Do window scaling on this connection? */
 		if ((tp->t_flags & (TF_RCVD_SCALE | TF_REQ_SCALE)) ==
 		    (TF_RCVD_SCALE | TF_REQ_SCALE)) {
 			tp->rcv_scale = tp->request_r_scale;
 		}
 		tp->rcv_adv += min(tp->rcv_wnd,
 		    TCP_MAXWIN << tp->rcv_scale);
 		/*
 		 * If not all the data that was sent in the TFO SYN
 		 * has been acked, resend the remainder right away.
 		 */
 		if (IS_FASTOPEN(tp->t_flags) &&
 		    (tp->snd_una != tp->snd_max)) {
 			tp->snd_nxt = th->th_ack;
 			tfo_partial = 1;
 		}
 		/*
 		 * If there's data, delay ACK; if there's also a FIN ACKNOW
 		 * will be turned on later.
 		 */
 		if (DELAY_ACK(tp, bbr, 1) && tlen != 0 && !tfo_partial) {
 			bbr->bbr_segs_rcvd += 1;
 			tp->t_flags |= TF_DELACK;
 			bbr_timer_cancel(bbr, __LINE__, bbr->r_ctl.rc_rcvtime);
 		} else {
 			bbr->r_wanted_output = 1;
 			tp->t_flags |= TF_ACKNOW;
 		}
 		if (SEQ_GT(th->th_ack, tp->iss)) {
 			/*
 			 * The SYN is acked
 			 * handle it specially.
 			 */
 			bbr_log_syn(tp, to);
 		}
 		if (SEQ_GT(th->th_ack, tp->snd_una)) {
 			/*
 			 * We advance snd_una for the
 			 * fast open case. If th_ack is
 			 * acknowledging data beyond
 			 * snd_una we can't just call
 			 * ack-processing since the
 			 * data stream in our send-map
 			 * will start at snd_una + 1 (one
 			 * beyond the SYN). If its just
 			 * equal we don't need to do that
 			 * and there is no send_map.
 			 */
 			tp->snd_una++;
 		}
 		/*
 		 * Received <SYN,ACK> in SYN_SENT[*] state. Transitions:
 		 * SYN_SENT  --> ESTABLISHED SYN_SENT* --> FIN_WAIT_1
 		 */
 		tp->t_starttime = ticks;
 		if (tp->t_flags & TF_NEEDFIN) {
 			tcp_state_change(tp, TCPS_FIN_WAIT_1);
 			tp->t_flags &= ~TF_NEEDFIN;
 			thflags &= ~TH_SYN;
 		} else {
 			tcp_state_change(tp, TCPS_ESTABLISHED);
 			TCP_PROBE5(connect__established, NULL, tp,
 			    mtod(m, const char *), tp, th);
 			cc_conn_init(tp);
 		}
 	} else {
 		/*
 		 * Received initial SYN in SYN-SENT[*] state => simultaneous
 		 * open.  If segment contains CC option and there is a
 		 * cached CC, apply TAO test. If it succeeds, connection is *
 		 * half-synchronized. Otherwise, do 3-way handshake:
 		 * SYN-SENT -> SYN-RECEIVED SYN-SENT* -> SYN-RECEIVED* If
 		 * there was no CC option, clear cached CC value.
 		 */
 		tp->t_flags |= (TF_ACKNOW | TF_NEEDSYN | TF_SONOTCONN);
 		tcp_state_change(tp, TCPS_SYN_RECEIVED);
 	}
 	/*
 	 * Advance th->th_seq to correspond to first data byte. If data,
 	 * trim to stay within window, dropping FIN if necessary.
 	 */
 	th->th_seq++;
 	if (tlen > tp->rcv_wnd) {
 		todrop = tlen - tp->rcv_wnd;
 		/* A negative length trims from the tail of the chain */
 		m_adj(m, -todrop);
 		tlen = tp->rcv_wnd;
 		thflags &= ~TH_FIN;
 		KMOD_TCPSTAT_INC(tcps_rcvpackafterwin);
 		KMOD_TCPSTAT_ADD(tcps_rcvbyteafterwin, todrop);
 	}
 	tp->snd_wl1 = th->th_seq - 1;
 	tp->rcv_up = th->th_seq;
 	/*
 	 * Client side of transaction: already sent SYN and data. If the
 	 * remote host used T/TCP to validate the SYN, our data will be
 	 * ACK'd; if so, enter normal data segment processing in the middle
 	 * of step 5, ack processing. Otherwise, goto step 6.
 	 */
 	if (thflags & TH_ACK) {
 		if ((to->to_flags & TOF_TS) != 0) {
 			uint32_t t, rtt;
 
 			/*
 			 * Derive a first RTT sample from the echoed
 			 * timestamp: millisecond ticks, at least 1, scaled
 			 * by MS_IN_USEC before being fed to the timer and
 			 * the rttprop filter.
 			 */
 			t = tcp_tv_to_mssectick(&bbr->rc_tv);
 			if (TSTMP_GEQ(t, to->to_tsecr)) {
 				rtt = t - to->to_tsecr;
 				if (rtt == 0) {
 					rtt = 1;
 				}
 				rtt *= MS_IN_USEC;
 				tcp_bbr_xmit_timer(bbr, rtt, 0, 0, 0);
 				apply_filter_min_small(&bbr->r_ctl.rc_rttprop,
 						       rtt, bbr->r_ctl.rc_rcvtime);
 			}
 		}
 		/* A non-zero return means ack processing finished the segment */
 		if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, &ourfinisacked, thflags, &ret_val))
 			return (ret_val);
 		/* We may have changed to FIN_WAIT_1 above */
 		if (tp->t_state == TCPS_FIN_WAIT_1) {
 			/*
 			 * In FIN_WAIT_1 STATE in addition to the processing
 			 * for the ESTABLISHED state if our FIN is now
 			 * acknowledged then enter FIN_WAIT_2.
 			 */
 			if (ourfinisacked) {
 				/*
 				 * If we can't receive any more data, then
 				 * closing user can proceed. Starting the
 				 * timer is contrary to the specification,
 				 * but if we don't get a FIN we'll hang
 				 * forever.
 				 *
 				 * XXXjl: we should release the tp also, and
 				 * use a compressed state.
 				 */
 				if (so->so_rcv.sb_state & SBS_CANTRCVMORE) {
 					soisdisconnected(so);
 					tcp_timer_activate(tp, TT_2MSL,
 					    (tcp_fast_finwait2_recycle ?
 					    tcp_finwait2_timeout :
 					    TP_MAXIDLE(tp)));
 				}
 				tcp_state_change(tp, TCPS_FIN_WAIT_2);
 			}
 		}
 	}
 	/* Whatever is left (data and/or FIN) goes through the common path */
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 	    tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_syn_recv(struct mbuf *m, struct tcphdr *th, struct socket *so,
 		struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
 		uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	int32_t ourfinisacked = 0;
 	int32_t ret_val;
 	struct tcp_bbr *bbr;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	ctf_calc_rwin(so, tp);
 	if ((thflags & TH_ACK) &&
 	    (SEQ_LEQ(th->th_ack, tp->snd_una) ||
 	     SEQ_GT(th->th_ack, tp->snd_max))) {
 		tcp_log_end_status(tp, TCP_EI_STATUS_RST_IN_FRONT);
 		ctf_do_dropwithreset(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 		return (1);
 	}
 	if (IS_FASTOPEN(tp->t_flags)) {
 		/*
 		 * When a TFO connection is in SYN_RECEIVED, the only valid
 		 * packets are the initial SYN, a retransmit/copy of the
 		 * initial SYN (possibly with a subset of the original
 		 * data), a valid ACK, a FIN, or a RST.
 		 */
 		if ((thflags & (TH_SYN | TH_ACK)) == (TH_SYN | TH_ACK)) {
 			tcp_log_end_status(tp, TCP_EI_STATUS_RST_IN_FRONT);
 			ctf_do_dropwithreset(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 			return (1);
 		} else if (thflags & TH_SYN) {
 			/* non-initial SYN is ignored */
 			if ((bbr->r_ctl.rc_hpts_flags & PACE_TMR_RXT) ||
 			    (bbr->r_ctl.rc_hpts_flags & PACE_TMR_TLP) ||
 			    (bbr->r_ctl.rc_hpts_flags & PACE_TMR_RACK)) {
 				ctf_do_drop(m, NULL);
 				return (0);
 			}
 		} else if (!(thflags & (TH_ACK | TH_FIN | TH_RST))) {
 			ctf_do_drop(m, NULL);
 			return (0);
 		}
 	}
 	if ((thflags & TH_RST) ||
 	    (tp->t_fin_is_rst && (thflags & TH_FIN)))
 		return (ctf_process_rst(m, th, so, tp));
 	/*
 	 * RFC 1323 PAWS: If we have a timestamp reply on this segment and
 	 * it's less than ts_recent, drop it.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 && tp->ts_recent &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent)) {
 		if (ctf_ts_check(m, th, tp, tlen, thflags, &ret_val))
 			return (ret_val);
 	}
 	/*
 	 * In the SYN-RECEIVED state, validate that the packet belongs to
 	 * this connection before trimming the data to fit the receive
 	 * window.  Check the sequence number versus IRS since we know the
 	 * sequence numbers haven't wrapped.  This is a partial fix for the
 	 * "LAND" DoS attack.
 	 */
 	if (SEQ_LT(th->th_seq, tp->irs)) {
 		tcp_log_end_status(tp, TCP_EI_STATUS_RST_IN_FRONT);
 		ctf_do_dropwithreset(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 		return (1);
 	}
 	if (ctf_drop_checks(to, m, th, tp, &tlen, &thflags, &drop_hdrlen, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * its timestamp. NOTE: 1) That the test incorporates suggestions
 	 * from the latest proposal of the tcplw@cray.com list (Braden
 	 * 1993/04/26). 2) That updating only on newer timestamps interferes
 	 * with our earlier PAWS tests, so this check should be solely
 	 * predicated on the sequence space of this segment. 3) That we
 	 * modify the segment boundary check to be Last.ACK.Sent <= SEG.SEQ
 	 * + SEG.Len  instead of RFC1323's Last.ACK.Sent < SEG.SEQ +
 	 * SEG.Len, This modified check allows us to overcome RFC1323's
 	 * limitations as described in Stevens TCP/IP Illustrated Vol. 2
 	 * p.869. In such cases, we can still calculate the RTT correctly
 	 * when RCV.NXT == Last.ACK.Sent.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent) &&
 	    SEQ_LEQ(tp->last_ack_sent, th->th_seq + tlen +
 		    ((thflags & (TH_SYN | TH_FIN)) != 0))) {
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	tp->snd_wnd = tiwin;
 	/*
 	 * If the ACK bit is off:  if in SYN-RECEIVED state or SENDSYN flag
 	 * is on (half-synchronized state), then queue data for later
 	 * processing; else drop segment and return.
 	 */
 	if ((thflags & TH_ACK) == 0) {
 		if (IS_FASTOPEN(tp->t_flags)) {
 			cc_conn_init(tp);
 		}
 		return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 					 tiwin, thflags, nxt_pkt));
 	}
 	KMOD_TCPSTAT_INC(tcps_connects);
 	if (tp->t_flags & TF_SONOTCONN) {
 		tp->t_flags &= ~TF_SONOTCONN;
 		soisconnected(so);
 	}
 	/* Do window scaling? */
 	if ((tp->t_flags & (TF_RCVD_SCALE | TF_REQ_SCALE)) ==
 	    (TF_RCVD_SCALE | TF_REQ_SCALE)) {
 		tp->rcv_scale = tp->request_r_scale;
 	}
 	/*
 	 * ok for the first time in lets see if we can use the ts to figure
 	 * out what the initial RTT was.
 	 */
 	if ((to->to_flags & TOF_TS) != 0) {
 		uint32_t t, rtt;
 
 		t = tcp_tv_to_mssectick(&bbr->rc_tv);
 		if (TSTMP_GEQ(t, to->to_tsecr)) {
 			rtt = t - to->to_tsecr;
 			if (rtt == 0) {
 				rtt = 1;
 			}
 			rtt *= MS_IN_USEC;
 			tcp_bbr_xmit_timer(bbr, rtt, 0, 0, 0);
 			apply_filter_min_small(&bbr->r_ctl.rc_rttprop, rtt, bbr->r_ctl.rc_rcvtime);
 		}
 	}
 	/* Drop off any SYN in the send map (probably not there)  */
 	if (thflags & TH_ACK)
 		bbr_log_syn(tp, to);
 	if (IS_FASTOPEN(tp->t_flags) && tp->t_tfo_pending) {
 		tcp_fastopen_decrement_counter(tp->t_tfo_pending);
 		tp->t_tfo_pending = NULL;
 	}
 	/*
 	 * Make transitions: SYN-RECEIVED  -> ESTABLISHED SYN-RECEIVED* ->
 	 * FIN-WAIT-1
 	 */
 	tp->t_starttime = ticks;
 	if (tp->t_flags & TF_NEEDFIN) {
 		tcp_state_change(tp, TCPS_FIN_WAIT_1);
 		tp->t_flags &= ~TF_NEEDFIN;
 	} else {
 		tcp_state_change(tp, TCPS_ESTABLISHED);
 		TCP_PROBE5(accept__established, NULL, tp,
 			   mtod(m, const char *), tp, th);
 		/*
 		 * TFO connections call cc_conn_init() during SYN
 		 * processing.  Calling it again here for such connections
 		 * is not harmless as it would undo the snd_cwnd reduction
 		 * that occurs when a TFO SYN|ACK is retransmitted.
 		 */
 		if (!IS_FASTOPEN(tp->t_flags))
 			cc_conn_init(tp);
 	}
 	/*
 	 * Account for the ACK of our SYN prior to
 	 * regular ACK processing below, except for
 	 * simultaneous SYN, which is handled later.
 	 */
 	if (SEQ_GT(th->th_ack, tp->snd_una) && !(tp->t_flags & TF_NEEDSYN))
 		tp->snd_una++;
 	/*
 	 * If segment contains data or ACK, will call tcp_reass() later; if
 	 * not, do so now to pass queued data to user.
 	 */
 	if (tlen == 0 && (thflags & TH_FIN) == 0) {
 		(void)tcp_reass(tp, (struct tcphdr *)0, NULL, 0,
 			(struct mbuf *)0);
 		if (tp->t_flags & TF_WAKESOR) {
 			tp->t_flags &= ~TF_WAKESOR;
 			/* NB: sorwakeup_locked() does an implicit unlock. */
 			sorwakeup_locked(so);
 		}
 	}
 	tp->snd_wl1 = th->th_seq - 1;
 	if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, &ourfinisacked, thflags, &ret_val)) {
 		return (ret_val);
 	}
 	if (tp->t_state == TCPS_FIN_WAIT_1) {
 		/* We could have went to FIN_WAIT_1 (or EST) above */
 		/*
 		 * In FIN_WAIT_1 STATE in addition to the processing for the
 		 * ESTABLISHED state if our FIN is now acknowledged then
 		 * enter FIN_WAIT_2.
 		 */
 		if (ourfinisacked) {
 			/*
 			 * If we can't receive any more data, then closing
 			 * user can proceed. Starting the timer is contrary
 			 * to the specification, but if we don't get a FIN
 			 * we'll hang forever.
 			 *
 			 * XXXjl: we should release the tp also, and use a
 			 * compressed state.
 			 */
 			if (so->so_rcv.sb_state & SBS_CANTRCVMORE) {
 				soisdisconnected(so);
 				tcp_timer_activate(tp, TT_2MSL,
 						   (tcp_fast_finwait2_recycle ?
 						    tcp_finwait2_timeout :
 						    TP_MAXIDLE(tp)));
 			}
 			tcp_state_change(tp, TCPS_FIN_WAIT_2);
 		}
 	}
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 				 tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Process a segment received while the connection is in the
  * ESTABLISHED state.
  *
  * The header-prediction fast paths (bbr_fastack() for a zero-length
  * segment, bbr_do_fastnewdata() for one carrying data) are tried first;
  * if the chosen one returns non-zero this function returns 0 right away.
  * Otherwise the segment goes through the RST, SYN, PAWS and drop
  * checks, timestamp recording and ACK processing, and is finally
  * handed to bbr_process_data().
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_established(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	struct tcp_bbr *bbr;
 	int32_t ret_val;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	/*
 	 * Header prediction: check for the two common cases of a
 	 * uni-directional data xfer.  If the packet has no control flags,
 	 * is in-sequence, the window didn't change and we're not
 	 * retransmitting, it's a candidate.  If the length is zero and the
 	 * ack moved forward, we're the sender side of the xfer.  Just free
 	 * the data acked & wake any higher level process that was blocked
 	 * waiting for space.  If the length is non-zero and the ack didn't
 	 * move, we're the receiver side.  If we're getting packets in-order
 	 * (the reassembly queue is empty), add the data to the socket
 	 * buffer and note that we need a delayed ack. Make sure that the
 	 * hidden state-flags are also off. Since we check for
 	 * TCPS_ESTABLISHED first, it can only be TF_NEEDSYN.
 	 */
 	/* The BBR per-connection state hangs off the tcpcb's t_fb_ptr. */
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	if (bbr->r_ctl.rc_delivered < (4 * tp->t_maxseg)) {
 		/*
 		 * If we have delivered under 4 segments increase the initial
 		 * window if raised by the peer. We use this to determine
 		 * dynamic and static rwnd's at the end of a connection.
 		 */
 		bbr->r_ctl.rc_init_rwnd = max(tiwin, tp->snd_wnd);
 	}
 	/*
 	 * Fast-path candidate: no SACK option, ACK is the only flag set out
 	 * of SYN/FIN/RST/URG/ACK, the reassembly queue is empty and the
 	 * segment starts exactly at rcv_nxt.
 	 */
 	if (__predict_true(((to->to_flags & TOF_SACK) == 0)) &&
 	    __predict_true((thflags & (TH_SYN | TH_FIN | TH_RST | TH_URG | TH_ACK)) == TH_ACK) &&
 	    __predict_true(SEGQ_EMPTY(tp)) &&
 	    __predict_true(th->th_seq == tp->rcv_nxt)) {
 		if (tlen == 0) {
 			/* Pure ACK: a non-zero return ends processing here. */
 			if (bbr_fastack(m, th, so, tp, to, drop_hdrlen, tlen,
 			    tiwin, nxt_pkt, iptos)) {
 				return (0);
 			}
 		} else {
 			/* In-order data: a non-zero return ends processing here. */
 			if (bbr_do_fastnewdata(m, th, so, tp, to, drop_hdrlen, tlen,
 			    tiwin, nxt_pkt)) {
 				return (0);
 			}
 		}
 	}
 	/* Slow path from here on. */
 	ctf_calc_rwin(so, tp);
 
 	/* A RST, or a FIN while t_fin_is_rst is set, goes to the RST handler. */
 	if ((thflags & TH_RST) ||
 	    (tp->t_fin_is_rst && (thflags & TH_FIN)))
 		return (ctf_process_rst(m, th, so, tp));
 	/*
 	 * RFC5961 Section 4.2 Send challenge ACK for any SYN in
 	 * synchronized state.
 	 */
 	if (thflags & TH_SYN) {
 		ctf_challenge_ack(m, th, tp, iptos, &ret_val);
 		return (ret_val);
 	}
 	/*
 	 * RFC 1323 PAWS: If we have a timestamp reply on this segment and
 	 * it's less than ts_recent, drop it.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 && tp->ts_recent &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent)) {
 		/* A non-zero return ends processing with ret_val as the result. */
 		if (ctf_ts_check(m, th, tp, tlen, thflags, &ret_val))
 			return (ret_val);
 	}
 	/* tlen, thflags and drop_hdrlen are passed by pointer and may be adjusted. */
 	if (ctf_drop_checks(to, m, th, tp, &tlen, &thflags, &drop_hdrlen, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * its timestamp. NOTE: 1) That the test incorporates suggestions
 	 * from the latest proposal of the tcplw@cray.com list (Braden
 	 * 1993/04/26). 2) That updating only on newer timestamps interferes
 	 * with our earlier PAWS tests, so this check should be solely
 	 * predicated on the sequence space of this segment. 3) That we
 	 * modify the segment boundary check to be Last.ACK.Sent <= SEG.SEQ
 	 * + SEG.Len  instead of RFC1323's Last.ACK.Sent < SEG.SEQ +
 	 * SEG.Len, This modified check allows us to overcome RFC1323's
 	 * limitations as described in Stevens TCP/IP Illustrated Vol. 2
 	 * p.869. In such cases, we can still calculate the RTT correctly
 	 * when RCV.NXT == Last.ACK.Sent.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent) &&
 	    SEQ_LEQ(tp->last_ack_sent, th->th_seq + tlen +
 	    ((thflags & (TH_SYN | TH_FIN)) != 0))) {
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	/*
 	 * If the ACK bit is off:  if in SYN-RECEIVED state or SENDSYN flag
 	 * is on (half-synchronized state), then queue data for later
 	 * processing; else drop segment and return.
 	 *
 	 * Concretely: with TF_NEEDSYN set the segment still goes to
 	 * bbr_process_data(); with TF_ACKNOW set it is dropped after
 	 * requesting output; otherwise it is simply dropped.
 	 */
 	if ((thflags & TH_ACK) == 0) {
 		if (tp->t_flags & TF_NEEDSYN) {
 			return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 			    tiwin, thflags, nxt_pkt));
 		} else if (tp->t_flags & TF_ACKNOW) {
 			ctf_do_dropafterack(m, tp, th, thflags, tlen, &ret_val);
 			bbr->r_wanted_output = 1;
 			return (ret_val);
 		} else {
 			ctf_do_drop(m, NULL);
 			return (0);
 		}
 	}
 	/*
 	 * Ack processing.
 	 */
 	if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, NULL, thflags, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * With data still in the send buffer, check the progress timeout;
 	 * if it has fired, log the event and drop the connection with a
 	 * reset.
 	 */
 	if (sbavail(&so->so_snd)) {
 		if (ctf_progress_timeout_check(tp, true)) {
 			bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 			ctf_do_dropwithreset_conn(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 			return (1);
 		}
 	}
 	/* State changes only happen in bbr_process_data() */
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 	    tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Process a segment received while the connection is in the
  * CLOSE_WAIT state.
  *
  * Runs the RST, SYN, PAWS and drop checks, records the timestamp,
  * processes the ACK, checks the progress timeout and finally hands
  * the segment to bbr_process_data().
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_close_wait(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	struct tcp_bbr *bbr;
 	int32_t ret_val;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	/* The BBR per-connection state hangs off the tcpcb's t_fb_ptr. */
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	ctf_calc_rwin(so, tp);
 	/* A RST, or a FIN while t_fin_is_rst is set, goes to the RST handler. */
 	if ((thflags & TH_RST) ||
 	    (tp->t_fin_is_rst && (thflags & TH_FIN)))
 		return (ctf_process_rst(m, th, so, tp));
 	/*
 	 * RFC5961 Section 4.2 Send challenge ACK for any SYN in
 	 * synchronized state.
 	 */
 	if (thflags & TH_SYN) {
 		ctf_challenge_ack(m, th, tp, iptos, &ret_val);
 		return (ret_val);
 	}
 	/*
 	 * RFC 1323 PAWS: If we have a timestamp reply on this segment and
 	 * it's less than ts_recent, drop it.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 && tp->ts_recent &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent)) {
 		/* A non-zero return ends processing with ret_val as the result. */
 		if (ctf_ts_check(m, th, tp, tlen, thflags, &ret_val))
 			return (ret_val);
 	}
 	/* tlen, thflags and drop_hdrlen are passed by pointer and may be adjusted. */
 	if (ctf_drop_checks(to, m, th, tp, &tlen, &thflags, &drop_hdrlen, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * its timestamp. NOTE: 1) That the test incorporates suggestions
 	 * from the latest proposal of the tcplw@cray.com list (Braden
 	 * 1993/04/26). 2) That updating only on newer timestamps interferes
 	 * with our earlier PAWS tests, so this check should be solely
 	 * predicated on the sequence space of this segment. 3) That we
 	 * modify the segment boundary check to be Last.ACK.Sent <= SEG.SEQ
 	 * + SEG.Len  instead of RFC1323's Last.ACK.Sent < SEG.SEQ +
 	 * SEG.Len, This modified check allows us to overcome RFC1323's
 	 * limitations as described in Stevens TCP/IP Illustrated Vol. 2
 	 * p.869. In such cases, we can still calculate the RTT correctly
 	 * when RCV.NXT == Last.ACK.Sent.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent) &&
 	    SEQ_LEQ(tp->last_ack_sent, th->th_seq + tlen +
 	    ((thflags & (TH_SYN | TH_FIN)) != 0))) {
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	/*
 	 * If the ACK bit is off:  if in SYN-RECEIVED state or SENDSYN flag
 	 * is on (half-synchronized state), then queue data for later
 	 * processing; else drop segment and return.
 	 *
 	 * Concretely: with TF_NEEDSYN set the segment still goes to
 	 * bbr_process_data(); with TF_ACKNOW set it is dropped after
 	 * requesting output; otherwise it is simply dropped.
 	 */
 	if ((thflags & TH_ACK) == 0) {
 		if (tp->t_flags & TF_NEEDSYN) {
 			return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 			    tiwin, thflags, nxt_pkt));
 		} else if (tp->t_flags & TF_ACKNOW) {
 			ctf_do_dropafterack(m, tp, th, thflags, tlen, &ret_val);
 			bbr->r_wanted_output = 1;
 			return (ret_val);
 		} else {
 			ctf_do_drop(m, NULL);
 			return (0);
 		}
 	}
 	/*
 	 * Ack processing.
 	 */
 	if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, NULL, thflags, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * With data still in the send buffer, check the progress timeout;
 	 * if it has fired, log the event and drop the connection with a
 	 * reset.
 	 */
 	if (sbavail(&so->so_snd)) {
 		if (ctf_progress_timeout_check(tp, true)) {
 			bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 			ctf_do_dropwithreset_conn(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 			return (1);
 		}
 	}
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 	    tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Decide what to do with data that shows up after the local side has
  * closed the connection.
  *
  * Returns 1 when the connection has been closed and a reset issued;
  * the callers in this file then return 1 themselves.  Returns 0 when
  * the data is to be ignored: rcv_nxt is advanced past the segment,
  * TF2_DROP_AF_DATA is set, output is requested and *tlen is zeroed.
  */
 static int
 bbr_check_data_after_close(struct mbuf *m, struct tcp_bbr *bbr,
     struct tcpcb *tp, int32_t * tlen, struct tcphdr *th, struct socket *so)
 {
 	/*
 	 * The data is only tolerated when the connection allows data after
 	 * close and our own send buffer still holds data.
 	 */
 	if (bbr->rc_allow_data_af_clo != 0 && sbavail(&so->so_snd) != 0) {
 		/* Ok we allow data that is ignored and a followup reset */
 		tp->rcv_nxt = th->th_seq + *tlen;
 		tp->t_flags2 |= TF2_DROP_AF_DATA;
 		bbr->r_wanted_output = 1;
 		*tlen = 0;
 		return (0);
 	}
 
 	/* Otherwise close right now and answer with a reset. */
 	tcp_log_end_status(tp, TCP_EI_STATUS_DATA_A_CLOSE);
 	/* tcp_close will kill the inp pre-log the Reset */
 	tcp_log_end_status(tp, TCP_EI_STATUS_SERVER_RST);
 	tp = tcp_close(tp);
 	KMOD_TCPSTAT_INC(tcps_rcvafterclose);
 	ctf_do_dropwithreset(m, tp, th, BANDLIM_UNLIMITED, (*tlen));
 	return (1);
 }
 
 /*
  * Process a segment received while the connection is in the
  * FIN_WAIT_1 state.
  *
  * Runs the RST, SYN, PAWS and drop checks, deals with data arriving
  * after the user has closed, records the timestamp and processes the
  * ACK.  When the ACK covers our FIN the connection moves on to
  * FIN_WAIT_2.  The segment is finally handed to bbr_process_data().
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_fin_wait_1(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	/* Handed to bbr_process_ack() below; tested afterwards. */
 	int32_t ourfinisacked = 0;
 	int32_t ret_val;
 	struct tcp_bbr *bbr;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	/* The BBR per-connection state hangs off the tcpcb's t_fb_ptr. */
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	ctf_calc_rwin(so, tp);
 	/* A RST, or a FIN while t_fin_is_rst is set, goes to the RST handler. */
 	if ((thflags & TH_RST) ||
 	    (tp->t_fin_is_rst && (thflags & TH_FIN)))
 		return (ctf_process_rst(m, th, so, tp));
 	/*
 	 * RFC5961 Section 4.2 Send challenge ACK for any SYN in
 	 * synchronized state.
 	 */
 	if (thflags & TH_SYN) {
 		ctf_challenge_ack(m, th, tp, iptos, &ret_val);
 		return (ret_val);
 	}
 	/*
 	 * RFC 1323 PAWS: If we have a timestamp reply on this segment and
 	 * it's less than ts_recent, drop it.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 && tp->ts_recent &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent)) {
 		/* A non-zero return ends processing with ret_val as the result. */
 		if (ctf_ts_check(m, th, tp, tlen, thflags, &ret_val))
 			return (ret_val);
 	}
 	/* tlen, thflags and drop_hdrlen are passed by pointer and may be adjusted. */
 	if (ctf_drop_checks(to, m, th, tp, &tlen, &thflags, &drop_hdrlen, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * If new data are received on a connection after the user processes
 	 * are gone, then RST the other end.
 	 * We call a new function now so we might continue and setup
 	 * to reset at all data being ack'd.
 	 *
 	 * A return of 0 from the helper means processing continues; it has
 	 * then zeroed tlen through the pointer.
 	 */
 	if ((tp->t_flags & TF_CLOSED) && tlen &&
 	    bbr_check_data_after_close(m, bbr, tp, &tlen, th, so))
 		return (1);
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * its timestamp. NOTE: 1) That the test incorporates suggestions
 	 * from the latest proposal of the tcplw@cray.com list (Braden
 	 * 1993/04/26). 2) That updating only on newer timestamps interferes
 	 * with our earlier PAWS tests, so this check should be solely
 	 * predicated on the sequence space of this segment. 3) That we
 	 * modify the segment boundary check to be Last.ACK.Sent <= SEG.SEQ
 	 * + SEG.Len  instead of RFC1323's Last.ACK.Sent < SEG.SEQ +
 	 * SEG.Len, This modified check allows us to overcome RFC1323's
 	 * limitations as described in Stevens TCP/IP Illustrated Vol. 2
 	 * p.869. In such cases, we can still calculate the RTT correctly
 	 * when RCV.NXT == Last.ACK.Sent.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent) &&
 	    SEQ_LEQ(tp->last_ack_sent, th->th_seq + tlen +
 	    ((thflags & (TH_SYN | TH_FIN)) != 0))) {
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	/*
 	 * If the ACK bit is off:  if in SYN-RECEIVED state or SENDSYN flag
 	 * is on (half-synchronized state), then queue data for later
 	 * processing; else drop segment and return.
 	 *
 	 * Concretely: with TF_NEEDSYN set the segment still goes to
 	 * bbr_process_data(); with TF_ACKNOW set it is dropped after
 	 * requesting output; otherwise it is simply dropped.
 	 */
 	if ((thflags & TH_ACK) == 0) {
 		if (tp->t_flags & TF_NEEDSYN) {
 			return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 			    tiwin, thflags, nxt_pkt));
 		} else if (tp->t_flags & TF_ACKNOW) {
 			ctf_do_dropafterack(m, tp, th, thflags, tlen, &ret_val);
 			bbr->r_wanted_output = 1;
 			return (ret_val);
 		} else {
 			ctf_do_drop(m, NULL);
 			return (0);
 		}
 	}
 	/*
 	 * Ack processing.
 	 */
 	if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, &ourfinisacked, thflags, &ret_val)) {
 		return (ret_val);
 	}
 	if (ourfinisacked) {
 		/*
 		 * If we can't receive any more data, then closing user can
 		 * proceed. Starting the timer is contrary to the
 		 * specification, but if we don't get a FIN we'll hang
 		 * forever.
 		 *
 		 * XXXjl: we should release the tp also, and use a
 		 * compressed state.
 		 */
 		if (so->so_rcv.sb_state & SBS_CANTRCVMORE) {
 			soisdisconnected(so);
 			/*
 			 * Timer length: tcp_finwait2_timeout when
 			 * tcp_fast_finwait2_recycle is set, else
 			 * TP_MAXIDLE(tp).
 			 */
 			tcp_timer_activate(tp, TT_2MSL,
 			    (tcp_fast_finwait2_recycle ?
 			    tcp_finwait2_timeout :
 			    TP_MAXIDLE(tp)));
 		}
 		tcp_state_change(tp, TCPS_FIN_WAIT_2);
 	}
 	/*
 	 * With data still in the send buffer, check the progress timeout;
 	 * if it has fired, log the event and drop the connection with a
 	 * reset.
 	 */
 	if (sbavail(&so->so_snd)) {
 		if (ctf_progress_timeout_check(tp, true)) {
 			bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 			ctf_do_dropwithreset_conn(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 			return (1);
 		}
 	}
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 	    tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Process a segment received while the connection is in the CLOSING
  * state.
  *
  * Runs the RST, SYN, PAWS and drop checks, deals with data arriving
  * after the user has closed, records the timestamp and processes the
  * ACK.  When the ACK covers our FIN the connection is passed to
  * tcp_twstart() and the mbuf is freed.  Otherwise the segment is
  * handed to bbr_process_data().
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_closing(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	/* Handed to bbr_process_ack() below; tested afterwards. */
 	int32_t ourfinisacked = 0;
 	int32_t ret_val;
 	struct tcp_bbr *bbr;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	/* The BBR per-connection state hangs off the tcpcb's t_fb_ptr. */
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	ctf_calc_rwin(so, tp);
 	/* A RST, or a FIN while t_fin_is_rst is set, goes to the RST handler. */
 	if ((thflags & TH_RST) ||
 	    (tp->t_fin_is_rst && (thflags & TH_FIN)))
 		return (ctf_process_rst(m, th, so, tp));
 	/*
 	 * RFC5961 Section 4.2 Send challenge ACK for any SYN in
 	 * synchronized state.
 	 */
 	if (thflags & TH_SYN) {
 		ctf_challenge_ack(m, th, tp, iptos, &ret_val);
 		return (ret_val);
 	}
 	/*
 	 * RFC 1323 PAWS: If we have a timestamp reply on this segment and
 	 * it's less than ts_recent, drop it.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 && tp->ts_recent &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent)) {
 		/* A non-zero return ends processing with ret_val as the result. */
 		if (ctf_ts_check(m, th, tp, tlen, thflags, &ret_val))
 			return (ret_val);
 	}
 	/* tlen, thflags and drop_hdrlen are passed by pointer and may be adjusted. */
 	if (ctf_drop_checks(to, m, th, tp, &tlen, &thflags, &drop_hdrlen, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * If new data are received on a connection after the user processes
 	 * are gone, then RST the other end.
 	 * We call a new function now so we might continue and setup
 	 * to reset at all data being ack'd.
 	 *
 	 * A return of 0 from the helper means processing continues; it has
 	 * then zeroed tlen through the pointer.
 	 */
 	if ((tp->t_flags & TF_CLOSED) && tlen &&
 	    bbr_check_data_after_close(m, bbr, tp, &tlen, th, so))
 		return (1);
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * its timestamp. NOTE: 1) That the test incorporates suggestions
 	 * from the latest proposal of the tcplw@cray.com list (Braden
 	 * 1993/04/26). 2) That updating only on newer timestamps interferes
 	 * with our earlier PAWS tests, so this check should be solely
 	 * predicated on the sequence space of this segment. 3) That we
 	 * modify the segment boundary check to be Last.ACK.Sent <= SEG.SEQ
 	 * + SEG.Len  instead of RFC1323's Last.ACK.Sent < SEG.SEQ +
 	 * SEG.Len, This modified check allows us to overcome RFC1323's
 	 * limitations as described in Stevens TCP/IP Illustrated Vol. 2
 	 * p.869. In such cases, we can still calculate the RTT correctly
 	 * when RCV.NXT == Last.ACK.Sent.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent) &&
 	    SEQ_LEQ(tp->last_ack_sent, th->th_seq + tlen +
 	    ((thflags & (TH_SYN | TH_FIN)) != 0))) {
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	/*
 	 * If the ACK bit is off:  if in SYN-RECEIVED state or SENDSYN flag
 	 * is on (half-synchronized state), then queue data for later
 	 * processing; else drop segment and return.
 	 *
 	 * Concretely: with TF_NEEDSYN set the segment still goes to
 	 * bbr_process_data(); with TF_ACKNOW set it is dropped after
 	 * requesting output; otherwise it is simply dropped.
 	 */
 	if ((thflags & TH_ACK) == 0) {
 		if (tp->t_flags & TF_NEEDSYN) {
 			return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 			    tiwin, thflags, nxt_pkt));
 		} else if (tp->t_flags & TF_ACKNOW) {
 			ctf_do_dropafterack(m, tp, th, thflags, tlen, &ret_val);
 			bbr->r_wanted_output = 1;
 			return (ret_val);
 		} else {
 			ctf_do_drop(m, NULL);
 			return (0);
 		}
 	}
 	/*
 	 * Ack processing.
 	 */
 	if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, &ourfinisacked, thflags, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * Our FIN has been acknowledged: pass the connection to
 	 * tcp_twstart(), free the segment and report the TCB as gone.
 	 */
 	if (ourfinisacked) {
 		tcp_twstart(tp);
 		m_freem(m);
 		return (1);
 	}
 	/*
 	 * With data still in the send buffer, check the progress timeout;
 	 * if it has fired, log the event and drop the connection with a
 	 * reset.
 	 */
 	if (sbavail(&so->so_snd)) {
 		if (ctf_progress_timeout_check(tp, true)) {
 			bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 			ctf_do_dropwithreset_conn(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 			return (1);
 		}
 	}
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 	    tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Process a segment received while the connection is in the LAST_ACK
  * state.
  *
  * Runs the RST, SYN, PAWS and drop checks, deals with data arriving
  * after the user has closed, records the timestamp and processes the
  * ACK.  When the ACK covers our FIN the connection is closed with
  * tcp_close() and the segment dropped.  Otherwise the segment is
  * handed to bbr_process_data().
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_lastack(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	/* Handed to bbr_process_ack() below; tested afterwards. */
 	int32_t ourfinisacked = 0;
 	int32_t ret_val;
 	struct tcp_bbr *bbr;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	/* The BBR per-connection state hangs off the tcpcb's t_fb_ptr. */
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	ctf_calc_rwin(so, tp);
 	/* A RST, or a FIN while t_fin_is_rst is set, goes to the RST handler. */
 	if ((thflags & TH_RST) ||
 	    (tp->t_fin_is_rst && (thflags & TH_FIN)))
 		return (ctf_process_rst(m, th, so, tp));
 	/*
 	 * RFC5961 Section 4.2 Send challenge ACK for any SYN in
 	 * synchronized state.
 	 */
 	if (thflags & TH_SYN) {
 		ctf_challenge_ack(m, th, tp, iptos, &ret_val);
 		return (ret_val);
 	}
 	/*
 	 * RFC 1323 PAWS: If we have a timestamp reply on this segment and
 	 * it's less than ts_recent, drop it.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 && tp->ts_recent &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent)) {
 		/* A non-zero return ends processing with ret_val as the result. */
 		if (ctf_ts_check(m, th, tp, tlen, thflags, &ret_val))
 			return (ret_val);
 	}
 	/* tlen, thflags and drop_hdrlen are passed by pointer and may be adjusted. */
 	if (ctf_drop_checks(to, m, th, tp, &tlen, &thflags, &drop_hdrlen, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * If new data are received on a connection after the user processes
 	 * are gone, then RST the other end.
 	 * We call a new function now so we might continue and setup
 	 * to reset at all data being ack'd.
 	 *
 	 * A return of 0 from the helper means processing continues; it has
 	 * then zeroed tlen through the pointer.
 	 */
 	if ((tp->t_flags & TF_CLOSED) && tlen &&
 	    bbr_check_data_after_close(m, bbr, tp, &tlen, th, so))
 		return (1);
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * its timestamp. NOTE: 1) That the test incorporates suggestions
 	 * from the latest proposal of the tcplw@cray.com list (Braden
 	 * 1993/04/26). 2) That updating only on newer timestamps interferes
 	 * with our earlier PAWS tests, so this check should be solely
 	 * predicated on the sequence space of this segment. 3) That we
 	 * modify the segment boundary check to be Last.ACK.Sent <= SEG.SEQ
 	 * + SEG.Len  instead of RFC1323's Last.ACK.Sent < SEG.SEQ +
 	 * SEG.Len, This modified check allows us to overcome RFC1323's
 	 * limitations as described in Stevens TCP/IP Illustrated Vol. 2
 	 * p.869. In such cases, we can still calculate the RTT correctly
 	 * when RCV.NXT == Last.ACK.Sent.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent) &&
 	    SEQ_LEQ(tp->last_ack_sent, th->th_seq + tlen +
 	    ((thflags & (TH_SYN | TH_FIN)) != 0))) {
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	/*
 	 * If the ACK bit is off:  if in SYN-RECEIVED state or SENDSYN flag
 	 * is on (half-synchronized state), then queue data for later
 	 * processing; else drop segment and return.
 	 *
 	 * Concretely: with TF_NEEDSYN set the segment still goes to
 	 * bbr_process_data(); with TF_ACKNOW set it is dropped after
 	 * requesting output; otherwise it is simply dropped.
 	 */
 	if ((thflags & TH_ACK) == 0) {
 		if (tp->t_flags & TF_NEEDSYN) {
 			return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 			    tiwin, thflags, nxt_pkt));
 		} else if (tp->t_flags & TF_ACKNOW) {
 			ctf_do_dropafterack(m, tp, th, thflags, tlen, &ret_val);
 			bbr->r_wanted_output = 1;
 			return (ret_val);
 		} else {
 			ctf_do_drop(m, NULL);
 			return (0);
 		}
 	}
 	/*
 	 * case TCPS_LAST_ACK: Ack processing.
 	 */
 	if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, &ourfinisacked, thflags, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * Our FIN has been acknowledged: close the connection and drop the
 	 * segment.  tp is reassigned from tcp_close()'s return value before
 	 * being passed on.
 	 */
 	if (ourfinisacked) {
 		tp = tcp_close(tp);
 		ctf_do_drop(m, tp);
 		return (1);
 	}
 	/*
 	 * With data still in the send buffer, check the progress timeout;
 	 * if it has fired, log the event and drop the connection with a
 	 * reset.
 	 */
 	if (sbavail(&so->so_snd)) {
 		if (ctf_progress_timeout_check(tp, true)) {
 			bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 			ctf_do_dropwithreset_conn(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 			return (1);
 		}
 	}
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 	    tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Process a segment received while the connection is in the
  * FIN_WAIT_2 state.
  *
  * Runs the RST, SYN, PAWS and drop checks, deals with data arriving
  * after the user has closed, records the timestamp, processes the
  * ACK, checks the progress timeout and finally hands the segment to
  * bbr_process_data().
  *
  * Return value of 1, the TCB is unlocked and most
  * likely gone, return value of 0, the TCB is still
  * locked.
  */
 static int
 bbr_do_fin_wait_2(struct mbuf *m, struct tcphdr *th, struct socket *so,
     struct tcpcb *tp, struct tcpopt *to, int32_t drop_hdrlen, int32_t tlen,
     uint32_t tiwin, int32_t thflags, int32_t nxt_pkt, uint8_t iptos)
 {
 	/*
 	 * Handed to bbr_process_ack() below; this function never reads
 	 * the value back.
 	 */
 	int32_t ourfinisacked = 0;
 	int32_t ret_val;
 	struct tcp_bbr *bbr;
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 
 	/* The BBR per-connection state hangs off the tcpcb's t_fb_ptr. */
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	ctf_calc_rwin(so, tp);
 	/* A RST, or a FIN while t_fin_is_rst is set, goes to the RST handler. */
 	if ((thflags & TH_RST) ||
 	    (tp->t_fin_is_rst && (thflags & TH_FIN)))
 		return (ctf_process_rst(m, th, so, tp));
 
 	/*
 	 * RFC5961 Section 4.2 Send challenge ACK for any SYN in
 	 * synchronized state.
 	 */
 	if (thflags & TH_SYN) {
 		ctf_challenge_ack(m, th, tp, iptos, &ret_val);
 		return (ret_val);
 	}
 	/*
 	 * RFC 1323 PAWS: If we have a timestamp reply on this segment and
 	 * it's less than ts_recent, drop it.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 && tp->ts_recent &&
 	    TSTMP_LT(to->to_tsval, tp->ts_recent)) {
 		/* A non-zero return ends processing with ret_val as the result. */
 		if (ctf_ts_check(m, th, tp, tlen, thflags, &ret_val))
 			return (ret_val);
 	}
 	/* tlen, thflags and drop_hdrlen are passed by pointer and may be adjusted. */
 	if (ctf_drop_checks(to, m, th, tp, &tlen, &thflags, &drop_hdrlen, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * If new data are received on a connection after the user processes
 	 * are gone, then we may RST the other end depending on the outcome
 	 * of bbr_check_data_after_close.
 	 * We call a new function now so we might continue and setup
 	 * to reset at all data being ack'd.
 	 *
 	 * A return of 0 from the helper means processing continues; it has
 	 * then zeroed tlen through the pointer.
 	 */
 	if ((tp->t_flags & TF_CLOSED) && tlen &&
 	    bbr_check_data_after_close(m, bbr, tp, &tlen, th, so))
 		return (1);
 	/*
 	 * If last ACK falls within this segment's sequence numbers, record
 	 * its timestamp. NOTE: 1) That the test incorporates suggestions
 	 * from the latest proposal of the tcplw@cray.com list (Braden
 	 * 1993/04/26). 2) That updating only on newer timestamps interferes
 	 * with our earlier PAWS tests, so this check should be solely
 	 * predicated on the sequence space of this segment. 3) That we
 	 * modify the segment boundary check to be Last.ACK.Sent <= SEG.SEQ
 	 * + SEG.Len  instead of RFC1323's Last.ACK.Sent < SEG.SEQ +
 	 * SEG.Len, This modified check allows us to overcome RFC1323's
 	 * limitations as described in Stevens TCP/IP Illustrated Vol. 2
 	 * p.869. In such cases, we can still calculate the RTT correctly
 	 * when RCV.NXT == Last.ACK.Sent.
 	 */
 	if ((to->to_flags & TOF_TS) != 0 &&
 	    SEQ_LEQ(th->th_seq, tp->last_ack_sent) &&
 	    SEQ_LEQ(tp->last_ack_sent, th->th_seq + tlen +
 	    ((thflags & (TH_SYN | TH_FIN)) != 0))) {
 		tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 		tp->ts_recent = to->to_tsval;
 	}
 	/*
 	 * If the ACK bit is off:  if in SYN-RECEIVED state or SENDSYN flag
 	 * is on (half-synchronized state), then queue data for later
 	 * processing; else drop segment and return.
 	 *
 	 * Concretely: with TF_NEEDSYN set the segment still goes to
 	 * bbr_process_data(); with TF_ACKNOW set it is dropped after
 	 * requesting output; otherwise it is simply dropped.
 	 */
 	if ((thflags & TH_ACK) == 0) {
 		if (tp->t_flags & TF_NEEDSYN) {
 			return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 			    tiwin, thflags, nxt_pkt));
 		} else if (tp->t_flags & TF_ACKNOW) {
 			ctf_do_dropafterack(m, tp, th, thflags, tlen, &ret_val);
 			bbr->r_wanted_output = 1;
 			return (ret_val);
 		} else {
 			ctf_do_drop(m, NULL);
 			return (0);
 		}
 	}
 	/*
 	 * Ack processing.
 	 */
 	if (bbr_process_ack(m, th, so, tp, to, tiwin, tlen, &ourfinisacked, thflags, &ret_val)) {
 		return (ret_val);
 	}
 	/*
 	 * With data still in the send buffer, check the progress timeout;
 	 * if it has fired, log the event and drop the connection with a
 	 * reset.
 	 */
 	if (sbavail(&so->so_snd)) {
 		if (ctf_progress_timeout_check(tp, true)) {
 			bbr_log_progress_event(bbr, tp, tick, PROGRESS_DROP, __LINE__);
 			ctf_do_dropwithreset_conn(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 			return (1);
 		}
 	}
 	return (bbr_process_data(m, th, so, tp, drop_hdrlen, tlen,
 	    tiwin, thflags, nxt_pkt));
 }
 
 /*
  * Assure no timers are running for this connection: remember whether
  * the persist timer was active and take the connection out of hpts
  * if it is currently in it.
  */
 static void
 bbr_stop_all_timers(struct tcpcb *tp, struct tcp_bbr *bbr)
 {
 	/* We enter in persists, set the flag appropriately */
 	if (tcp_timer_active(tp, TT_PERSIST))
 		bbr->rc_in_persist = 1;
 
 	/* Nothing further to do unless the connection sits in hpts. */
 	if (!tcp_in_hpts(bbr->rc_tp))
 		return;
 	tcp_hpts_remove(bbr->rc_tp);
 }
 
 static void
 bbr_google_mode_on(struct tcp_bbr *bbr)
 {
 	bbr->rc_use_google = 1;
 	bbr->rc_no_pacing = 0;
 	bbr->r_ctl.bbr_google_discount = bbr_google_discount;
 	bbr->r_use_policer = bbr_policer_detection_enabled;
 	bbr->r_ctl.rc_probertt_int = (USECS_IN_SECOND * 10);
 	bbr->bbr_use_rack_cheat = 0;
 	bbr->r_ctl.rc_incr_tmrs = 0;
 	bbr->r_ctl.rc_inc_tcp_oh = 0;
 	bbr->r_ctl.rc_inc_ip_oh = 0;
 	bbr->r_ctl.rc_inc_enet_oh = 0;
 	reset_time(&bbr->r_ctl.rc_delrate,
 		   BBR_NUM_RTTS_FOR_GOOG_DEL_LIMIT);
 	reset_time_small(&bbr->r_ctl.rc_rttprop,
 			 (11 * USECS_IN_SECOND));
 	tcp_bbr_tso_size_check(bbr, tcp_get_usecs(&bbr->rc_tv));
 }
 
 static void
 bbr_google_mode_off(struct tcp_bbr *bbr)
 {
 	bbr->rc_use_google = 0;
 	bbr->r_ctl.bbr_google_discount = 0;
 	bbr->no_pacing_until = bbr_no_pacing_until;
 	bbr->r_use_policer = 0;
 	if (bbr->no_pacing_until)
 		bbr->rc_no_pacing = 1;
 	else
 		bbr->rc_no_pacing = 0;
 	if (bbr_use_rack_resend_cheat)
 		bbr->bbr_use_rack_cheat = 1;
 	else
 		bbr->bbr_use_rack_cheat = 0;
 	if (bbr_incr_timers)
 		bbr->r_ctl.rc_incr_tmrs = 1;
 	else
 		bbr->r_ctl.rc_incr_tmrs = 0;
 	if (bbr_include_tcp_oh)
 		bbr->r_ctl.rc_inc_tcp_oh = 1;
 	else
 		bbr->r_ctl.rc_inc_tcp_oh = 0;
 	if (bbr_include_ip_oh)
 		bbr->r_ctl.rc_inc_ip_oh = 1;
 	else
 		bbr->r_ctl.rc_inc_ip_oh = 0;
 	if (bbr_include_enet_oh)
 		bbr->r_ctl.rc_inc_enet_oh = 1;
 	else
 		bbr->r_ctl.rc_inc_enet_oh = 0;
 	bbr->r_ctl.rc_probertt_int = bbr_rtt_probe_limit;
 	reset_time(&bbr->r_ctl.rc_delrate,
 		   bbr_num_pktepo_for_del_limit);
 	reset_time_small(&bbr->r_ctl.rc_rttprop,
 			 (bbr_filter_len_sec * USECS_IN_SECOND));
 	tcp_bbr_tso_size_check(bbr, tcp_get_usecs(&bbr->rc_tv));
 }
 /*
  * Return 0 on success, non-zero on failure
  * which indicates the error (usually no memory).
  */
 static int
 bbr_init(struct tcpcb *tp, void **ptr)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 	struct tcp_bbr *bbr = NULL;
 	uint32_t cts;
 
 	*ptr = uma_zalloc(bbr_pcb_zone, (M_NOWAIT | M_ZERO));
 	if (*ptr == NULL) {
 		/*
 		 * We need to allocate memory but cant. The INP and INP_INFO
 		 * locks and they are recursive (happens during setup. So a
 		 * scheme to drop the locks fails :(
 		 *
 		 */
 		return (ENOMEM);
 	}
 	bbr = (struct tcp_bbr *)*ptr;
 	bbr->rtt_valid = 0;
 	tp->t_flags2 |= TF2_CANNOT_DO_ECN;
 	tp->t_flags2 |= TF2_SUPPORTS_MBUFQ;
 	/* Take off any undesired flags */
 	tp->t_flags2 &= ~TF2_MBUF_QUEUE_READY;
 	tp->t_flags2 &= ~TF2_DONT_SACK_QUEUE;
 	tp->t_flags2 &= ~TF2_MBUF_ACKCMP;
 	tp->t_flags2 &= ~TF2_MBUF_L_ACKS;
 
 	TAILQ_INIT(&bbr->r_ctl.rc_map);
 	TAILQ_INIT(&bbr->r_ctl.rc_free);
 	TAILQ_INIT(&bbr->r_ctl.rc_tmap);
 	bbr->rc_tp = tp;
 	bbr->rc_inp = inp;
 	cts = tcp_get_usecs(&bbr->rc_tv);
 	tp->t_acktime = 0;
 	bbr->rc_allow_data_af_clo = bbr_ignore_data_after_close;
 	bbr->r_ctl.rc_reorder_fade = bbr_reorder_fade;
 	bbr->rc_tlp_threshold = bbr_tlp_thresh;
 	bbr->r_ctl.rc_reorder_shift = bbr_reorder_thresh;
 	bbr->r_ctl.rc_pkt_delay = bbr_pkt_delay;
 	bbr->r_ctl.rc_min_to = bbr_min_to;
 	bbr->rc_bbr_state = BBR_STATE_STARTUP;
 	bbr->r_ctl.bbr_lost_at_state = 0;
 	bbr->r_ctl.rc_lost_at_startup = 0;
 	bbr->rc_all_timers_stopped = 0;
 	bbr->r_ctl.rc_bbr_lastbtlbw = 0;
 	bbr->r_ctl.rc_pkt_epoch_del = 0;
 	bbr->r_ctl.rc_pkt_epoch = 0;
 	bbr->r_ctl.rc_lowest_rtt = 0xffffffff;
 	bbr->r_ctl.rc_bbr_hptsi_gain = bbr_high_gain;
 	bbr->r_ctl.rc_bbr_cwnd_gain = bbr_high_gain;
 	bbr->r_ctl.rc_went_idle_time = cts;
 	bbr->rc_pacer_started = cts;
 	bbr->r_ctl.rc_pkt_epoch_time = cts;
 	bbr->r_ctl.rc_rcvtime = cts;
 	bbr->r_ctl.rc_bbr_state_time = cts;
 	bbr->r_ctl.rc_del_time = cts;
 	bbr->r_ctl.rc_tlp_rxt_last_time = cts;
 	bbr->r_ctl.last_in_probertt = cts;
 	bbr->skip_gain = 0;
 	bbr->gain_is_limited = 0;
 	bbr->no_pacing_until = bbr_no_pacing_until;
 	if (bbr->no_pacing_until)
 		bbr->rc_no_pacing = 1;
 	if (bbr_use_google_algo) {
 		bbr->rc_no_pacing = 0;
 		bbr->rc_use_google = 1;
 		bbr->r_ctl.bbr_google_discount = bbr_google_discount;
 		bbr->r_use_policer = bbr_policer_detection_enabled;
 	} else {
 		bbr->rc_use_google = 0;
 		bbr->r_ctl.bbr_google_discount = 0;
 		bbr->r_use_policer = 0;
 	}
 	if (bbr_ts_limiting)
 		bbr->rc_use_ts_limit = 1;
 	else
 		bbr->rc_use_ts_limit = 0;
 	if (bbr_ts_can_raise)
 		bbr->ts_can_raise = 1;
 	else
 		bbr->ts_can_raise = 0;
 	if (V_tcp_delack_enabled == 1)
 		tp->t_delayed_ack = 2;
 	else if (V_tcp_delack_enabled == 0)
 		tp->t_delayed_ack = 0;
 	else if (V_tcp_delack_enabled < 100)
 		tp->t_delayed_ack = V_tcp_delack_enabled;
 	else
 		tp->t_delayed_ack = 2;
 	if (bbr->rc_use_google == 0)
 		bbr->r_ctl.rc_probertt_int = bbr_rtt_probe_limit;
 	else
 		bbr->r_ctl.rc_probertt_int = (USECS_IN_SECOND * 10);
 	bbr->r_ctl.rc_min_rto_ms = bbr_rto_min_ms;
 	bbr->rc_max_rto_sec = bbr_rto_max_sec;
 	bbr->rc_init_win = bbr_def_init_win;
 	if (tp->t_flags & TF_REQ_TSTMP)
 		bbr->rc_last_options = TCP_TS_OVERHEAD;
 	bbr->r_ctl.rc_pace_max_segs = tp->t_maxseg - bbr->rc_last_options;
 	bbr->r_ctl.rc_high_rwnd = tp->snd_wnd;
 	bbr->r_init_rtt = 1;
 
 	counter_u64_add(bbr_flows_nohdwr_pacing, 1);
 	if (bbr_allow_hdwr_pacing)
 		bbr->bbr_hdw_pace_ena = 1;
 	else
 		bbr->bbr_hdw_pace_ena = 0;
 	if (bbr_sends_full_iwnd)
 		bbr->bbr_init_win_cheat = 1;
 	else
 		bbr->bbr_init_win_cheat = 0;
 	bbr->r_ctl.bbr_utter_max = bbr_hptsi_utter_max;
 	bbr->r_ctl.rc_drain_pg = bbr_drain_gain;
 	bbr->r_ctl.rc_startup_pg = bbr_high_gain;
 	bbr->rc_loss_exit = bbr_exit_startup_at_loss;
 	bbr->r_ctl.bbr_rttprobe_gain_val = bbr_rttprobe_gain;
 	bbr->r_ctl.bbr_hptsi_per_second = bbr_hptsi_per_second;
 	bbr->r_ctl.bbr_hptsi_segments_delay_tar = bbr_hptsi_segments_delay_tar;
 	bbr->r_ctl.bbr_hptsi_segments_max = bbr_hptsi_segments_max;
 	bbr->r_ctl.bbr_hptsi_segments_floor = bbr_hptsi_segments_floor;
 	bbr->r_ctl.bbr_hptsi_bytes_min = bbr_hptsi_bytes_min;
 	bbr->r_ctl.bbr_cross_over = bbr_cross_over;
 	bbr->r_ctl.rc_rtt_shrinks = cts;
 	if (bbr->rc_use_google) {
 		setup_time_filter(&bbr->r_ctl.rc_delrate,
 				  FILTER_TYPE_MAX,
 				  BBR_NUM_RTTS_FOR_GOOG_DEL_LIMIT);
 		setup_time_filter_small(&bbr->r_ctl.rc_rttprop,
 					FILTER_TYPE_MIN, (11 * USECS_IN_SECOND));
 	} else {
 		setup_time_filter(&bbr->r_ctl.rc_delrate,
 				  FILTER_TYPE_MAX,
 				  bbr_num_pktepo_for_del_limit);
 		setup_time_filter_small(&bbr->r_ctl.rc_rttprop,
 					FILTER_TYPE_MIN, (bbr_filter_len_sec * USECS_IN_SECOND));
 	}
 	bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_INIT, 0);
 	if (bbr_uses_idle_restart)
 		bbr->rc_use_idle_restart = 1;
 	else
 		bbr->rc_use_idle_restart = 0;
 	bbr->r_ctl.rc_bbr_cur_del_rate = 0;
 	bbr->r_ctl.rc_initial_hptsi_bw = bbr_initial_bw_bps;
 	if (bbr_resends_use_tso)
 		bbr->rc_resends_use_tso = 1;
 	if (tp->snd_una != tp->snd_max) {
 		/* Create a send map for the current outstanding data */
 		struct bbr_sendmap *rsm;
 
 		rsm = bbr_alloc(bbr);
 		if (rsm == NULL) {
 			uma_zfree(bbr_pcb_zone, *ptr);
 			*ptr = NULL;
 			return (ENOMEM);
 		}
 		rsm->r_rtt_not_allowed = 1;
 		rsm->r_tim_lastsent[0] = cts;
 		rsm->r_rtr_cnt = 1;
 		rsm->r_rtr_bytes = 0;
 		rsm->r_start = tp->snd_una;
 		rsm->r_end = tp->snd_max;
 		rsm->r_dupack = 0;
 		rsm->r_delivered = bbr->r_ctl.rc_delivered;
 		rsm->r_ts_valid = 0;
 		rsm->r_del_ack_ts = tp->ts_recent;
 		rsm->r_del_time = cts;
 		if (bbr->r_ctl.r_app_limited_until)
 			rsm->r_app_limited = 1;
 		else
 			rsm->r_app_limited = 0;
 		TAILQ_INSERT_TAIL(&bbr->r_ctl.rc_map, rsm, r_next);
 		TAILQ_INSERT_TAIL(&bbr->r_ctl.rc_tmap, rsm, r_tnext);
 		rsm->r_in_tmap = 1;
 		if (bbr->rc_bbr_state == BBR_STATE_PROBE_BW)
 			rsm->r_bbr_state = bbr_state_val(bbr);
 		else
 			rsm->r_bbr_state = 8;
 	}
 	if (bbr_use_rack_resend_cheat && (bbr->rc_use_google == 0))
 		bbr->bbr_use_rack_cheat = 1;
 	if (bbr_incr_timers && (bbr->rc_use_google == 0))
 		bbr->r_ctl.rc_incr_tmrs = 1;
 	if (bbr_include_tcp_oh && (bbr->rc_use_google == 0))
 		bbr->r_ctl.rc_inc_tcp_oh = 1;
 	if (bbr_include_ip_oh && (bbr->rc_use_google == 0))
 		bbr->r_ctl.rc_inc_ip_oh = 1;
 	if (bbr_include_enet_oh && (bbr->rc_use_google == 0))
 		bbr->r_ctl.rc_inc_enet_oh = 1;
 
 	bbr_log_type_statechange(bbr, cts, __LINE__);
 	if (TCPS_HAVEESTABLISHED(tp->t_state) &&
 	    (tp->t_srtt)) {
 		uint32_t rtt;
 
 		rtt = (TICKS_2_USEC(tp->t_srtt) >> TCP_RTT_SHIFT);
 		apply_filter_min_small(&bbr->r_ctl.rc_rttprop, rtt, cts);
 	}
 	/* announce the settings and state */
 	bbr_log_settings_change(bbr, BBR_RECOVERY_LOWRTT);
 	tcp_bbr_tso_size_check(bbr, cts);
 	/*
 	 * Now call the generic function to start a timer. This will place
 	 * the TCB on the hptsi wheel if a timer is needed with appropriate
 	 * flags.
 	 */
 	bbr_stop_all_timers(tp, bbr);
 	/* 
 	 * Validate the timers are not in usec, if they are convert.
 	 * BBR should in theory move to USEC and get rid of a
 	 * lot of the TICKS_2 calls.. but for now we stay
 	 * with tick timers.
 	 */
 	tcp_change_time_units(tp, TCP_TMR_GRANULARITY_TICKS);
 	TCPT_RANGESET(tp->t_rxtcur,
 	    ((tp->t_srtt >> 2) + tp->t_rttvar) >> 1,
 	    tp->t_rttmin, TCPTV_REXMTMAX);
 	bbr_start_hpts_timer(bbr, tp, cts, 5, 0, 0);
 	return (0);
 }
 
 /*
  * Report whether BBR may take over this connection, judged from the TCP
  * state and flags alone:
  *   0      - the connection is CLOSED or LISTEN, or it is past the
  *            handshake and either SACK was negotiated or
  *            bbr_sack_not_required is set.
  *   EAGAIN - the handshake is still in progress (SYN_SENT or
  *            SYN_RECEIVED); ask again once the connection is up.
  *   EINVAL - a FIN has already been sent, or SACK is required but was
  *            not negotiated.
  */
 static int
 bbr_handoff_ok(struct tcpcb *tp)
 {
 	switch (tp->t_state) {
 	case TCPS_CLOSED:
 	case TCPS_LISTEN:
 		/* Nothing in flight yet; fine, though it may not stick. */
 		return (0);
 	case TCPS_SYN_SENT:
 	case TCPS_SYN_RECEIVED:
 		/* The option negotiation is not known before ESTABLISHED. */
 		return (EAGAIN);
 	default:
 		break;
 	}
 	if (tp->t_flags & TF_SENTFIN)
 		return (EINVAL);
 	/* Without SACK (and with SACK required) BBR cannot run here. */
 	if (((tp->t_flags & TF_SACK_PERMIT) == 0) && !bbr_sack_not_required)
 		return (EINVAL);
 	return (0);
 }
 
 /*
  * Tear down the BBR state hanging off tp->t_fb_ptr (if any): release the
  * hardware pacing rate, log the end of the flow, fix up the flow counters,
  * free every sendmap entry on the rc_map and rc_free lists, bump the
  * dynamic/static rwnd statistic and finally free the control block itself.
  * Whether or not there was BBR state, snd_nxt is reset to snd_max on exit.
  *
  * tcb_is_purged is accepted for interface compatibility; this routine does
  * not consult it.
  */
 static void
 bbr_fini(struct tcpcb *tp, int32_t tcb_is_purged)
 {
 	if (tp->t_fb_ptr) {
 		uint32_t calc;
 		struct tcp_bbr *bbr;
 		struct bbr_sendmap *rsm;
 
 		bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 		/*
 		 * Release the pacing rate exactly once.  The pointer used to
 		 * be left set after this call and was released a second time
 		 * further down.
 		 */
 		if (bbr->r_ctl.crte != NULL)
 			tcp_rel_pacing_rate(bbr->r_ctl.crte, bbr->rc_tp);
 		bbr_log_flowend(bbr);
 		bbr->rc_tp = NULL;
 		if (bbr->bbr_hdrw_pacing)
 			counter_u64_add(bbr_flows_whdwr_pacing, -1);
 		else
 			counter_u64_add(bbr_flows_nohdwr_pacing, -1);
 		/* Already released above; just forget the pointer. */
 		bbr->r_ctl.crte = NULL;
 		/* Free everything still on the send map. */
 		rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 		while (rsm) {
 			TAILQ_REMOVE(&bbr->r_ctl.rc_map, rsm, r_next);
 			uma_zfree(bbr_zone, rsm);
 			rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 		}
 		/* And everything parked on the free list. */
 		rsm = TAILQ_FIRST(&bbr->r_ctl.rc_free);
 		while (rsm) {
 			TAILQ_REMOVE(&bbr->r_ctl.rc_free, rsm, r_next);
 			uma_zfree(bbr_zone, rsm);
 			rsm = TAILQ_FIRST(&bbr->r_ctl.rc_free);
 		}
 		/*
 		 * Classify the peer's window as dynamic when the highest
 		 * rwnd seen exceeds the initial one by more than 10%.
 		 */
 		calc = bbr->r_ctl.rc_high_rwnd - bbr->r_ctl.rc_init_rwnd;
 		if (calc > (bbr->r_ctl.rc_init_rwnd / 10))
 			BBR_STAT_INC(bbr_dynamic_rwnd);
 		else
 			BBR_STAT_INC(bbr_static_rwnd);
 		bbr->r_ctl.rc_free_cnt = 0;
 		uma_zfree(bbr_pcb_zone, tp->t_fb_ptr);
 		tp->t_fb_ptr = NULL;
 	}
 	/* Make sure snd_nxt is correctly set */
 	tp->snd_nxt = tp->snd_max;
 }
 
 /*
  * Bring BBR's cached view of the connection state in line with
  * tp->t_state: r_state records the state and r_substate is pointed at the
  * matching bbr_do_* routine.  LISTEN, CLOSED, TIME_WAIT and any
  * unrecognised state leave both fields untouched.  On ESTABLISHED,
  * rc_init_rwnd is additionally set to the larger of 'win' and the
  * connection's current snd_wnd.
  */
 static void
 bbr_set_state(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t win)
 {
 	switch (tp->t_state) {
 	case TCPS_SYN_SENT:
 		bbr->r_substate = bbr_do_syn_sent;
 		break;
 	case TCPS_SYN_RECEIVED:
 		bbr->r_substate = bbr_do_syn_recv;
 		break;
 	case TCPS_ESTABLISHED:
 		bbr->r_ctl.rc_init_rwnd = max(win, bbr->rc_tp->snd_wnd);
 		bbr->r_substate = bbr_do_established;
 		break;
 	case TCPS_CLOSE_WAIT:
 		bbr->r_substate = bbr_do_close_wait;
 		break;
 	case TCPS_FIN_WAIT_1:
 		bbr->r_substate = bbr_do_fin_wait_1;
 		break;
 	case TCPS_CLOSING:
 		bbr->r_substate = bbr_do_closing;
 		break;
 	case TCPS_LAST_ACK:
 		bbr->r_substate = bbr_do_lastack;
 		break;
 	case TCPS_FIN_WAIT_2:
 		bbr->r_substate = bbr_do_fin_wait_2;
 		break;
 	case TCPS_LISTEN:
 	case TCPS_CLOSED:
 	case TCPS_TIME_WAIT:
 	default:
 		/* Nothing to record for these states. */
 		return;
 	}
 	/* Every handled case records the state it just matched. */
 	bbr->r_state = tp->t_state;
 }
 
 /*
  * Step the sub-state counter (rc_bbr_substate) forward by one, wrapping
  * to 0 once it reaches BBR_SUBSTATE_COUNT, and then set up the pacing
  * gain, cwnd gain, state target and per-state timestamps for the
  * sub-state just entered.
  *
  * cts   - current timestamp as supplied by the caller.
  * line  - caller's line number, handed to bbr_log_type_statechange().
  * dolog - when non-zero the state change is logged.
  */
 static void
 bbr_substate_change(struct tcp_bbr *bbr, uint32_t cts, int32_t line, int dolog)
 {
 	/*
 	 * What state are we going into now? Are there adjustments
 	 * needed?
 	 */
 	int32_t old_state;
 
 	/* Remember the sub-state we are leaving before advancing. */
 	old_state = bbr_state_val(bbr);
 	if (bbr_state_val(bbr) == BBR_SUB_LEVEL1) {
 		/* Save the lowest srtt we saw in our end of the sub-state */
 		bbr->rc_hit_state_1 = 0;
 		if (bbr->r_ctl.bbr_smallest_srtt_this_state != 0xffffffff)
 			bbr->r_ctl.bbr_smallest_srtt_state2 = bbr->r_ctl.bbr_smallest_srtt_this_state;
 	}
 	bbr->rc_bbr_substate++;
 	if (bbr->rc_bbr_substate >= BBR_SUBSTATE_COUNT) {
 		/* Cycle back to first state-> gain */
 		bbr->rc_bbr_substate = 0;
 	}
 	if (bbr_state_val(bbr) == BBR_SUB_GAIN) {
 		/*
 		 * We enter the gain(5/4) cycle (possibly less if
 		 * shallow buffer detection is enabled)
 		 */
 		if (bbr->skip_gain) {
 			/*
 			 * Hardware pacing has set our rate to
 			 * the max and limited our b/w just
 			 * do level i.e. no gain.
 			 */
 			bbr->r_ctl.rc_bbr_hptsi_gain = bbr_hptsi_gain[BBR_SUB_LEVEL1];
 		} else if (bbr->gain_is_limited &&
 			   bbr->bbr_hdrw_pacing &&
 			   bbr->r_ctl.crte) {
 			/*
 			 * We can't gain above the hardware pacing
 			 * rate which is less than our rate + the gain
 			 * calculate the gain needed to reach the hardware
 			 * pacing rate..
 			 */
 			uint64_t bw, rate, gain_calc;
 
 			bw = bbr_get_bw(bbr);
 			rate = bbr->r_ctl.crte->rate;
 			if ((rate > bw) &&
 			    (((bw *  (uint64_t)bbr_hptsi_gain[BBR_SUB_GAIN]) / (uint64_t)BBR_UNIT) > rate)) {
 				/* Scale the gain so bw * gain lands on the hardware rate, never below unity. */
 				gain_calc = (rate * BBR_UNIT) / bw;
 				if (gain_calc < BBR_UNIT)
 					gain_calc = BBR_UNIT;
 				bbr->r_ctl.rc_bbr_hptsi_gain = (uint16_t)gain_calc;
 			} else {
 				bbr->r_ctl.rc_bbr_hptsi_gain = bbr_hptsi_gain[BBR_SUB_GAIN];
 			}
 		} else
 			bbr->r_ctl.rc_bbr_hptsi_gain = bbr_hptsi_gain[BBR_SUB_GAIN];
 		/* A zero rc_bbr_state_atflight means "target not yet reached". */
 		if ((bbr->rc_use_google == 0) && (bbr_gain_to_target == 0)) {
 			bbr->r_ctl.rc_bbr_state_atflight = cts;
 		} else
 			bbr->r_ctl.rc_bbr_state_atflight = 0;
 	} else if (bbr_state_val(bbr) == BBR_SUB_DRAIN) {
 		bbr->rc_hit_state_1 = 1;
 		bbr->r_ctl.rc_exta_time_gd = 0;
 		bbr->r_ctl.flightsize_at_drain = ctf_flight_size(bbr->rc_tp,
 						     (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 		if (bbr_state_drain_2_tar) {
 			bbr->r_ctl.rc_bbr_state_atflight = 0;
 		} else
 			bbr->r_ctl.rc_bbr_state_atflight = cts;
 		bbr->r_ctl.rc_bbr_hptsi_gain = bbr_hptsi_gain[BBR_SUB_DRAIN];
 	} else {
 		/* All other cycles hit here 2-7 */
 		if ((old_state == BBR_SUB_DRAIN) && bbr->rc_hit_state_1) {
 			/* Leaving drain: give back the cwnd saved when it was slammed down. */
 			if (bbr_sub_drain_slam_cwnd &&
 			    (bbr->rc_use_google == 0) &&
 			    (bbr->rc_tp->snd_cwnd < bbr->r_ctl.rc_saved_cwnd)) {
 				bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_saved_cwnd;
 				bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 			}
 			/* Time spent in the last state beyond one rttProp is carried as "extra". */
 			if ((cts - bbr->r_ctl.rc_bbr_state_time) > bbr_get_rtt(bbr, BBR_RTT_PROP))
 				bbr->r_ctl.rc_exta_time_gd += ((cts - bbr->r_ctl.rc_bbr_state_time) -
 							       bbr_get_rtt(bbr, BBR_RTT_PROP));
 			else
 				bbr->r_ctl.rc_exta_time_gd = 0;
 			if (bbr->r_ctl.rc_exta_time_gd) {
 				bbr->r_ctl.rc_level_state_extra = bbr->r_ctl.rc_exta_time_gd;
 				/* Now chop up the time for each state (div by 7) */
 				bbr->r_ctl.rc_level_state_extra /= 7;
 				if (bbr_rand_ot && bbr->r_ctl.rc_level_state_extra) {
 					/* Add a randomization */
 					bbr_randomize_extra_state_time(bbr);
 				}
 			}
 		}
 		bbr->r_ctl.rc_bbr_state_atflight = max(1, cts);
 		bbr->r_ctl.rc_bbr_hptsi_gain = bbr_hptsi_gain[bbr_state_val(bbr)];
 	}
 	if (bbr->rc_use_google) {
 		/* Google mode always marks the state as at-flight (never 0). */
 		bbr->r_ctl.rc_bbr_state_atflight = max(1, cts);
 	}
 	bbr->r_ctl.bbr_lost_at_state = bbr->r_ctl.rc_lost;
 	bbr->r_ctl.rc_bbr_cwnd_gain = bbr_cwnd_gain;
 	if (dolog)
 		bbr_log_type_statechange(bbr, cts, line);
 
 	/* Charge the time spent in the state being left to the per-state counters. */
 	if (SEQ_GT(cts, bbr->r_ctl.rc_bbr_state_time)) {
 		uint32_t time_in;
 
 		time_in = cts - bbr->r_ctl.rc_bbr_state_time;
 		if (bbr->rc_bbr_state == BBR_STATE_PROBE_BW) {
 			/* In PROBE_BW the counters are indexed per sub-state, offset by 5. */
 			counter_u64_add(bbr_state_time[(old_state + 5)], time_in);
 		} else {
 			counter_u64_add(bbr_state_time[bbr->rc_bbr_state], time_in);
 		}
 	}
 	bbr->r_ctl.bbr_smallest_srtt_this_state = 0xffffffff;
 	bbr_set_state_target(bbr, __LINE__);
 	if (bbr_sub_drain_slam_cwnd &&
 	    (bbr->rc_use_google == 0) &&
 	    (bbr_state_val(bbr) == BBR_SUB_DRAIN)) {
 		/* Slam down the cwnd */
 		bbr->r_ctl.rc_saved_cwnd = bbr->rc_tp->snd_cwnd;
 		bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_target_at_state;
 		if (bbr_sub_drain_app_limit) {
 			/* Go app limited if we are on a long drain */
 			bbr->r_ctl.r_app_limited_until = (bbr->r_ctl.rc_delivered +
 							  ctf_flight_size(bbr->rc_tp,
 							      (bbr->r_ctl.rc_sacked +
 							       bbr->r_ctl.rc_lost_bytes)));
 		}
 		bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 	}
 	if (bbr->rc_lt_use_bw) {
 		/* In policed mode we clamp pacing_gain to BBR_UNIT */
 		bbr->r_ctl.rc_bbr_hptsi_gain = BBR_UNIT;
 	}
 	/* Google changes TSO size every cycle */
 	if (bbr->rc_use_google)
 		tcp_bbr_tso_size_check(bbr, cts);
 	/* Stamp the start of the new sub-state. */
 	bbr->r_ctl.gain_epoch = cts;
 	bbr->r_ctl.rc_bbr_state_time = cts;
 	bbr->r_ctl.substate_pe = bbr->r_ctl.rc_pkt_epoch;
 }
 
 /*
  * Google-mode check for moving to the next sub-state.
  *
  * A DRAIN sub-state may end early, skipping the time checks, when
  * google_allow_early_out is 1 and the flight at input is already at or
  * below the state target.  Otherwise at least one rttProp must have
  * elapsed since rc_bbr_state_time.  GAIN additionally stays put until
  * the target flight is reached, unless google_consider_lost is set and
  * 'losses' is non-zero.
  */
 static void
 bbr_set_probebw_google_gains(struct tcp_bbr *bbr, uint32_t cts, uint32_t losses)
 {
 	int drained_early;
 
 	/* Have we reached our target flight size, possibly early? */
 	drained_early = ((bbr_state_val(bbr) == BBR_SUB_DRAIN) &&
 	    (google_allow_early_out == 1) &&
 	    (bbr->r_ctl.rc_flight_at_input <= bbr->r_ctl.rc_target_at_state));
 	if (!drained_early) {
 		if (TSTMP_LT(cts, bbr->r_ctl.rc_bbr_state_time))
 			return;
 		/* A full rttProp must pass before we can change states. */
 		if ((cts - bbr->r_ctl.rc_bbr_state_time) < bbr_get_rtt(bbr, BBR_RTT_PROP))
 			return;
 		/*
 		 * The time has passed, but GAIN has extra rules: loss
 		 * (when considered) exits at once, otherwise we hold
 		 * until the target is reached (gain-to-target).
 		 */
 		if ((bbr_state_val(bbr) == BBR_SUB_GAIN) &&
 		    !(google_consider_lost && losses) &&
 		    (bbr->r_ctl.rc_target_at_state > bbr->r_ctl.rc_flight_at_input))
 			return;
 	}
 	/* For gain we must reach our target, all others last 1 rttProp */
 	bbr_substate_change(bbr, cts, __LINE__, 1);
 }
 
 /*
  * Decide whether the current sub-state has run its course and, if so,
  * advance to the next one through bbr_substate_change().  Google mode is
  * handed off entirely to bbr_set_probebw_google_gains().
  *
  * While rc_bbr_state_atflight is 0 the sub-state has not yet reached its
  * flight target: the DRAIN branch keeps reducing the pacing gain and the
  * other (gain) branch waits for the target, the peer's window or a loss.
  * Once rc_bbr_state_atflight is set, later calls fall to the time checks
  * at change_state, which require a full cycle time (plus any
  * rc_level_state_extra) to have elapsed since rc_bbr_state_time.
  *
  * cts    - current timestamp as supplied by the caller.
  * losses - only forwarded to the google variant.
  */
 static void
 bbr_set_probebw_gains(struct tcp_bbr *bbr, uint32_t cts, uint32_t losses)
 {
 	uint32_t flight, bbr_cur_cycle_time;
 
 	if (bbr->rc_use_google) {
 		bbr_set_probebw_google_gains(bbr, cts, losses);
 		return;
 	}
 	if (cts == 0) {
 		/*
 		 * Never allow cts to be 0; we
 		 * do this so we can judge if
 		 * we have set a timestamp.
 		 */
 		cts = 1;
 	}
 	/* The length of one cycle is either the packet RTT or rttProp. */
 	if (bbr_state_is_pkt_epoch)
 		bbr_cur_cycle_time = bbr_get_rtt(bbr, BBR_RTT_PKTRTT);
 	else
 		bbr_cur_cycle_time = bbr_get_rtt(bbr, BBR_RTT_PROP);
 
 	if (bbr->r_ctl.rc_bbr_state_atflight == 0) {
 		if (bbr_state_val(bbr) == BBR_SUB_DRAIN) {
 			flight = ctf_flight_size(bbr->rc_tp,
 				     (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 			if (bbr_sub_drain_slam_cwnd && bbr->rc_hit_state_1) {
 				/* Keep it slam down */
 				if (bbr->rc_tp->snd_cwnd > bbr->r_ctl.rc_target_at_state) {
 					bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_target_at_state;
 					bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 				}
 				if (bbr_sub_drain_app_limit) {
 					/* Go app limited if we are on a long drain */
 					bbr->r_ctl.r_app_limited_until = (bbr->r_ctl.rc_delivered + flight);
 				}
 			}
 			if (TSTMP_GT(cts, bbr->r_ctl.gain_epoch) &&
 			    (((cts - bbr->r_ctl.gain_epoch) > bbr_get_rtt(bbr, BBR_RTT_PROP)) ||
 			     (flight >= bbr->r_ctl.flightsize_at_drain))) {
 				/*
 				 * Still here after the same time as
 				 * the gain. We need to drain harder
 				 * for the next srtt. Reduce by a set amount
 				 * the gain drop is capped at DRAIN states
 				 * value (88).
 				 */
 				bbr->r_ctl.flightsize_at_drain = flight;
 				if (bbr_drain_drop_mul &&
 				    bbr_drain_drop_div &&
 				    (bbr_drain_drop_mul < bbr_drain_drop_div)) {
 					/* Use your specific drop value (def 4/5 = 20%) */
 					bbr->r_ctl.rc_bbr_hptsi_gain *= bbr_drain_drop_mul;
 					bbr->r_ctl.rc_bbr_hptsi_gain /= bbr_drain_drop_div;
 				} else {
 					/* You get drop of 20% */
 					bbr->r_ctl.rc_bbr_hptsi_gain *= 4;
 					bbr->r_ctl.rc_bbr_hptsi_gain /= 5;
 				}
 				if (bbr->r_ctl.rc_bbr_hptsi_gain <= bbr_drain_floor) {
 					/* Clamp the gain at the floor, and never let it reach 0 */
 					bbr->r_ctl.rc_bbr_hptsi_gain = max(bbr_drain_floor, 1);
 				}
 				bbr_log_exit_gain(bbr, cts, 4);
 				/*
 				 * Extend out so we wait another
 				 * epoch before dropping again.
 				 */
 				bbr->r_ctl.gain_epoch = cts;
 			}
 			if (flight <= bbr->r_ctl.rc_target_at_state) {
 				/* Drained to target: restore the saved cwnd and mark the state at-flight. */
 				if (bbr_sub_drain_slam_cwnd &&
 				    (bbr->rc_use_google == 0) &&
 				    (bbr->rc_tp->snd_cwnd < bbr->r_ctl.rc_saved_cwnd)) {
 					bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_saved_cwnd;
 					bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 				}
 				bbr->r_ctl.rc_bbr_state_atflight = max(cts, 1);
 				bbr_log_exit_gain(bbr, cts, 3);
 			}
 		} else {
 			/* It's a gain */
 			if (bbr->r_ctl.rc_lost > bbr->r_ctl.bbr_lost_at_state) {
 				/* Loss since entering the state: go straight to the exit checks. */
 				bbr->r_ctl.rc_bbr_state_atflight = max(cts, 1);
 				goto change_state;
 			}
 			/* At target, or within one segment of filling the peer's window. */
 			if ((ctf_outstanding(bbr->rc_tp) >= bbr->r_ctl.rc_target_at_state) ||
 			    ((ctf_outstanding(bbr->rc_tp) +  bbr->rc_tp->t_maxseg - 1) >=
 			     bbr->rc_tp->snd_wnd)) {
 				bbr->r_ctl.rc_bbr_state_atflight = max(cts, 1);
 				bbr_log_exit_gain(bbr, cts, 2);
 			}
 		}
 		/**
 		 * We fall through and return always one of two things has
 		 * occurred.
 		 * 1) We are still not at target
 		 *    <or>
 		 * 2) We reached the target and set rc_bbr_state_atflight
 		 *    which means we no longer hit this block
 		 *    next time we are called.
 		 */
 		return;
 	}
 change_state:
 	if (TSTMP_LT(cts, bbr->r_ctl.rc_bbr_state_time))
 		return;
 	if ((cts - bbr->r_ctl.rc_bbr_state_time) < bbr_cur_cycle_time) {
 		/* Less than a full time-period has passed */
 		return;
 	}
 	if (bbr->r_ctl.rc_level_state_extra &&
 	    (bbr_state_val(bbr) > BBR_SUB_DRAIN) &&
 	    ((cts - bbr->r_ctl.rc_bbr_state_time) <
 	     (bbr_cur_cycle_time + bbr->r_ctl.rc_level_state_extra))) {
 		/* Less than a full time-period + extra has passed */
 		return;
 	}
 	if (bbr_gain_gets_extra_too &&
 	    bbr->r_ctl.rc_level_state_extra &&
 	    (bbr_state_val(bbr) == BBR_SUB_GAIN) &&
 	    ((cts - bbr->r_ctl.rc_bbr_state_time) <
 	     (bbr_cur_cycle_time + bbr->r_ctl.rc_level_state_extra))) {
 		/* Less than a full time-period + extra has passed */
 		return;
 	}
 	bbr_substate_change(bbr, cts, __LINE__, 1);
 }
 
 /*
  * Return the state target for the supplied gain.
  *
  * In google mode this is simply bbr_get_target_cwnd().  Otherwise the raw
  * target cwnd is rounded up to a multiple of the effective segment size
  * (the smaller of t_maxseg less the option overhead and rc_pace_max_segs)
  * and is never allowed to fall below get_min_cwnd().
  */
 static uint32_t
 bbr_get_a_state_target(struct tcp_bbr *bbr, uint32_t gain)
 {
 	uint32_t seg, target;
 
 	/* Google just uses the cwnd target */
 	if (bbr->rc_use_google)
 		return (bbr_get_target_cwnd(bbr, bbr_get_bw(bbr), gain));
 
 	seg = min((bbr->rc_tp->t_maxseg - bbr->rc_last_options),
 	    bbr->r_ctl.rc_pace_max_segs);
 	/* Base cwnd with gain applied, rounded up to whole segments. */
 	target = roundup(bbr_get_raw_target_cwnd(bbr, bbr_get_bw(bbr), gain),
 	    seg);
 	/* Enforce the minimum cwnd. */
 	if (target < get_min_cwnd(bbr))
 		target = get_min_cwnd(bbr);
 	return (target);
 }
 
 /*
  * Recompute rc_target_at_state for the current state and log which rule
  * produced it.  The rule number ('meth') passed to the logger is:
  *   1 - PROBE_RTT using the old method (no probe-rtt gain configured, or
  *       google mode): bbr_rtt_probe_cwndtarg segments.
  *   2 - PROBE_BW with a pacing gain above BBR_UNIT: target from that gain.
  *   3 - bbr_target_is_bbunit set, or google mode: target at BBR_UNIT.
  *   4 - pacing gain below the DRAIN gain: target from the DRAIN gain.
  *   5 - everything else: target from the current pacing gain.
  * 'line' is the caller's line number, passed through to the log.
  */
 static void
 bbr_set_state_target(struct tcp_bbr *bbr, int line)
 {
 	uint32_t target, rule;
 
 	if ((bbr->rc_bbr_state == BBR_STATE_PROBE_RTT) &&
 	    ((bbr->r_ctl.bbr_rttprobe_gain_val == 0) || bbr->rc_use_google)) {
 		/* Special case using old probe-rtt method */
 		target = bbr_rtt_probe_cwndtarg *
 		    (bbr->rc_tp->t_maxseg - bbr->rc_last_options);
 		rule = 1;
 	} else if ((bbr->rc_bbr_state == BBR_STATE_PROBE_BW) &&
 	    (bbr->r_ctl.rc_bbr_hptsi_gain > BBR_UNIT)) {
 		/* For gain cycle we use the hptsi gain */
 		target = bbr_get_a_state_target(bbr, bbr->r_ctl.rc_bbr_hptsi_gain);
 		rule = 2;
 	} else if ((bbr_target_is_bbunit) || bbr->rc_use_google) {
 		/* If configured, or for google, all other states get BBR_UNIT. */
 		target = bbr_get_a_state_target(bbr, BBR_UNIT);
 		rule = 3;
 	} else if (bbr->r_ctl.rc_bbr_hptsi_gain < bbr_hptsi_gain[BBR_SUB_DRAIN]) {
 		/* We don't set a target goal below the drain gain. */
 		target = bbr_get_a_state_target(bbr, bbr_hptsi_gain[BBR_SUB_DRAIN]);
 		rule = 4;
 	} else {
 		/* Default for non-google mode: follow the pacing gain. */
 		target = bbr_get_a_state_target(bbr, bbr->r_ctl.rc_bbr_hptsi_gain);
 		rule = 5;
 	}
 	bbr_log_set_of_state_target(bbr, target, line, rule);
 	bbr->r_ctl.rc_target_at_state = target;
 }
 
 /*
  * Switch the connection into BBR_STATE_PROBE_RTT.
  *
  * Snapshots the loss and flight counters, charges the time spent in the
  * state being left to its counter, saves the cwnd, and then either drops
  * the cwnd to bbr_rtt_probe_cwndtarg segments (no probe-rtt gain
  * configured, or google mode) or installs the configured probe-rtt
  * pacing gain.  rc_bbr_enters_probertt is set to cts when the flight is
  * already at or below target and to 0 otherwise.
  *
  * cts  - current timestamp as supplied by the caller.
  * line - caller's line number, used for the state-change log.
  */
 static void
 bbr_enter_probe_rtt(struct tcp_bbr *bbr, uint32_t cts, int32_t line)
 {
 	/* Change to probe_rtt */
 	uint32_t time_in;
 
 	bbr->r_ctl.bbr_lost_at_state = bbr->r_ctl.rc_lost;
 	bbr->r_ctl.flightsize_at_drain = ctf_flight_size(bbr->rc_tp,
 					     (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 	bbr->r_ctl.r_app_limited_until = (bbr->r_ctl.flightsize_at_drain
 					  + bbr->r_ctl.rc_delivered);
 	/* Setup so we force feed the filter */
 	if (bbr->rc_use_google || bbr_probertt_sets_rtt)
 		bbr->rc_prtt_set_ts = 1;
 	/* Account the time spent in the state we are leaving. */
 	if (SEQ_GT(cts, bbr->r_ctl.rc_bbr_state_time)) {
 		time_in = cts - bbr->r_ctl.rc_bbr_state_time;
 		counter_u64_add(bbr_state_time[bbr->rc_bbr_state], time_in);
 	}
 	bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_ENTERPROBE, 0);
 	bbr->r_ctl.rc_rtt_shrinks = cts;
 	bbr->r_ctl.last_in_probertt = cts;
 	bbr->r_ctl.rc_probertt_srttchktim = cts;
 	bbr->r_ctl.rc_bbr_state_time = cts;
 	bbr->rc_bbr_state = BBR_STATE_PROBE_RTT;
 	/* We need to force the filter to update */
 
 	/*
 	 * Save the cwnd so it can be restored on exit.  If the cwnd is
 	 * currently slammed down for a DRAIN sub-state, only overwrite the
 	 * saved value when the current cwnd is larger.
 	 */
 	if ((bbr_sub_drain_slam_cwnd) &&
 	    bbr->rc_hit_state_1 &&
 	    (bbr->rc_use_google == 0) &&
 	    (bbr_state_val(bbr) == BBR_SUB_DRAIN)) {
 		if (bbr->rc_tp->snd_cwnd > bbr->r_ctl.rc_saved_cwnd)
 			bbr->r_ctl.rc_saved_cwnd = bbr->rc_tp->snd_cwnd;
 	} else
 		bbr->r_ctl.rc_saved_cwnd = bbr->rc_tp->snd_cwnd;
 	/* Update the lost */
 	bbr->r_ctl.rc_lost_at_startup = bbr->r_ctl.rc_lost;
 	if ((bbr->r_ctl.bbr_rttprobe_gain_val == 0) || bbr->rc_use_google){
 		/* Set the cwnd to bbr_rtt_probe_cwndtarg segments (PROBE_RTT_MIN) */
 		bbr->rc_tp->snd_cwnd = bbr_rtt_probe_cwndtarg * (bbr->rc_tp->t_maxseg - bbr->rc_last_options);
 		bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 		bbr->r_ctl.rc_bbr_hptsi_gain = BBR_UNIT;
 		bbr->r_ctl.rc_bbr_cwnd_gain = BBR_UNIT;
 		bbr_log_set_of_state_target(bbr, bbr->rc_tp->snd_cwnd, __LINE__, 6);
 		bbr->r_ctl.rc_target_at_state = bbr->rc_tp->snd_cwnd;
 	} else {
 		/*
 		 * We bring it down slowly by using a hptsi gain that is
 		 * probably 75%. This will slowly float down our outstanding
 		 * without tampering with the cwnd.
 		 */
 		bbr->r_ctl.rc_bbr_hptsi_gain = bbr->r_ctl.bbr_rttprobe_gain_val;
 		bbr->r_ctl.rc_bbr_cwnd_gain = BBR_UNIT;
 		bbr_set_state_target(bbr, __LINE__);
 		if (bbr_prtt_slam_cwnd &&
 		    (bbr->rc_tp->snd_cwnd > bbr->r_ctl.rc_target_at_state)) {
 			bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_target_at_state;
 			bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 		}
 	}
 	if (ctf_flight_size(bbr->rc_tp,
 		(bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes)) <=
 	    bbr->r_ctl.rc_target_at_state) {
 		/* We are at target */
 		bbr->r_ctl.rc_bbr_enters_probertt = cts;
 	} else {
 		/* We need to come down to reach target before our time begins */
 		bbr->r_ctl.rc_bbr_enters_probertt = 0;
 	}
 	/* Remember the packet epoch at which probe-rtt began. */
 	bbr->r_ctl.rc_pe_of_prtt = bbr->r_ctl.rc_pkt_epoch;
 	BBR_STAT_INC(bbr_enter_probertt);
 	bbr_log_exit_gain(bbr, cts, 0);
 	bbr_log_type_statechange(bbr, cts, line);
 }
 
 /*
  * Re-evaluate the probe-rtt interval (rc_probertt_int) and the length of
  * the rttProp filter.  Does nothing unless bbr_can_adjust_probertt is set
  * and the connection is not in google mode.
  *
  * The candidate interval is rttProp * (BBR_SUBSTATE_COUNT + 1), rounded
  * up to a whole second.  The interval is raised to the candidate when
  * the candidate is larger, and otherwise shrunk back toward
  * bbr_rtt_probe_limit.  Any change is logged with a code in 'val':
  * 1 = raised, 2 = reset to the default, 3 = reduced.
  */
 static void
 bbr_check_probe_rtt_limits(struct tcp_bbr *bbr, uint32_t cts)
 {
 	/*
 	 * Sanity check on probe-rtt intervals.
 	 * In crazy situations where we are competing
 	 * against new-reno flows with huge buffers
 	 * our rtt-prop interval could come to dominate
 	 * things if we can't get through a full set
 	 * of cycles, we need to adjust it.
 	 */
 	if (bbr_can_adjust_probertt &&
 	    (bbr->rc_use_google == 0)) {
 		uint16_t val = 0;
 		uint32_t cur_rttp, fval, newval, baseval;
 
 		/* Are we too small and going into probe-rtt too often? */
 		baseval = (bbr_get_rtt(bbr, BBR_RTT_PROP) * (BBR_SUBSTATE_COUNT + 1));
 		cur_rttp = roundup(baseval, USECS_IN_SECOND);
 		fval = bbr_filter_len_sec * USECS_IN_SECOND;
 		if (bbr_is_ratio == 0) {
 			/* Keep the filter longer than the interval by a fixed difference. */
 			if (fval > bbr_rtt_probe_limit)
 				newval = cur_rttp + (fval - bbr_rtt_probe_limit);
 			else
 				newval = cur_rttp;
 		} else {
 			int mul;
 
 			/*
 			 * Keep the filter a whole multiple of the interval.
 			 * NOTE(review): this divides by bbr_rtt_probe_limit
 			 * with no zero check, and mul is 0 whenever fval is
 			 * smaller than the limit -- confirm the tunable's
 			 * allowed range.
 			 */
 			mul = fval / bbr_rtt_probe_limit;
 			newval = cur_rttp * mul;
 		}
 		if (cur_rttp > 	bbr->r_ctl.rc_probertt_int) {
 			bbr->r_ctl.rc_probertt_int = cur_rttp;
 			reset_time_small(&bbr->r_ctl.rc_rttprop, newval);
 			val = 1;
 		} else {
 			/*
 			 * No adjustments were made
 			 * do we need to shrink it?
 			 */
 			if (bbr->r_ctl.rc_probertt_int > bbr_rtt_probe_limit) {
 				if (cur_rttp <= bbr_rtt_probe_limit) {
 					/*
 					 * Things have calmed down lets
 					 * shrink all the way to default
 					 */
 					bbr->r_ctl.rc_probertt_int = bbr_rtt_probe_limit;
 					reset_time_small(&bbr->r_ctl.rc_rttprop,
 							 (bbr_filter_len_sec * USECS_IN_SECOND));
 					/* Updated only so the log below reports what was applied. */
 					cur_rttp = bbr_rtt_probe_limit;
 					newval = (bbr_filter_len_sec * USECS_IN_SECOND);
 					val = 2;
 				} else {
 					/*
 					 * Well does some adjustment make sense?
 					 */
 					if (cur_rttp < bbr->r_ctl.rc_probertt_int) {
 						/* We can reduce interval time some */
 						bbr->r_ctl.rc_probertt_int = cur_rttp;
 						reset_time_small(&bbr->r_ctl.rc_rttprop, newval);
 						val = 3;
 					}
 				}
 			}
 		}
 		if (val)
 			bbr_log_rtt_shrinks(bbr, cts, cur_rttp, newval, __LINE__, BBR_RTTS_RESETS_VALUES, val);
 	}
 }
 
 /*
  * Leave the probe-rtt state.
  *
  * Restores the cwnd saved on entry (only ever raising it), refreshes the
  * rtt-shrink and probe-rtt timestamps, charges the time spent in the
  * state to its counter, and then moves either to PROBE_BW (when
  * rc_filled_pipe is set) or back to STARTUP.  Finishes by re-checking
  * the probe-rtt interval limits.
  *
  * cts - current timestamp as supplied by the caller.
  */
 static void
 bbr_exit_probe_rtt(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t cts)
 {
 	/* Exit probe-rtt */
 
 	if (tp->snd_cwnd < bbr->r_ctl.rc_saved_cwnd) {
 		tp->snd_cwnd = bbr->r_ctl.rc_saved_cwnd;
 		bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 	}
 	bbr_log_exit_gain(bbr, cts, 1);
 	bbr->rc_hit_state_1 = 0;
 	bbr->r_ctl.rc_rtt_shrinks = cts;
 	bbr->r_ctl.last_in_probertt = cts;
 	bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_RTTPROBE, 0);
 	bbr->r_ctl.bbr_lost_at_state = bbr->r_ctl.rc_lost;
 	bbr->r_ctl.r_app_limited_until = (ctf_flight_size(tp,
 					      (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes)) +
 					  bbr->r_ctl.rc_delivered);
 	/* Account the time spent in the state we are leaving. */
 	if (SEQ_GT(cts, bbr->r_ctl.rc_bbr_state_time)) {
 		uint32_t time_in;
 
 		time_in = cts - bbr->r_ctl.rc_bbr_state_time;
 		counter_u64_add(bbr_state_time[bbr->rc_bbr_state], time_in);
 	}
 	if (bbr->rc_filled_pipe) {
 		/* Switch to probe_bw */
 		bbr->rc_bbr_state = BBR_STATE_PROBE_BW;
 		bbr->rc_bbr_substate = bbr_pick_probebw_substate(bbr, cts);
 		bbr->r_ctl.rc_bbr_cwnd_gain = bbr_cwnd_gain;
 		/* dolog is 0 here; the state change is logged right after instead. */
 		bbr_substate_change(bbr, cts, __LINE__, 0);
 		bbr_log_type_statechange(bbr, cts, __LINE__);
 	} else {
 		/* Back to startup */
 		bbr->rc_bbr_state = BBR_STATE_STARTUP;
 		bbr->r_ctl.rc_bbr_state_time = cts;
 		/*
 		 * We don't want to give a complete free 3
 		 * measurements until we exit, so we use
 		 * the number of pe's we were in probe-rtt
 		 * to add to the startup_epoch. That way
 		 * we will still retain the old state.
 		 */
 		bbr->r_ctl.rc_bbr_last_startup_epoch += (bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_pe_of_prtt);
 		bbr->r_ctl.rc_lost_at_startup = bbr->r_ctl.rc_lost;
 		/* Make sure to use the lower pg when shifting back in */
 		if (bbr->r_ctl.rc_lost &&
 		    bbr_use_lower_gain_in_startup &&
 		    (bbr->rc_use_google == 0))
 			bbr->r_ctl.rc_bbr_hptsi_gain = bbr_startup_lower;
 		else
 			bbr->r_ctl.rc_bbr_hptsi_gain = bbr->r_ctl.rc_startup_pg;
 		bbr->r_ctl.rc_bbr_cwnd_gain = bbr->r_ctl.rc_startup_pg;
 		/* Probably not needed but set it anyway */
 		bbr_set_state_target(bbr, __LINE__);
 		bbr_log_type_statechange(bbr, cts, __LINE__);
 		bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 		    bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 0);
 	}
 	bbr_check_probe_rtt_limits(bbr, cts);
 }
 
 /*
  * Return 1 when it is time to enter probe-rtt, 0 otherwise.
  *
  * Never while in persist.  Otherwise probe-rtt is due when we are past
  * the initial window and at least rc_probertt_int has elapsed since
  * rc_rtt_shrinks, or, if bbr_can_force_probertt is set, when more than
  * rc_probertt_int has elapsed since we were last in probe-rtt.
  */
 static int32_t inline
 bbr_should_enter_probe_rtt(struct tcp_bbr *bbr, uint32_t cts)
 {
 	/* Both triggers below require that we are not in persist. */
 	if (bbr->rc_in_persist != 0)
 		return (0);
 
 	/* Regular trigger: the rttProp sample has aged out. */
 	if ((bbr->rc_past_init_win == 1) &&
 	    (bbr_calc_time(cts, bbr->r_ctl.rc_rtt_shrinks) >= bbr->r_ctl.rc_probertt_int))
 		return (1);
 
 	/* Forced trigger: too long since the last probe-rtt. */
 	if (bbr_can_force_probertt &&
 	    (TSTMP_GT(cts, bbr->r_ctl.last_in_probertt)) &&
 	    ((cts - bbr->r_ctl.last_in_probertt) > bbr->r_ctl.rc_probertt_int))
 		return (1);
 
 	return (0);
 }
 
 /*
  * Google-mode startup exit test.  Returns 1 when startup should be left,
  * 0 otherwise.
  *
  * Only evaluated when pkt_epoch is non-zero.  Whenever the full bandwidth
  * estimate has grown by at least bbr_start_exit percent over
  * rc_bbr_lastbtlbw, the reference bandwidth and rc_bbr_last_startup_epoch
  * are refreshed.  Startup ends once BBR_STARTUP_EPOCHS packet epochs have
  * gone by since the last such refresh.
  */
 static int32_t
 bbr_google_startup(struct tcp_bbr *bbr, uint32_t cts, int32_t  pkt_epoch)
 {
 	uint64_t cur_bw, needed_bw;
 
 	/* Need to be on a pkt-epoch to continue. */
 	if (pkt_epoch == 0)
 		return (0);
 
 	cur_bw = bbr_get_full_bw(bbr);
 	needed_bw = bbr->r_ctl.rc_bbr_lastbtlbw +
 	    ((bbr->r_ctl.rc_bbr_lastbtlbw *
 	      (uint64_t)bbr_start_exit) / (uint64_t)100);
 	if (cur_bw >= needed_bw) {
 		/* Still growing: restart the count of non-gaining epochs. */
 		bbr->r_ctl.rc_bbr_last_startup_epoch = bbr->r_ctl.rc_pkt_epoch;
 		bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 		    bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 3);
 		bbr->r_ctl.rc_bbr_lastbtlbw = cur_bw;
 	}
 	if ((bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_bbr_last_startup_epoch) >= BBR_STARTUP_EPOCHS)
 		return (1);
 
 	bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 	    bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 8);
 	return (0);
 }
 
 /*
  * Decide whether the connection should leave the STARTUP state.
  *
  * bbr       - per-connection BBR control block.
  * cts       - current time stamp handed in by the caller.
  * epoch     - not referenced by this function.
  * pkt_epoch - non-zero when the caller is on a packet-epoch boundary; the
  *             exit tests are only run in that case.
  *
  * Returns 1 when startup should be exited and 0 when we stay in startup
  * (this includes the case where probe-rtt was entered instead). When
  * rc_use_google is set the decision is delegated to bbr_google_startup()
  * and its return value is passed straight through.
  */
 static int32_t inline
 bbr_state_startup(struct tcp_bbr *bbr, uint32_t cts, int32_t epoch, int32_t pkt_epoch)
 {
 	/* Have we gained 25% in the last 3 packet based epoch's? */
 	uint64_t btlbw, gain;
 	int do_exit;
 	int delta, rtt_gain;
 
 	if ((bbr->rc_tp->snd_una == bbr->rc_tp->snd_max) &&
 	    (bbr_calc_time(cts, bbr->r_ctl.rc_went_idle_time) >= bbr_rtt_probe_time)) {
 		/*
 		 * This qualifies as a RTT_PROBE session since we drop the
 		 * data outstanding to nothing and waited more than
 		 * bbr_rtt_probe_time.
 		 */
 		bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_WASIDLE, 0);
 		bbr_set_reduced_rtt(bbr, cts, __LINE__);
 	}
 	if (bbr_should_enter_probe_rtt(bbr, cts)) {
 		bbr_enter_probe_rtt(bbr, cts, __LINE__);
 		return (0);
 	}
 	if (bbr->rc_use_google)
 		return (bbr_google_startup(bbr, cts,  pkt_epoch));
 
 	if ((bbr->r_ctl.rc_lost > bbr->r_ctl.rc_lost_at_startup) &&
 	    (bbr_use_lower_gain_in_startup)) {
 		/* Drop to a lower gain 1.5 x since we saw loss */
 		bbr->r_ctl.rc_bbr_hptsi_gain = bbr_startup_lower;
 	}
 	if (pkt_epoch == 0) {
 		/*
 		 * Need to be on a pkt-epoch to continue.
 		 */
 		return (0);
 	}
 	if (bbr_rtt_gain_thresh) {
 		/*
 		 * Do we allow a flow to stay
 		 * in startup with no loss and no
 		 * gain in rtt over a set threshold?
 		 */
 		if (bbr->r_ctl.rc_pkt_epoch_rtt &&
 		    bbr->r_ctl.startup_last_srtt &&
 		    (bbr->r_ctl.rc_pkt_epoch_rtt > bbr->r_ctl.startup_last_srtt)) {
 			delta = bbr->r_ctl.rc_pkt_epoch_rtt - bbr->r_ctl.startup_last_srtt;
 			rtt_gain = (delta * 100) / bbr->r_ctl.startup_last_srtt;
 		} else {
 			/*
 			 * No measurable RTT growth. Zero delta as well as
 			 * rtt_gain: delta is handed to the startup log
 			 * below and must not be read uninitialized.
 			 */
 			delta = 0;
 			rtt_gain = 0;
 		}
 		if ((bbr->r_ctl.startup_last_srtt == 0)  ||
 		    (bbr->r_ctl.rc_pkt_epoch_rtt < bbr->r_ctl.startup_last_srtt))
 			/* First time or new lower value */
 			bbr->r_ctl.startup_last_srtt = bbr->r_ctl.rc_pkt_epoch_rtt;
 
 		if ((bbr->r_ctl.rc_lost == 0) &&
 		    (rtt_gain < bbr_rtt_gain_thresh)) {
 			/*
 			 * No loss, and we are under
 			 * our gain threshold for
 			 * increasing RTT.
 			 */
 			if (bbr->r_ctl.rc_bbr_last_startup_epoch < bbr->r_ctl.rc_pkt_epoch)
 				bbr->r_ctl.rc_bbr_last_startup_epoch++;
 			bbr_log_startup_event(bbr, cts, rtt_gain,
 					      delta, bbr->r_ctl.startup_last_srtt, 10);
 			return (0);
 		}
 	}
 	if ((bbr->r_ctl.r_measurement_count == bbr->r_ctl.last_startup_measure) &&
 	    (bbr->r_ctl.rc_lost_at_startup == bbr->r_ctl.rc_lost) &&
 	    (!IN_RECOVERY(bbr->rc_tp->t_flags))) {
 		/*
 		 * We only assess if we have a new measurement when
 		 * we have no loss and are not in recovery.
 		 * Drag up by one our last_startup epoch so we will hold
 		 * the number of non-gain we have already accumulated.
 		 */
 		if (bbr->r_ctl.rc_bbr_last_startup_epoch < bbr->r_ctl.rc_pkt_epoch)
 			bbr->r_ctl.rc_bbr_last_startup_epoch++;
 		bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 				      bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 9);
 		return (0);
 	}
 	/* Case where we reduced the lost (bad retransmit) */
 	if (bbr->r_ctl.rc_lost_at_startup > bbr->r_ctl.rc_lost)
 		bbr->r_ctl.rc_lost_at_startup = bbr->r_ctl.rc_lost;
 	bbr->r_ctl.last_startup_measure = bbr->r_ctl.r_measurement_count;
 	btlbw = bbr_get_full_bw(bbr);
 	/*
 	 * "gain" is the bandwidth we must reach to count as still growing:
 	 * the previous best plus a percentage, where the percentage depends
 	 * on whether we already dropped to the lower startup gain.
 	 */
 	if (bbr->r_ctl.rc_bbr_hptsi_gain == bbr_startup_lower)
 		gain = ((bbr->r_ctl.rc_bbr_lastbtlbw *
 			 (uint64_t)bbr_low_start_exit) / (uint64_t)100) + bbr->r_ctl.rc_bbr_lastbtlbw;
 	else
 		gain = ((bbr->r_ctl.rc_bbr_lastbtlbw *
 			 (uint64_t)bbr_start_exit) / (uint64_t)100) + bbr->r_ctl.rc_bbr_lastbtlbw;
 	do_exit = 0;
 	if (btlbw > bbr->r_ctl.rc_bbr_lastbtlbw)
 		bbr->r_ctl.rc_bbr_lastbtlbw = btlbw;
 	if (btlbw >= gain) {
 		/* We grew enough: restart the count of no-gain epochs. */
 		bbr->r_ctl.rc_bbr_last_startup_epoch = bbr->r_ctl.rc_pkt_epoch;
 		/* Update the lost so we won't exit in next set of tests */
 		bbr->r_ctl.rc_lost_at_startup = bbr->r_ctl.rc_lost;
 		bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 				      bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 3);
 	}
 	if ((bbr->rc_loss_exit &&
 	     (bbr->r_ctl.rc_lost > bbr->r_ctl.rc_lost_at_startup) &&
 	     (bbr->r_ctl.rc_pkt_epoch_loss_rate > bbr_startup_loss_thresh)) &&
 	    ((bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_bbr_last_startup_epoch) >= BBR_STARTUP_EPOCHS)) {
 		/*
 		 * If we had no gain,  we had loss and that loss was above
 		 * our threshold, the rwnd is not constrained, and we have
 		 * had at least 3 packet epochs exit. Note that this is
 		 * switched off by sysctl. Google does not do this by the
 		 * way.
 		 */
 		if ((ctf_flight_size(bbr->rc_tp,
 			 (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes)) +
 		     (2 * max(bbr->r_ctl.rc_pace_max_segs, bbr->rc_tp->t_maxseg))) <= bbr->rc_tp->snd_wnd) {
 			do_exit = 1;
 			bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 					      bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 4);
 		} else {
 			/* Just record an updated loss value */
 			bbr->r_ctl.rc_lost_at_startup = bbr->r_ctl.rc_lost;
 			bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 					      bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 5);
 		}
 	} else
 		bbr->r_ctl.rc_lost_at_startup = bbr->r_ctl.rc_lost;
 	if (((bbr->r_ctl.rc_pkt_epoch - bbr->r_ctl.rc_bbr_last_startup_epoch) >= BBR_STARTUP_EPOCHS) ||
 	    do_exit) {
 		/* Return 1 to exit the startup state. */
 		return (1);
 	}
 	/* Stay in startup */
 	bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 			      bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 8);
 	return (0);
 }
 
 /*
  * Run the BBR state machine for the current state (rc_bbr_state).
  *
  * bbr       - per-connection BBR control block.
  * cts       - current time stamp handed in by the caller.
  * epoch     - only forwarded to bbr_state_startup().
  * pkt_epoch - only forwarded to bbr_state_startup().
  * losses    - only forwarded to bbr_set_probebw_gains() in PROBE_BW.
  *
  * Each branch below handles one state and may move the connection to
  * another one; where time-in-state is accounted, it is charged to the
  * state being left.
  */
 static void
 bbr_state_change(struct tcp_bbr *bbr, uint32_t cts, int32_t epoch, int32_t pkt_epoch, uint32_t losses)
 {
 	/*
 	 * A tick occurred in the rtt epoch do we need to do anything?
 	 */
 #ifdef BBR_INVARIANTS
 	if ((bbr->rc_bbr_state != BBR_STATE_STARTUP) &&
 	    (bbr->rc_bbr_state != BBR_STATE_DRAIN) &&
 	    (bbr->rc_bbr_state != BBR_STATE_PROBE_RTT) &&
 	    (bbr->rc_bbr_state != BBR_STATE_IDLE_EXIT) &&
 	    (bbr->rc_bbr_state != BBR_STATE_PROBE_BW)) {
 		/* Debug code? */
 		panic("Unknown BBR state %d?\n", bbr->rc_bbr_state);
 	}
 #endif
 	if (bbr->rc_bbr_state == BBR_STATE_STARTUP) {
 		/* Do we exit the startup state? */
 		if (bbr_state_startup(bbr, cts, epoch, pkt_epoch)) {
 			uint32_t time_in;
 
 			bbr_log_startup_event(bbr, cts, bbr->r_ctl.rc_bbr_last_startup_epoch,
 					      bbr->r_ctl.rc_lost_at_startup, bbr_start_exit, 6);
 			bbr->rc_filled_pipe = 1;
 			bbr->r_ctl.bbr_lost_at_state = bbr->r_ctl.rc_lost;
 			/* Charge the elapsed time to STARTUP before we leave it. */
 			if (SEQ_GT(cts, bbr->r_ctl.rc_bbr_state_time)) {
 				time_in = cts - bbr->r_ctl.rc_bbr_state_time;
 				counter_u64_add(bbr_state_time[bbr->rc_bbr_state], time_in);
 			} else
 				time_in = 0;
 			if (bbr->rc_no_pacing)
 				bbr->rc_no_pacing = 0;
 			bbr->r_ctl.rc_bbr_state_time = cts;
 			bbr->r_ctl.rc_bbr_hptsi_gain = bbr->r_ctl.rc_drain_pg;
 			bbr->rc_bbr_state = BBR_STATE_DRAIN;
 			bbr_set_state_target(bbr, __LINE__);
 			if ((bbr->rc_use_google == 0) &&
 			    bbr_slam_cwnd_in_main_drain) {
 				/* Here we don't have to worry about probe-rtt */
 				bbr->r_ctl.rc_saved_cwnd = bbr->rc_tp->snd_cwnd;
 				bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_target_at_state;
 				bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 			}
 			bbr->r_ctl.rc_bbr_cwnd_gain = bbr_high_gain;
 			bbr_log_type_statechange(bbr, cts, __LINE__);
 			if (ctf_flight_size(bbr->rc_tp,
 			        (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes)) <=
 			    bbr->r_ctl.rc_target_at_state) {
 				/*
 				 * Switch to probe_bw if we are already
 				 * there
 				 */
 				bbr->rc_bbr_substate = bbr_pick_probebw_substate(bbr, cts);
 				bbr_substate_change(bbr, cts, __LINE__, 0);
 				bbr->rc_bbr_state = BBR_STATE_PROBE_BW;
 				bbr_log_type_statechange(bbr, cts, __LINE__);
 			}
 		}
 	} else if (bbr->rc_bbr_state == BBR_STATE_IDLE_EXIT) {
 		uint32_t inflight;
 		struct tcpcb *tp;
 
 		tp = bbr->rc_tp;
 		inflight = ctf_flight_size(tp,
 			      (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 		if (inflight >= bbr->r_ctl.rc_target_at_state) {
 			/* We have reached a flight of the cwnd target */
 			bbr->rc_bbr_state = BBR_STATE_PROBE_BW;
 			bbr->r_ctl.rc_bbr_hptsi_gain = BBR_UNIT;
 			bbr->r_ctl.rc_bbr_cwnd_gain = BBR_UNIT;
 			bbr_set_state_target(bbr, __LINE__);
 			/*
 			 * Rig it so we don't do anything crazy and
 			 * start fresh with a new randomization.
 			 */
 			bbr->r_ctl.bbr_smallest_srtt_this_state = 0xffffffff;
 			bbr->rc_bbr_substate = BBR_SUB_LEVEL6;
 			bbr_substate_change(bbr, cts, __LINE__, 1);
 		}
 	} else if (bbr->rc_bbr_state == BBR_STATE_DRAIN) {
 		/* Has in-flight reached the bdp (or less)? */
 		uint32_t inflight;
 		struct tcpcb *tp;
 
 		tp = bbr->rc_tp;
 		inflight = ctf_flight_size(tp,
 			      (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 		if ((bbr->rc_use_google == 0) &&
 		    bbr_slam_cwnd_in_main_drain &&
 		    (bbr->rc_tp->snd_cwnd > bbr->r_ctl.rc_target_at_state)) {
 			/*
 			 * Here we don't have to worry about probe-rtt
 			 * re-slam it, but keep it slammed down.
 			 */
 			bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_target_at_state;
 			bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 		}
 		if (inflight <= bbr->r_ctl.rc_target_at_state) {
 			/* We have drained */
 			bbr->rc_bbr_state = BBR_STATE_PROBE_BW;
 			bbr->r_ctl.bbr_lost_at_state = bbr->r_ctl.rc_lost;
 			if (SEQ_GT(cts, bbr->r_ctl.rc_bbr_state_time)) {
 				uint32_t time_in;
 
 				time_in = cts - bbr->r_ctl.rc_bbr_state_time;
 				/*
 				 * rc_bbr_state has already been switched to
 				 * PROBE_BW above, so name DRAIN explicitly:
 				 * the elapsed time was spent draining, and
 				 * the STARTUP exit path likewise charges the
 				 * state being left.
 				 */
 				counter_u64_add(bbr_state_time[BBR_STATE_DRAIN], time_in);
 			}
 			if ((bbr->rc_use_google == 0) &&
 			    bbr_slam_cwnd_in_main_drain &&
 			    (tp->snd_cwnd < bbr->r_ctl.rc_saved_cwnd)) {
 				/* Restore the cwnd */
 				tp->snd_cwnd = bbr->r_ctl.rc_saved_cwnd;
 				bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 			}
 			/* Setup probe-rtt has being done now RRS-HERE */
 			bbr->r_ctl.rc_rtt_shrinks = cts;
 			bbr->r_ctl.last_in_probertt = cts;
 			bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_LEAVE_DRAIN, 0);
 			/* Randomly pick a sub-state */
 			bbr->rc_bbr_substate = bbr_pick_probebw_substate(bbr, cts);
 			bbr_substate_change(bbr, cts, __LINE__, 0);
 			bbr_log_type_statechange(bbr, cts, __LINE__);
 		}
 	} else if (bbr->rc_bbr_state == BBR_STATE_PROBE_RTT) {
 		uint32_t flight;
 
 		flight = ctf_flight_size(bbr->rc_tp,
 			     (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 		bbr->r_ctl.r_app_limited_until = (flight + bbr->r_ctl.rc_delivered);
 		if (((bbr->r_ctl.bbr_rttprobe_gain_val == 0) || bbr->rc_use_google) &&
 		    (bbr->rc_tp->snd_cwnd > bbr->r_ctl.rc_target_at_state)) {
 			/*
 			 * We must keep cwnd at the desired MSS.
 			 */
 			bbr->rc_tp->snd_cwnd = bbr_rtt_probe_cwndtarg * (bbr->rc_tp->t_maxseg - bbr->rc_last_options);
 			bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 		} else if ((bbr_prtt_slam_cwnd) &&
 			   (bbr->rc_tp->snd_cwnd > bbr->r_ctl.rc_target_at_state)) {
 			/* Re-slam it */
 			bbr->rc_tp->snd_cwnd = bbr->r_ctl.rc_target_at_state;
 			bbr_log_type_cwndupd(bbr, 0, 0, 0, 12, 0, 0, __LINE__);
 		}
 		/* rc_bbr_enters_probertt == 0 means the target is not yet reached. */
 		if (bbr->r_ctl.rc_bbr_enters_probertt == 0) {
 			/* Has outstanding reached our target? */
 			if (flight <= bbr->r_ctl.rc_target_at_state) {
 				bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_REACHTAR, 0);
 				bbr->r_ctl.rc_bbr_enters_probertt = cts;
 				/* If time is exactly 0, be 1usec off */
 				if (bbr->r_ctl.rc_bbr_enters_probertt == 0)
 					bbr->r_ctl.rc_bbr_enters_probertt = 1;
 				if (bbr->rc_use_google == 0) {
 					/*
 					 * Restore any lowering that has occurred to
 					 * reach here
 					 */
 					if (bbr->r_ctl.bbr_rttprobe_gain_val)
 						bbr->r_ctl.rc_bbr_hptsi_gain = bbr->r_ctl.bbr_rttprobe_gain_val;
 					else
 						bbr->r_ctl.rc_bbr_hptsi_gain = BBR_UNIT;
 				}
 			}
 			if ((bbr->r_ctl.rc_bbr_enters_probertt == 0) &&
 			    (bbr->rc_use_google == 0) &&
 			    bbr->r_ctl.bbr_rttprobe_gain_val &&
 			    (((cts - bbr->r_ctl.rc_probertt_srttchktim) > bbr_get_rtt(bbr, bbr_drain_rtt)) ||
 			     (flight >= bbr->r_ctl.flightsize_at_drain))) {
 				/*
 				 * We have dawdled with our current hptsi
 				 * gain an srtt and have still not made it
 				 * to target, or we have increased our flight.
 				 * Lets reduce the gain by xx%
 				 * flooring the reduce at DRAIN (based on
 				 * mul/div)
 				 */
 				int red;
 
 				bbr->r_ctl.flightsize_at_drain = flight;
 				bbr->r_ctl.rc_probertt_srttchktim = cts;
 				red = max((bbr->r_ctl.bbr_rttprobe_gain_val / 10), 1);
 				if ((bbr->r_ctl.rc_bbr_hptsi_gain - red) > max(bbr_drain_floor, 1)) {
 					/* Reduce our gain again */
 					bbr->r_ctl.rc_bbr_hptsi_gain -= red;
 					bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_SHRINK_PG, 0);
 				} else if (bbr->r_ctl.rc_bbr_hptsi_gain > max(bbr_drain_floor, 1)) {
 					/* one more chance before we give up */
 					bbr->r_ctl.rc_bbr_hptsi_gain = max(bbr_drain_floor, 1);
 					bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_SHRINK_PG_FINAL, 0);
 				} else {
 					/* At the very bottom */
 					bbr->r_ctl.rc_bbr_hptsi_gain = max((bbr_drain_floor-1), 1);
 				}
 			}
 		}
 		if (bbr->r_ctl.rc_bbr_enters_probertt &&
 		    (TSTMP_GT(cts, bbr->r_ctl.rc_bbr_enters_probertt)) &&
 		    ((cts - bbr->r_ctl.rc_bbr_enters_probertt) >= bbr_rtt_probe_time)) {
 			/* Time to exit probe RTT normally */
 			bbr_exit_probe_rtt(bbr->rc_tp, bbr, cts);
 		}
 	} else if (bbr->rc_bbr_state == BBR_STATE_PROBE_BW) {
 		if ((bbr->rc_tp->snd_una == bbr->rc_tp->snd_max) &&
 		    (bbr_calc_time(cts, bbr->r_ctl.rc_went_idle_time) >= bbr_rtt_probe_time)) {
 			/*
 			 * This qualifies as a RTT_PROBE session since we
 			 * drop the data outstanding to nothing and waited
 			 * more than bbr_rtt_probe_time.
 			 */
 			bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_WASIDLE, 0);
 			bbr_set_reduced_rtt(bbr, cts, __LINE__);
 		}
 		if (bbr_should_enter_probe_rtt(bbr, cts)) {
 			bbr_enter_probe_rtt(bbr, cts, __LINE__);
 		} else {
 			bbr_set_probebw_gains(bbr, cts, losses);
 		}
 	}
 }
 
 /*
  * Start a new rtt epoch if at least one BBR_RTT_PROP rtt has elapsed since
  * rc_rcv_epoch_start, then run the state machine. The epoch flag passed to
  * bbr_state_change() is 1 only when a new epoch was just started.
  */
 static void
 bbr_check_bbr_for_state(struct tcp_bbr *bbr, uint32_t cts, int32_t line, uint32_t losses)
 {
 	int32_t started_epoch;
 
 	started_epoch = ((cts - bbr->r_ctl.rc_rcv_epoch_start) >= bbr_get_rtt(bbr, BBR_RTT_PROP));
 	if (started_epoch) {
 		/* An epoch boundary was crossed; record it first. */
 		bbr_set_epoch(bbr, cts, line);
 	}
 	bbr_state_change(bbr, cts, started_epoch, bbr->rc_is_pkt_epoch_now, losses);
 }
 
 /*
  * Process one inbound TCP segment for a connection running the BBR stack.
  *
  * tp          - TCP control block; asserted to be write-locked on entry.
  * m, th       - the segment's mbuf and its TCP header.
  * drop_hdrlen, tlen, iptos - passed through to the per-state handler
  *               (bbr->r_substate) and, on the fallback path, to the default
  *               stack's tfb_tcp_do_segment.
  * nxt_pkt     - when zero, output and pacing-timer work is performed after
  *               the segment has been handled; when non-zero it is skipped.
  * tv          - not referenced in this function body.
  *
  * Returns the per-state handler's return value. The function also returns
  * 0 on the two early-drop paths (missing timestamp, SYN+FIN) and 1 on the
  * early exits (fallback to the default stack, reset in SYN_SENT, or
  * tcp_output() reporting < 0). Per the comment further down, a return of 1
  * means the tcb is unlocked and the tp is most likely gone.
  */
 static int
 bbr_do_segment_nounlock(struct tcpcb *tp, struct mbuf *m, struct tcphdr *th,
     int32_t drop_hdrlen, int32_t tlen, uint8_t iptos, int32_t nxt_pkt,
     struct timeval *tv)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 	struct socket *so = tptosocket(tp);
 	int32_t thflags, retval;
 	uint32_t cts, lcts;
 	uint32_t tiwin;
 	struct tcpopt to;
 	struct tcp_bbr *bbr;
 	struct bbr_sendmap *rsm;
 	struct timeval ltv;
 	int32_t did_out = 0;
 	uint16_t nsegs;
 	int32_t prev_state;
 	uint32_t lost;
 
 	nsegs = max(1, m->m_pkthdr.lro_nsegs);
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	/* add in our stats */
 	kern_prefetch(bbr, &prev_state);
 	prev_state = 0;
 	thflags = tcp_get_flags(th);
 	/*
 	 * If this is either a state-changing packet or current state isn't
 	 * established, we require a write lock on tcbinfo.  Otherwise, we
 	 * allow the tcbinfo to be either locked or unlocked, as the
 	 * caller may have unnecessarily acquired a write lock due to a
 	 * race.
 	 */
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	KASSERT(tp->t_state > TCPS_LISTEN, ("%s: TCPS_LISTEN",
 	    __func__));
 	KASSERT(tp->t_state != TCPS_TIME_WAIT, ("%s: TCPS_TIME_WAIT",
 	    __func__));
 
 	tp->t_rcvtime = ticks;
 	/*
 	 * Unscale the window into a 32-bit value. For the SYN_SENT state
 	 * the scale is zero.
 	 */
 	tiwin = th->th_win << tp->snd_scale;
 #ifdef STATS
 	stats_voi_update_abs_ulong(tp->t_stats, VOI_TCP_FRWIN, tiwin);
 #endif
 
 	/*
 	 * Pick the arrival time (cts). Note that lcts is only assigned in
 	 * the last branch here; for the two timestamped cases it is filled
 	 * in later, once the hardware delay is computed.
 	 */
 	if (m->m_flags & M_TSTMP) {
 		/* Prefer the hardware timestamp if present */
 		struct timespec ts;
 
 		mbuf_tstmp2timespec(m, &ts);
 		bbr->rc_tv.tv_sec = ts.tv_sec;
 		bbr->rc_tv.tv_usec = ts.tv_nsec / 1000;
 		bbr->r_ctl.rc_rcvtime = cts = tcp_tv_to_usectick(&bbr->rc_tv);
 	} else if (m->m_flags & M_TSTMP_LRO) {
 		/* Next the arrival timestamp */
 		struct timespec ts;
 
 		mbuf_tstmp2timespec(m, &ts);
 		bbr->rc_tv.tv_sec = ts.tv_sec;
 		bbr->rc_tv.tv_usec = ts.tv_nsec / 1000;
 		bbr->r_ctl.rc_rcvtime = cts = tcp_tv_to_usectick(&bbr->rc_tv);
 	} else {
 		/*
 		 * Ok just get the current time.
 		 */
 		bbr->r_ctl.rc_rcvtime = lcts = cts = tcp_get_usecs(&bbr->rc_tv);
 	}
 	/*
 	 * Parse options on any incoming segment.
 	 */
 	tcp_dooptions(&to, (u_char *)(th + 1),
 	    (th->th_off << 2) - sizeof(struct tcphdr),
 	    (thflags & TH_SYN) ? TO_SYN : 0);
 
 	/*
 	 * If timestamps were negotiated during SYN/ACK and a
 	 * segment without a timestamp is received, silently drop
 	 * the segment, unless it is a RST segment or missing timestamps are
 	 * tolerated.
 	 * See section 3.2 of RFC 7323.
 	 */
 	if ((tp->t_flags & TF_RCVD_TSTMP) && !(to.to_flags & TOF_TS) &&
 	    ((thflags & TH_RST) == 0) && (V_tcp_tolerate_missing_ts == 0)) {
 		retval = 0;
 		m_freem(m);
 		/* The label sits inside the "retval == 0" block near the end. */
 		goto done_with_input;
 	}
 	/*
 	 * If echoed timestamp is later than the current time, fall back to
 	 * non RFC1323 RTT calculation.  Normalize timestamp if syncookies
 	 * were used when this connection was established.
 	 */
 	if ((to.to_flags & TOF_TS) && (to.to_tsecr != 0)) {
 		to.to_tsecr -= tp->ts_offset;
 		if (TSTMP_GT(to.to_tsecr, tcp_tv_to_mssectick(&bbr->rc_tv)))
 			to.to_tsecr = 0;
 	}
 	/*
 	 * If its the first time in we need to take care of options and
 	 * verify we can do SACK for rack!
 	 */
 	if (bbr->r_state == 0) {
 		/*
 		 * Process options only when we get SYN/ACK back. The SYN
 		 * case for incoming connections is handled in tcp_syncache.
 		 * According to RFC1323 the window field in a SYN (i.e., a
 		 * <SYN> or <SYN,ACK>) segment itself is never scaled. XXX
 		 * this is traditional behavior, may need to be cleaned up.
 		 */
 		if (bbr->rc_inp == NULL) {
 			bbr->rc_inp = inp;
 		}
 		/*
 		 * We need to init rc_inp here since its not init'd when
 		 * bbr_init is called
 		 */
 		if (tp->t_state == TCPS_SYN_SENT && (thflags & TH_SYN)) {
 			if ((to.to_flags & TOF_SCALE) &&
 			    (tp->t_flags & TF_REQ_SCALE)) {
 				tp->t_flags |= TF_RCVD_SCALE;
 				tp->snd_scale = to.to_wscale;
 			} else
 				tp->t_flags &= ~TF_REQ_SCALE;
 			/*
 			 * Initial send window.  It will be updated with the
 			 * next incoming segment to the scaled value.
 			 */
 			tp->snd_wnd = th->th_win;
 			if ((to.to_flags & TOF_TS) &&
 			    (tp->t_flags & TF_REQ_TSTMP)) {
 				tp->t_flags |= TF_RCVD_TSTMP;
 				tp->ts_recent = to.to_tsval;
 				tp->ts_recent_age = tcp_tv_to_mssectick(&bbr->rc_tv);
 			} else
 			    tp->t_flags &= ~TF_REQ_TSTMP;
 			if (to.to_flags & TOF_MSS)
 				tcp_mss(tp, to.to_mss);
 			if ((tp->t_flags & TF_SACK_PERMIT) &&
 			    (to.to_flags & TOF_SACKPERM) == 0)
 				tp->t_flags &= ~TF_SACK_PERMIT;
 			if (IS_FASTOPEN(tp->t_flags)) {
 				if (to.to_flags & TOF_FASTOPEN) {
 					uint16_t mss;
 
 					/* Use the peer's MSS option, else the protocol default. */
 					if (to.to_flags & TOF_MSS)
 						mss = to.to_mss;
 					else
 						if ((inp->inp_vflag & INP_IPV6) != 0)
 							mss = TCP6_MSS;
 						else
 							mss = TCP_MSS;
 					tcp_fastopen_update_cache(tp, mss,
 					    to.to_tfo_len, to.to_tfo_cookie);
 				} else
 					tcp_fastopen_disable_path(tp);
 			}
 		}
 		/*
 		 * At this point we are at the initial call. Here we decide
 		 * if we are doing RACK or not. We do this by seeing if
 		 * TF_SACK_PERMIT is set, if not rack is *not* possible and
 		 * we switch to the default code.
 		 */
 		if ((tp->t_flags & TF_SACK_PERMIT) == 0) {
 			/* Bail */
 			tcp_switch_back_to_default(tp);
 			/* tp->t_fb is re-read here, after the switch call above. */
 			(*tp->t_fb->tfb_tcp_do_segment)(tp, m, th, drop_hdrlen,
 			    tlen, iptos);
 			return (1);
 		}
 		/* Set the flag */
 		bbr->r_is_v6 = (inp->inp_vflag & INP_IPV6) != 0;
 		tcp_set_hpts(tp);
 		sack_filter_clear(&bbr->r_ctl.bbr_sf, th->th_ack);
 	}
 	if (thflags & TH_ACK) {
 		/* Track ack types */
 		if (to.to_flags & TOF_SACK)
 			BBR_STAT_INC(bbr_acks_with_sacks);
 		else
 			BBR_STAT_INC(bbr_plain_acks);
 	}
 	/*
 	 * This is the one exception case where we set the rack state
 	 * always. All other times (timers etc) we must have a rack-state
 	 * set (so we assure we have done the checks above for SACK).
 	 */
 	if (thflags & TH_FIN)
 		tcp_log_end_status(tp, TCP_EI_STATUS_CLIENT_FIN);
 	if (bbr->r_state != tp->t_state)
 		bbr_set_state(tp, bbr, tiwin);
 
 	if (SEQ_GT(th->th_ack, tp->snd_una) && (rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map)) != NULL)
 		kern_prefetch(rsm, &prev_state);
 	prev_state = bbr->r_state;
 	bbr->rc_ack_was_delayed = 0;
 	/* Snapshot the loss counter so the delta can be passed on below. */
 	lost = bbr->r_ctl.rc_lost;
 	bbr->rc_is_pkt_epoch_now = 0;
 	if (m->m_flags & (M_TSTMP|M_TSTMP_LRO)) {
 		/* Get the real time into lcts and figure the real delay */
 		lcts = tcp_get_usecs(&ltv);
 		if (TSTMP_GT(lcts, cts)) {
 			bbr->r_ctl.rc_ack_hdwr_delay = lcts - cts;
 			bbr->rc_ack_was_delayed = 1;
 			if (TSTMP_GT(bbr->r_ctl.rc_ack_hdwr_delay,
 				     bbr->r_ctl.highest_hdwr_delay))
 				bbr->r_ctl.highest_hdwr_delay = bbr->r_ctl.rc_ack_hdwr_delay;
 		} else {
 			bbr->r_ctl.rc_ack_hdwr_delay = 0;
 			bbr->rc_ack_was_delayed = 0;
 		}
 	} else {
 		bbr->r_ctl.rc_ack_hdwr_delay = 0;
 		bbr->rc_ack_was_delayed = 0;
 	}
 	bbr_log_ack_event(bbr, th, &to, tlen, nsegs, cts, nxt_pkt, m);
 	/* Drop segments carrying both SYN and FIN when V_drop_synfin is set. */
 	if ((thflags & TH_SYN) && (thflags & TH_FIN) && V_drop_synfin) {
 		retval = 0;
 		m_freem(m);
 		goto done_with_input;
 	}
 	/*
 	 * If a segment with the ACK-bit set arrives in the SYN-SENT state
 	 * check SEQ.ACK first as described on page 66 of RFC 793, section 3.9.
 	 */
 	if ((tp->t_state == TCPS_SYN_SENT) && (thflags & TH_ACK) &&
 	    (SEQ_LEQ(th->th_ack, tp->iss) || SEQ_GT(th->th_ack, tp->snd_max))) {
 		tcp_log_end_status(tp, TCP_EI_STATUS_RST_IN_FRONT);
 		ctf_do_dropwithreset_conn(m, tp, th, BANDLIM_RST_OPENPORT, tlen);
 		return (1);
 	}
 	/* Remember the largest peer window seen so far. */
 	if (tiwin > bbr->r_ctl.rc_high_rwnd)
 		bbr->r_ctl.rc_high_rwnd = tiwin;
 	bbr->r_ctl.rc_flight_at_input = ctf_flight_size(tp,
 					    (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 	bbr->rtt_valid = 0;
 	if (to.to_flags & TOF_TS) {
 		bbr->rc_ts_valid = 1;
 		bbr->r_ctl.last_inbound_ts = to.to_tsval;
 	} else {
 		bbr->rc_ts_valid = 0;
 		bbr->r_ctl.last_inbound_ts = 0;
 	}
 	/* Dispatch to the handler installed for the current TCP state. */
 	retval = (*bbr->r_substate) (m, th, so,
 	    tp, &to, drop_hdrlen,
 	    tlen, tiwin, thflags, nxt_pkt, iptos);
 	if (nxt_pkt == 0)
 		BBR_STAT_INC(bbr_rlock_left_ret0);
 	else
 		BBR_STAT_INC(bbr_rlock_left_ret1);
 	if (retval == 0) {
 		/*
 		 * If retval is 1 the tcb is unlocked and most likely the tp
 		 * is gone.
 		 */
 		INP_WLOCK_ASSERT(inp);
 		tcp_bbr_xmit_timer_commit(bbr, tp, cts);
 		if (bbr->rc_is_pkt_epoch_now)
 			bbr_set_pktepoch(bbr, cts, __LINE__);
 		/* Run the BBR state machine with the losses seen by this segment. */
 		bbr_check_bbr_for_state(bbr, cts, __LINE__, (bbr->r_ctl.rc_lost - lost));
 		if (nxt_pkt == 0) {
 			if (bbr->r_wanted_output != 0) {
 				bbr->rc_output_starts_timer = 0;
 				did_out = 1;
 				if (tcp_output(tp) < 0)
 					return (1);
 			} else
 				bbr_start_hpts_timer(bbr, tp, cts, 6, 0, 0);
 		}
 		if ((nxt_pkt == 0) &&
 		    ((bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK) == 0) &&
 		    (SEQ_GT(tp->snd_max, tp->snd_una) ||
 		     (tp->t_flags & TF_DELACK) ||
 		     ((V_tcp_always_keepalive || bbr->rc_inp->inp_socket->so_options & SO_KEEPALIVE) &&
 		      (tp->t_state <= TCPS_CLOSING)))) {
 			/*
 			 * We could not send (probably in the hpts but
 			 * stopped the timer)?
 			 */
 			if ((tp->snd_max == tp->snd_una) &&
 			    ((tp->t_flags & TF_DELACK) == 0) &&
 			    (tcp_in_hpts(tp)) &&
 			    (bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT)) {
 				/*
 				 * keep alive not needed if we are hptsi
 				 * output yet
 				 */
 				;
 			} else {
 				if (tcp_in_hpts(tp)) {
 					tcp_hpts_remove(tp);
 					if ((bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT) &&
 					    (TSTMP_GT(lcts, bbr->rc_pacer_started))) {
 						uint32_t del;
 
 						/* Time already spent since the pacer was started. */
 						del = lcts - bbr->rc_pacer_started;
 						if (bbr->r_ctl.rc_last_delay_val > del) {
 							BBR_STAT_INC(bbr_force_timer_start);
 							bbr->r_ctl.rc_last_delay_val -= del;
 							bbr->rc_pacer_started = lcts;
 						} else {
 							/* We are late */
 							bbr->r_ctl.rc_last_delay_val = 0;
 							BBR_STAT_INC(bbr_force_output);
 							if (tcp_output(tp) < 0)
 								return (1);
 						}
 					}
 				}
 				bbr_start_hpts_timer(bbr, tp, cts, 8, bbr->r_ctl.rc_last_delay_val,
 				    0);
 			}
 		} else if ((bbr->rc_output_starts_timer == 0) && (nxt_pkt == 0)) {
 			/* Do we have the correct timer running? */
 			bbr_timer_audit(tp, bbr, lcts, &so->so_snd);
 		}
 		/* Clear the flag, it may have been cleared by output but we may not have  */
 		if ((nxt_pkt == 0) && (tp->t_flags2 & TF2_HPTS_CALLS))
 			tp->t_flags2 &= ~TF2_HPTS_CALLS;
 		/* Do we have a new state */
 		if (bbr->r_state != tp->t_state)
 			bbr_set_state(tp, bbr, tiwin);
 		/*
 		 * The early-drop paths above jump here after setting retval to
 		 * 0 and freeing the mbuf; they skip everything else in this
 		 * block.
 		 */
 done_with_input:
 		bbr_log_doseg_done(bbr, cts, nxt_pkt, did_out);
 		if (did_out)
 			bbr->r_wanted_output = 0;
 	}
 	return (retval);
 }
 
 /*
  * Entry point for a single inbound segment. Any segments already queued on
  * the tcpcb are processed first; if that processing reports non-zero the new
  * mbuf is freed and we return without touching the connection further.
  * Otherwise the segment is handed to bbr_do_segment_nounlock() and the inp
  * write lock is released only when that call returns 0.
  */
 static void
 bbr_do_segment(struct tcpcb *tp, struct mbuf *m, struct tcphdr *th,
     int32_t drop_hdrlen, int32_t tlen, uint8_t iptos)
 {
 	struct timeval tv;
 
 	/* Deal with any older packets before this one. */
 	if (!STAILQ_EMPTY(&tp->t_inqueue) && ctf_do_queued_segments(tp, 1)) {
 		m_freem(m);
 		return;
 	}
 	if ((m->m_flags & M_TSTMP_LRO) == 0) {
 		/* No LRO arrival stamp on the mbuf, fall back to "now". */
 		tcp_get_usecs(&tv);
 	} else {
 		mbuf_tstmp2timeval(m, &tv);
 	}
 	if (bbr_do_segment_nounlock(tp, m, th, drop_hdrlen, tlen, iptos,
 	    0, &tv) != 0) {
 		/* Non-zero: do not unlock here. */
 		return;
 	}
 	INP_WUNLOCK(tptoinpcb(tp));
 }
 
 /*
  * Return how much data can be sent without violating the
  * cwnd or rwnd.
  */
 
 /*
  * Compute how many bytes may be sent given the send window (sendwin), the
  * peer's receive window (tp->snd_wnd) and what the socket buffer holds
  * (avail) past sb_offset. Returns 0 when either window is already full.
  * The cts argument is not referenced.
  */
 static inline uint32_t
 bbr_what_can_we_send(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t sendwin,
     uint32_t avail, int32_t sb_offset, uint32_t cts)
 {
 	uint32_t in_flight;
 	uint32_t room;
 
 	/* We never want to go over our peers rcv-window */
 	if (ctf_outstanding(tp) >= tp->snd_wnd)
 		return (0);
 
 	in_flight = ctf_flight_size(tp, (bbr->r_ctl.rc_sacked + bbr->r_ctl.rc_lost_bytes));
 	/*
 	 * Already at (or over) what sendwin permits; the rwnd case was
 	 * caught by the check above.
 	 */
 	if (in_flight >= sendwin)
 		return (0);
 
 	room = sendwin - in_flight;
 	/* Trim so that we stay inside the peer's receive window. */
 	if ((room + ctf_outstanding(tp)) > tp->snd_wnd)
 		room = tp->snd_wnd - ctf_outstanding(tp);
 	/* Trim to what the socket buffer actually holds. */
 	if ((room + sb_offset) > avail)
 		room = avail - sb_offset;
 	return (room);
 }
 
 static inline void
 bbr_do_send_accounting(struct tcpcb *tp, struct tcp_bbr *bbr, struct bbr_sendmap *rsm, int32_t len, int32_t error)
 {
 	if (error) {
 		return;
 	}
 	if (rsm) {
 		if (rsm->r_flags & BBR_TLP) {
 			/*
 			 * TLP should not count in retran count, but in its
 			 * own bin
 			 */
 			KMOD_TCPSTAT_INC(tcps_tlpresends);
 			KMOD_TCPSTAT_ADD(tcps_tlpresend_bytes, len);
 		} else {
 			/* Retransmit */
 			tp->t_sndrexmitpack++;
 			KMOD_TCPSTAT_INC(tcps_sndrexmitpack);
 			KMOD_TCPSTAT_ADD(tcps_sndrexmitbyte, len);
 #ifdef STATS
 			stats_voi_update_abs_u32(tp->t_stats, VOI_TCP_RETXPB,
 			    len);
 #endif
 		}
 		/*
 		 * Logs in 0 - 8, 8 is all non probe_bw states 0-7 is
 		 * sub-state
 		 */
 		counter_u64_add(bbr_state_lost[rsm->r_bbr_state], len);
 		if (bbr->rc_bbr_state != BBR_STATE_PROBE_BW) {
 			/* Non probe_bw log in 1, 2, or 4. */
 			counter_u64_add(bbr_state_resend[bbr->rc_bbr_state], len);
 		} else {
 			/*
 			 * Log our probe state 3, and log also 5-13 to show
 			 * us the recovery sub-state for the send. This
 			 * means that 3 == (5+6+7+8+9+10+11+12+13)
 			 */
 			counter_u64_add(bbr_state_resend[BBR_STATE_PROBE_BW], len);
 			counter_u64_add(bbr_state_resend[(bbr_state_val(bbr) + 5)], len);
 		}
 		/* Place in both 16's the totals of retransmitted */
 		counter_u64_add(bbr_state_lost[16], len);
 		counter_u64_add(bbr_state_resend[16], len);
 		/* Place in 17's the total sent */
 		counter_u64_add(bbr_state_resend[17], len);
 		counter_u64_add(bbr_state_lost[17], len);
 
 	} else {
 		/* New sends */
 		KMOD_TCPSTAT_INC(tcps_sndpack);
 		KMOD_TCPSTAT_ADD(tcps_sndbyte, len);
 		/* Place in 17's the total sent */
 		counter_u64_add(bbr_state_resend[17], len);
 		counter_u64_add(bbr_state_lost[17], len);
 #ifdef STATS
 		stats_voi_update_abs_u64(tp->t_stats, VOI_TCP_TXPB,
 		    len);
 #endif
 	}
 }
 
 /*
  * Cap snd_cwnd at bbr_target_cwnd_mult_limit times (target cwnd for the
  * current bandwidth estimate + outstanding data). Only applies once the
  * pipe has been filled, the multiplier is non-zero and the google mode is
  * off. The in_level argument is not referenced.
  */
 static void
 bbr_cwnd_limiting(struct tcpcb *tp, struct tcp_bbr *bbr, uint32_t in_level)
 {
 	uint32_t ceiling;
 
 	if (!bbr->rc_filled_pipe || !bbr_target_cwnd_mult_limit || (bbr->rc_use_google != 0))
 		return;
 
 	/* Target from the current b/w estimate, plus what is outstanding. */
 	ceiling = bbr_get_target_cwnd(bbr, bbr_get_bw(bbr), BBR_UNIT);
 	ceiling += ctf_outstanding(tp);
 	ceiling *= bbr_target_cwnd_mult_limit;
 	if (tp->snd_cwnd > ceiling)
 		tp->snd_cwnd = ceiling;
 	/* Logged whether or not the cwnd was actually lowered. */
 	bbr_log_type_cwndupd(bbr, 0, 0, 0, 10, 0, 0, __LINE__);
 }
 
 /*
  * Decide whether a window update should be sent. Returns 1 when it should
  * and 0 otherwise.
  *
  * recwin is the receive window we could advertise and maxseg the segment
  * size used for the "at least two segments" test.
  */
 static int
 bbr_window_update_needed(struct tcpcb *tp, struct socket *so, uint32_t recwin, int32_t maxseg)
 {
 	/* Window currently advertised beyond rcv_nxt (0 if none). */
 	int32_t oldwin = 0;
 	/* How far the advertised window could grow. */
 	int32_t adv = recwin;
 
 	if (SEQ_GT(tp->rcv_adv, tp->rcv_nxt)) {
 		oldwin = (tp->rcv_adv - tp->rcv_nxt);
 		/* No growth possible unless recwin exceeds the old window. */
 		adv = (adv > oldwin) ? (adv - oldwin) : 0;
 	}
 
 	/*
 	 * Once scaled, a window that is no larger than the old one is not
 	 * worth an update.
 	 */
 	if (oldwin >> tp->rcv_scale >= (adv + oldwin) >> tp->rcv_scale)
 		return (0);
 
 	if (adv >= (2 * maxseg)) {
 		if (adv >= (so->so_rcv.sb_hiwat / 4) ||
 		    recwin <= (so->so_rcv.sb_hiwat / 8) ||
 		    so->so_rcv.sb_hiwat <= 8 * maxseg)
 			return (1);
 	}
 	/* Otherwise update only if we can open at least half the buffer. */
 	return ((2 * adv >= (int32_t) so->so_rcv.sb_hiwat) ? 1 : 0);
 }
 
 /*
  * Return 0 on success and an errno on failure to send.
  * Note that a 0 return does not necessarily mean we sent
  * anything if the TCB was on the hpts. A non-zero return
  * does indicate the error we got from ip[6]_output.
  */
 static int
 bbr_output_wtime(struct tcpcb *tp, const struct timeval *tv)
 {
 	struct socket *so;
 	int32_t len;
 	uint32_t cts;
 	uint32_t recwin, sendwin;
 	int32_t sb_offset;
 	int32_t flags, abandon, error = 0;
 	struct tcp_log_buffer *lgb = NULL;
 	struct mbuf *m;
 	struct mbuf *mb;
 	uint32_t if_hw_tsomaxsegcount = 0;
 	uint32_t if_hw_tsomaxsegsize = 0;
 	uint32_t if_hw_tsomax = 0;
 	struct ip *ip = NULL;
 	struct tcp_bbr *bbr;
 	struct tcphdr *th;
 	struct udphdr *udp = NULL;
 	u_char opt[TCP_MAXOLEN];
 	unsigned ipoptlen, optlen, hdrlen;
 	unsigned ulen;
 	uint32_t bbr_seq;
 	uint32_t delay_calc=0;
 	uint8_t doing_tlp = 0;
 	uint8_t local_options;
 #ifdef BBR_INVARIANTS
 	uint8_t doing_retran_from = 0;
 	uint8_t picked_up_retran = 0;
 #endif
 	uint8_t wanted_cookie = 0;
 	uint8_t more_to_rxt=0;
 	int32_t prefetch_so_done = 0;
 	int32_t prefetch_rsm = 0;
 	uint32_t tot_len = 0;
 	uint32_t maxseg, pace_max_segs, p_maxseg;
 	int32_t csum_flags = 0;
  	int32_t hw_tls;
 #if defined(IPSEC) || defined(IPSEC_SUPPORT)
 	unsigned ipsec_optlen = 0;
 
 #endif
 	volatile int32_t sack_rxmit;
 	struct bbr_sendmap *rsm = NULL;
 	int32_t tso, mtu;
 	struct tcpopt to;
 	int32_t slot = 0;
 	struct inpcb *inp;
 	struct sockbuf *sb;
 	bool hpts_calling;
 #ifdef INET6
 	struct ip6_hdr *ip6 = NULL;
 	int32_t isipv6;
 #endif
 	uint8_t app_limited = BBR_JR_SENT_DATA;
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	/* We take a cache hit here */
 	memcpy(&bbr->rc_tv, tv, sizeof(struct timeval));
 	cts = tcp_tv_to_usectick(&bbr->rc_tv);
 	inp = bbr->rc_inp;
 	hpts_calling = !!(tp->t_flags2 & TF2_HPTS_CALLS);
 	tp->t_flags2 &= ~TF2_HPTS_CALLS;
 	so = inp->inp_socket;
 	sb = &so->so_snd;
 	if (tp->t_nic_ktls_xmit)
  		hw_tls = 1;
  	else
  		hw_tls = 0;
 	kern_prefetch(sb, &maxseg);
 	maxseg = tp->t_maxseg - bbr->rc_last_options;
 	if (bbr_minseg(bbr) < maxseg) {
 		tcp_bbr_tso_size_check(bbr, cts);
 	}
 	/* Remove any flags that indicate we are pacing on the inp  */
 	pace_max_segs = bbr->r_ctl.rc_pace_max_segs;
 	p_maxseg = min(maxseg, pace_max_segs);
 	INP_WLOCK_ASSERT(inp);
 #ifdef TCP_OFFLOAD
 	if (tp->t_flags & TF_TOE)
 		return (tcp_offload_output(tp));
 #endif
 
 #ifdef INET6
 	if (bbr->r_state) {
 		/* Use the cache line loaded if possible */
 		isipv6 = bbr->r_is_v6;
 	} else {
 		isipv6 = (inp->inp_vflag & INP_IPV6) != 0;
 	}
 #endif
 	if (((bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT) == 0) &&
 	    tcp_in_hpts(tp)) {
 		/*
 		 * We are on the hpts for some timer but not hptsi output.
 		 * Possibly remove from the hpts so we can send/recv etc.
 		 */
 		if ((tp->t_flags & TF_ACKNOW) == 0) {
 			/*
 			 * No immediate demand right now to send an ack, but
 			 * the user may have read, making room for new data
 			 * (a window update). If so we may want to cancel
 			 * whatever timer is running (KEEP/DEL-ACK?) and
 			 * continue to send out a window update. Or we may
 			 * have gotten more data into the socket buffer to
 			 * send.
 			 */
 			recwin = lmin(lmax(sbspace(&so->so_rcv), 0),
 				      (long)TCP_MAXWIN << tp->rcv_scale);
 			if ((bbr_window_update_needed(tp, so, recwin, maxseg) == 0) &&
 			    ((tcp_outflags[tp->t_state] & TH_RST) == 0) &&
 			    ((sbavail(sb) + ((tcp_outflags[tp->t_state] & TH_FIN) ? 1 : 0)) <=
 			    (tp->snd_max - tp->snd_una))) {
 				/*
 				 * Nothing new to send and no window update
 				 * is needed to send. Lets just return and
 				 * let the timer-run off.
 				 */
 				return (0);
 			}
 		}
 		tcp_hpts_remove(tp);
 		bbr_timer_cancel(bbr, __LINE__, cts);
 	}
 	if (bbr->r_ctl.rc_last_delay_val) {
 		/* Calculate a rough delay for early escape to sending  */
 		if (SEQ_GT(cts, bbr->rc_pacer_started))
 			delay_calc = cts - bbr->rc_pacer_started;
 		if (delay_calc >= bbr->r_ctl.rc_last_delay_val)
 			delay_calc -= bbr->r_ctl.rc_last_delay_val;
 		else
 			delay_calc = 0;
 	}
 	/* Mark that we have called bbr_output(). */
 	if ((bbr->r_timer_override) ||
 	    (tp->t_state < TCPS_ESTABLISHED)) {
 		/* Timeouts or early states are exempt */
 		if (tcp_in_hpts(tp))
 			tcp_hpts_remove(tp);
 	} else if (tcp_in_hpts(tp)) {
 		if ((bbr->r_ctl.rc_last_delay_val) &&
 		    (bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT) &&
 		    delay_calc) {
 			/*
 			 * We were being paced for output and the delay has
 			 * already exceeded when we were supposed to be
 			 * called, lets go ahead and pull out of the hpts
 			 * and call output.
 			 */
 			counter_u64_add(bbr_out_size[TCP_MSS_ACCT_LATE], 1);
 			bbr->r_ctl.rc_last_delay_val = 0;
 			tcp_hpts_remove(tp);
 		} else if (tp->t_state == TCPS_CLOSED) {
 			bbr->r_ctl.rc_last_delay_val = 0;
 			tcp_hpts_remove(tp);
 		} else {
 			/*
 			 * On the hpts, you shall not pass! even if ACKNOW
 			 * is on, we will when the hpts fires, unless of
 			 * course we are overdue.
 			 */
 			counter_u64_add(bbr_out_size[TCP_MSS_ACCT_INPACE], 1);
 			return (0);
 		}
 	}
 	bbr->rc_cwnd_limited = 0;
 	if (bbr->r_ctl.rc_last_delay_val) {
 		/* recalculate the real delay and deal with over/under  */
 		if (SEQ_GT(cts, bbr->rc_pacer_started))
 			delay_calc = cts - bbr->rc_pacer_started;
 		else
 			delay_calc = 0;
 		if (delay_calc >= bbr->r_ctl.rc_last_delay_val)
 			/* Setup the delay which will be added in */
 			delay_calc -= bbr->r_ctl.rc_last_delay_val;
 		else {
 			/*
 			 * We are early setup to adjust
 			 * our slot time.
 			 */
 			uint64_t merged_val;
 
 			bbr->r_ctl.rc_agg_early += (bbr->r_ctl.rc_last_delay_val - delay_calc);
 			bbr->r_agg_early_set = 1;
 			if (bbr->r_ctl.rc_hptsi_agg_delay) {
 				if (bbr->r_ctl.rc_hptsi_agg_delay >= bbr->r_ctl.rc_agg_early) {
 					/* Nope our previous late cancels out the early */
 					bbr->r_ctl.rc_hptsi_agg_delay -= bbr->r_ctl.rc_agg_early;
 					bbr->r_agg_early_set = 0;
 					bbr->r_ctl.rc_agg_early = 0;
 				} else {
 					bbr->r_ctl.rc_agg_early -= bbr->r_ctl.rc_hptsi_agg_delay;
 					bbr->r_ctl.rc_hptsi_agg_delay = 0;
 				}
 			}
 			merged_val = bbr->rc_pacer_started;
 			merged_val <<= 32;
 			merged_val |= bbr->r_ctl.rc_last_delay_val;
 			bbr_log_pacing_delay_calc(bbr, hpts_calling,
 						 bbr->r_ctl.rc_agg_early, cts, delay_calc, merged_val,
 						 bbr->r_agg_early_set, 3);
 			bbr->r_ctl.rc_last_delay_val = 0;
 			BBR_STAT_INC(bbr_early);
 			delay_calc = 0;
 		}
 	} else {
 		/* We were not delayed due to hptsi */
 		if (bbr->r_agg_early_set)
 			bbr->r_ctl.rc_agg_early = 0;
 		bbr->r_agg_early_set = 0;
 		delay_calc = 0;
 	}
 	if (delay_calc) {
 		/*
 		 * We had a hptsi delay which means we are falling behind on
 		 * sending at the expected rate. Calculate an extra amount
 		 * of data we can send, if any, to put us back on track.
 		 */
 		if ((bbr->r_ctl.rc_hptsi_agg_delay + delay_calc) < bbr->r_ctl.rc_hptsi_agg_delay)
 			bbr->r_ctl.rc_hptsi_agg_delay = 0xffffffff;
 		else
 			bbr->r_ctl.rc_hptsi_agg_delay += delay_calc;
 	}
 	sendwin = min(tp->snd_wnd, tp->snd_cwnd);
 	if ((tp->snd_una == tp->snd_max) &&
 	    (bbr->rc_bbr_state != BBR_STATE_IDLE_EXIT) &&
 	    (sbavail(sb))) {
 		/*
 		 * Ok we have been idle with nothing outstanding
 		 * we possibly need to start fresh with either a new
 		 * suite of states or a fast-ramp up.
 		 */
 		bbr_restart_after_idle(bbr,
 				       cts, bbr_calc_time(cts, bbr->r_ctl.rc_went_idle_time));
 	}
 	/*
 	 * Now was there a hptsi delay where we are behind? We only count
 	 * being behind if: a) We are not in recovery. b) There was a delay.
 	 * <and> c) We had room to send something.
 	 *
 	 */
 	if (bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK) {
 		int retval;
 
 		retval = bbr_process_timers(tp, bbr, cts, hpts_calling);
 		if (retval != 0) {
 			counter_u64_add(bbr_out_size[TCP_MSS_ACCT_ATIMER], 1);
 			/*
 			 * If timers want tcp_drop(), then pass error out,
 			 * otherwise suppress it.
 			 */
 			return (retval < 0 ? retval : 0);
 		}
 	}
 	bbr->rc_tp->t_flags2 &= ~TF2_MBUF_QUEUE_READY;
 	if (hpts_calling &&
 	    (bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT)) {
 		bbr->r_ctl.rc_last_delay_val = 0;
 	}
 	bbr->r_timer_override = 0;
 	bbr->r_wanted_output = 0;
 	/*
 	 * For TFO connections in SYN_RECEIVED, only allow the initial
 	 * SYN|ACK and those sent by the retransmit timer.
 	 */
 	if (IS_FASTOPEN(tp->t_flags) &&
 	    ((tp->t_state == TCPS_SYN_RECEIVED) ||
 	     (tp->t_state == TCPS_SYN_SENT)) &&
 	    SEQ_GT(tp->snd_max, tp->snd_una) &&	/* initial SYN or SYN|ACK sent */
 	    (tp->t_rxtshift == 0)) {	/* not a retransmit */
 		len = 0;
 		goto just_return_nolock;
 	}
 	/*
 	 * Before sending anything check for a state update. For hpts
 	 * calling without input this is important. If its input calling
 	 * then this was already done.
 	 */
 	if (bbr->rc_use_google == 0)
 		bbr_check_bbr_for_state(bbr, cts, __LINE__, 0);
 again:
 	/*
 	 * If we've recently taken a timeout, snd_max will be greater than
 	 * snd_max. BBR in general does not pay much attention to snd_nxt
 	 * for historic reasons the persist timer still uses it. This means
 	 * we have to look at it. All retransmissions that are not persits
 	 * use the rsm that needs to be sent so snd_nxt is ignored. At the
 	 * end of this routine we pull snd_nxt always up to snd_max.
 	 */
 	doing_tlp = 0;
 #ifdef BBR_INVARIANTS
 	doing_retran_from = picked_up_retran = 0;
 #endif
 	error = 0;
 	tso = 0;
 	slot = 0;
 	mtu = 0;
 	sendwin = min(tp->snd_wnd, tp->snd_cwnd);
 	sb_offset = tp->snd_max - tp->snd_una;
 	flags = tcp_outflags[tp->t_state];
 	sack_rxmit = 0;
 	len = 0;
 	rsm = NULL;
 	if (flags & TH_RST) {
 		SOCKBUF_LOCK(sb);
 		goto send;
 	}
 recheck_resend:
 	while (bbr->r_ctl.rc_free_cnt < bbr_min_req_free) {
 		/* We need to always have one in reserve */
 		rsm = bbr_alloc(bbr);
 		if (rsm == NULL) {
 			error = ENOMEM;
 			/* Lie to get on the hpts */
 			tot_len = tp->t_maxseg;
 			if (hpts_calling)
 				/* Retry in a ms */
 				slot = 1001;
 			goto just_return_nolock;
 		}
 		TAILQ_INSERT_TAIL(&bbr->r_ctl.rc_free, rsm, r_next);
 		bbr->r_ctl.rc_free_cnt++;
 		rsm = NULL;
 	}
 	/* What do we send, a resend? */
 	if (bbr->r_ctl.rc_resend == NULL) {
 		/* Check for rack timeout */
 		bbr->r_ctl.rc_resend = bbr_check_recovery_mode(tp, bbr, cts);
 		if (bbr->r_ctl.rc_resend) {
 #ifdef BBR_INVARIANTS
 			picked_up_retran = 1;
 #endif
 			bbr_cong_signal(tp, NULL, CC_NDUPACK, bbr->r_ctl.rc_resend);
 		}
 	}
 	if (bbr->r_ctl.rc_resend) {
 		rsm = bbr->r_ctl.rc_resend;
 #ifdef BBR_INVARIANTS
 		doing_retran_from = 1;
 #endif
 		/* Remove any TLP flags its a RACK or T-O */
 		rsm->r_flags &= ~BBR_TLP;
 		bbr->r_ctl.rc_resend = NULL;
 		if (SEQ_LT(rsm->r_start, tp->snd_una)) {
 #ifdef BBR_INVARIANTS
 			panic("Huh, tp:%p bbr:%p rsm:%p start:%u < snd_una:%u\n",
 			    tp, bbr, rsm, rsm->r_start, tp->snd_una);
 			goto recheck_resend;
 #else
 			/* TSNH */
 			rsm = NULL;
 			goto recheck_resend;
 #endif
 		}
 		if (rsm->r_flags & BBR_HAS_SYN) {
 			/* Only retransmit a SYN by itself */
 			len = 0;
 			if ((flags & TH_SYN) == 0) {
 				/* Huh something is wrong */
 				rsm->r_start++;
 				if (rsm->r_start == rsm->r_end) {
 					/* Clean it up, somehow we missed the ack? */
 					bbr_log_syn(tp, NULL);
 				} else {
 					/* TFO with data? */
 					rsm->r_flags &= ~BBR_HAS_SYN;
 					len = rsm->r_end - rsm->r_start;
 				}
 			} else {
 				/* Retransmitting SYN */
 				rsm = NULL;
 				SOCKBUF_LOCK(sb);
 				goto send;
 			}
 		} else
 			len = rsm->r_end - rsm->r_start;
 		if ((bbr->rc_resends_use_tso == 0) &&
 		    (len > maxseg)) {
 			len = maxseg;
 			more_to_rxt = 1;
 		}
 		sb_offset = rsm->r_start - tp->snd_una;
 		if (len > 0) {
 			sack_rxmit = 1;
 			KMOD_TCPSTAT_INC(tcps_sack_rexmits);
 			KMOD_TCPSTAT_ADD(tcps_sack_rexmit_bytes,
 			    min(len, maxseg));
 		} else {
 			/* I dont think this can happen */
 			rsm = NULL;
 			goto recheck_resend;
 		}
 		BBR_STAT_INC(bbr_resends_set);
 	} else if (bbr->r_ctl.rc_tlp_send) {
 		/*
 		 * Tail loss probe
 		 */
 		doing_tlp = 1;
 		rsm = bbr->r_ctl.rc_tlp_send;
 		bbr->r_ctl.rc_tlp_send = NULL;
 		sack_rxmit = 1;
 		len = rsm->r_end - rsm->r_start;
 		if ((bbr->rc_resends_use_tso == 0) && (len > maxseg))
 			len = maxseg;
 
 		if (SEQ_GT(tp->snd_una, rsm->r_start)) {
 #ifdef BBR_INVARIANTS
 			panic("tp:%p bbc:%p snd_una:%u rsm:%p r_start:%u",
 			    tp, bbr, tp->snd_una, rsm, rsm->r_start);
 #else
 			/* TSNH */
 			rsm = NULL;
 			goto recheck_resend;
 #endif
 		}
 		sb_offset = rsm->r_start - tp->snd_una;
 		BBR_STAT_INC(bbr_tlp_set);
 	}
 	/*
 	 * Enforce a connection sendmap count limit if set
 	 * as long as we are not retransmiting.
 	 */
 	if ((rsm == NULL) &&
 	    (V_tcp_map_entries_limit > 0) &&
 	    (bbr->r_ctl.rc_num_maps_alloced >= V_tcp_map_entries_limit)) {
 		BBR_STAT_INC(bbr_alloc_limited);
 		if (!bbr->alloc_limit_reported) {
 			bbr->alloc_limit_reported = 1;
 			BBR_STAT_INC(bbr_alloc_limited_conns);
 		}
 		goto just_return_nolock;
 	}
 #ifdef BBR_INVARIANTS
 	if (rsm && SEQ_LT(rsm->r_start, tp->snd_una)) {
 		panic("tp:%p bbr:%p rsm:%p sb_offset:%u len:%u",
 		    tp, bbr, rsm, sb_offset, len);
 	}
 #endif
 	/*
 	 * Get standard flags, and add SYN or FIN if requested by 'hidden'
 	 * state flags.
 	 */
 	if (tp->t_flags & TF_NEEDFIN && (rsm == NULL))
 		flags |= TH_FIN;
 	if (tp->t_flags & TF_NEEDSYN)
 		flags |= TH_SYN;
 
 	if (rsm && (rsm->r_flags & BBR_HAS_FIN)) {
 		/* we are retransmitting the fin */
 		len--;
 		if (len) {
 			/*
 			 * When retransmitting data do *not* include the
 			 * FIN. This could happen from a TLP probe if we
 			 * allowed data with a FIN.
 			 */
 			flags &= ~TH_FIN;
 		}
 	} else if (rsm) {
 		if (flags & TH_FIN)
 			flags &= ~TH_FIN;
 	}
 	if ((sack_rxmit == 0) && (prefetch_rsm == 0)) {
 		void *end_rsm;
 
 		end_rsm = TAILQ_LAST_FAST(&bbr->r_ctl.rc_tmap, bbr_sendmap, r_tnext);
 		if (end_rsm)
 			kern_prefetch(end_rsm, &prefetch_rsm);
 		prefetch_rsm = 1;
 	}
 	SOCKBUF_LOCK(sb);
 	/*
 	 * If snd_nxt == snd_max and we have transmitted a FIN, the
 	 * sb_offset will be > 0 even if so_snd.sb_cc is 0, resulting in a
 	 * negative length.  This can also occur when TCP opens up its
 	 * congestion window while receiving additional duplicate acks after
 	 * fast-retransmit because TCP will reset snd_nxt to snd_max after
 	 * the fast-retransmit.
 	 *
 	 * In the normal retransmit-FIN-only case, however, snd_nxt will be
 	 * set to snd_una, the sb_offset will be 0, and the length may wind
 	 * up 0.
 	 *
 	 * If sack_rxmit is true we are retransmitting from the scoreboard
 	 * in which case len is already set.
 	 */
 	if (sack_rxmit == 0) {
 		uint32_t avail;
 
 		avail = sbavail(sb);
 		if (SEQ_GT(tp->snd_max, tp->snd_una))
 			sb_offset = tp->snd_max - tp->snd_una;
 		else
 			sb_offset = 0;
 		if (bbr->rc_tlp_new_data) {
 			/* TLP is forcing out new data */
 			uint32_t tlplen;
 
 			doing_tlp = 1;
 			tlplen = maxseg;
 
 			if (tlplen > (uint32_t)(avail - sb_offset)) {
 				tlplen = (uint32_t)(avail - sb_offset);
 			}
 			if (tlplen > tp->snd_wnd) {
 				len = tp->snd_wnd;
 			} else {
 				len = tlplen;
 			}
 			bbr->rc_tlp_new_data = 0;
 		} else {
 			len = bbr_what_can_we_send(tp, bbr, sendwin, avail, sb_offset, cts);
 			if ((len < p_maxseg) &&
 			    (bbr->rc_in_persist == 0) &&
 			    (ctf_outstanding(tp) >= (2 * p_maxseg)) &&
 			    ((avail - sb_offset) >= p_maxseg)) {
 				/*
 				 * We are not completing whats in the socket
 				 * buffer (i.e. there is at least a segment
 				 * waiting to send) and we have 2 or more
 				 * segments outstanding. There is no sense
 				 * of sending a little piece. Lets defer and
 				 * and wait until we can send a whole
 				 * segment.
 				 */
 				len = 0;
 			}
 			if (bbr->rc_in_persist) {
 				/*
 				 * We are in persists, figure out if
 				 * a retransmit is available (maybe the previous
 				 * persists we sent) or if we have to send new
 				 * data.
 				 */
 				rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 				if (rsm) {
 					len = rsm->r_end - rsm->r_start;
 					if (rsm->r_flags & BBR_HAS_FIN)
 						len--;
 					if ((bbr->rc_resends_use_tso == 0) && (len > maxseg))
 						len = maxseg;
 					if (len > 1)
 						BBR_STAT_INC(bbr_persist_reneg);
 					/*
 					 * XXXrrs we could force the len to
 					 * 1 byte here to cause the chunk to
 					 * split apart.. but that would then
 					 * mean we always retransmit it as
 					 * one byte even after the window
 					 * opens.
 					 */
 					sack_rxmit = 1;
 					sb_offset = rsm->r_start - tp->snd_una;
 				} else {
 					/*
 					 * First time through in persists or peer
 					 * acked our one byte. Though we do have
 					 * to have something in the sb.
 					 */
 					len = 1;
 					sb_offset = 0;
 					if (avail == 0)
 					    len = 0;
 				}
 			}
 		}
 	}
 	if (prefetch_so_done == 0) {
 		kern_prefetch(so, &prefetch_so_done);
 		prefetch_so_done = 1;
 	}
 	/*
 	 * Lop off SYN bit if it has already been sent.  However, if this is
 	 * SYN-SENT state and if segment contains data and if we don't know
 	 * that foreign host supports TAO, suppress sending segment.
 	 */
 	if ((flags & TH_SYN) && (rsm == NULL) &&
 	    SEQ_GT(tp->snd_max, tp->snd_una)) {
 		if (tp->t_state != TCPS_SYN_RECEIVED)
 			flags &= ~TH_SYN;
 		/*
 		 * When sending additional segments following a TFO SYN|ACK,
 		 * do not include the SYN bit.
 		 */
 		if (IS_FASTOPEN(tp->t_flags) &&
 		    (tp->t_state == TCPS_SYN_RECEIVED))
 			flags &= ~TH_SYN;
 		sb_offset--, len++;
 		if (sbavail(sb) == 0)
 			len = 0;
 	} else if ((flags & TH_SYN) && rsm) {
 		/*
 		 * Subtract one from the len for the SYN being
 		 * retransmitted.
 		 */
 		len--;
 	}
 	/*
 	 * Be careful not to send data and/or FIN on SYN segments. This
 	 * measure is needed to prevent interoperability problems with not
 	 * fully conformant TCP implementations.
 	 */
 	if ((flags & TH_SYN) && (tp->t_flags & TF_NOOPT)) {
 		len = 0;
 		flags &= ~TH_FIN;
 	}
 	/*
 	 * On TFO sockets, ensure no data is sent in the following cases:
 	 *
 	 *  - When retransmitting SYN|ACK on a passively-created socket
 	 *  - When retransmitting SYN on an actively created socket
 	 *  - When sending a zero-length cookie (cookie request) on an
 	 *    actively created socket
 	 *  - When the socket is in the CLOSED state (RST is being sent)
 	 */
 	if (IS_FASTOPEN(tp->t_flags) &&
 	    (((flags & TH_SYN) && (tp->t_rxtshift > 0)) ||
 	     ((tp->t_state == TCPS_SYN_SENT) &&
 	      (tp->t_tfo_client_cookie_len == 0)) ||
 	     (flags & TH_RST))) {
 		len = 0;
 		sack_rxmit = 0;
 		rsm = NULL;
 	}
 	/* Without fast-open there should never be data sent on a SYN */
 	if ((flags & TH_SYN) && (!IS_FASTOPEN(tp->t_flags)))
 		len = 0;
 	if (len <= 0) {
 		/*
 		 * If FIN has been sent but not acked, but we haven't been
 		 * called to retransmit, len will be < 0.  Otherwise, window
 		 * shrank after we sent into it.  If window shrank to 0,
 		 * cancel pending retransmit, pull snd_nxt back to (closed)
 		 * window, and set the persist timer if it isn't already
 		 * going.  If the window didn't close completely, just wait
 		 * for an ACK.
 		 *
 		 * We also do a general check here to ensure that we will
 		 * set the persist timer when we have data to send, but a
 		 * 0-byte window. This makes sure the persist timer is set
 		 * even if the packet hits one of the "goto send" lines
 		 * below.
 		 */
 		len = 0;
 		if ((tp->snd_wnd == 0) &&
 		    (TCPS_HAVEESTABLISHED(tp->t_state)) &&
 		    (tp->snd_una == tp->snd_max) &&
 		    (sb_offset < (int)sbavail(sb))) {
 			/*
 			 * Not enough room in the rwnd to send
 			 * a paced segment out.
 			 */
 			bbr_enter_persist(tp, bbr, cts, __LINE__);
 		}
 	} else if ((rsm == NULL) &&
 		   (doing_tlp == 0) &&
 		   (len < bbr->r_ctl.rc_pace_max_segs)) {
 		/*
 		 * We are not sending a full segment for
 		 * some reason. Should we not send anything (think
 		 * sws or persists)?
 		 */
 		if ((tp->snd_wnd < min((bbr->r_ctl.rc_high_rwnd/2), bbr_minseg(bbr))) &&
 		    (TCPS_HAVEESTABLISHED(tp->t_state)) &&
 		    (len < (int)(sbavail(sb) - sb_offset))) {
 			/*
 			 * Here the rwnd is less than
 			 * the pacing size, this is not a retransmit,
 			 * we are established and
 			 * the send is not the last in the socket buffer
 			 * lets not send, and possibly enter persists.
 			 */
 			len = 0;
 			if (tp->snd_max == tp->snd_una)
 				bbr_enter_persist(tp, bbr, cts, __LINE__);
 		} else if ((tp->snd_cwnd >= bbr->r_ctl.rc_pace_max_segs) &&
 			   (ctf_flight_size(tp, (bbr->r_ctl.rc_sacked +
 						 bbr->r_ctl.rc_lost_bytes)) > (2 * maxseg)) &&
 			   (len < (int)(sbavail(sb) - sb_offset)) &&
 			   (len < bbr_minseg(bbr))) {
 			/*
 			 * Here we are not retransmitting, and
 			 * the cwnd is not so small that we could
 			 * not send at least a min size (rxt timer
 			 * not having gone off), We have 2 segments or
 			 * more already in flight, its not the tail end
 			 * of the socket buffer  and the cwnd is blocking
 			 * us from sending out minimum pacing segment size.
 			 * Lets not send anything.
 			 */
 			bbr->rc_cwnd_limited = 1;
 			len = 0;
 		} else if (((tp->snd_wnd - ctf_outstanding(tp)) <
 			    min((bbr->r_ctl.rc_high_rwnd/2), bbr_minseg(bbr))) &&
 			   (ctf_flight_size(tp, (bbr->r_ctl.rc_sacked +
 						 bbr->r_ctl.rc_lost_bytes)) > (2 * maxseg)) &&
 			   (len < (int)(sbavail(sb) - sb_offset)) &&
 			   (TCPS_HAVEESTABLISHED(tp->t_state))) {
 			/*
 			 * Here we have a send window but we have
 			 * filled it up and we can't send another pacing segment.
 			 * We also have in flight more than 2 segments
 			 * and we are not completing the sb i.e. we allow
 			 * the last bytes of the sb to go out even if
 			 * its not a full pacing segment.
 			 */
 			len = 0;
 		}
 	}
 	/* len will be >= 0 after this point. */
 	KASSERT(len >= 0, ("[%s:%d]: len < 0", __func__, __LINE__));
 	tcp_sndbuf_autoscale(tp, so, sendwin);
 	/*
 	 *
 	 */
 	if (bbr->rc_in_persist &&
 	    len &&
 	    (rsm == NULL) &&
 	    (len < min((bbr->r_ctl.rc_high_rwnd/2), bbr->r_ctl.rc_pace_max_segs))) {
 		/*
 		 * We are in persist, not doing a retransmit and don't have enough space
 		 * yet to send a full TSO. So is it at the end of the sb
 		 * if so we need to send else nuke to 0 and don't send.
 		 */
 		int sbleft;
 		if (sbavail(sb) > sb_offset)
 			sbleft = sbavail(sb) - sb_offset;
 		else
 			sbleft = 0;
 		if (sbleft >= min((bbr->r_ctl.rc_high_rwnd/2), bbr->r_ctl.rc_pace_max_segs)) {
 			/* not at end of sb lets not send */
 			len = 0;
 		}
 	}
 	/*
 	 * Decide if we can use TCP Segmentation Offloading (if supported by
 	 * hardware).
 	 *
 	 * TSO may only be used if we are in a pure bulk sending state.  The
 	 * presence of TCP-MD5, SACK retransmits, SACK advertizements and IP
 	 * options prevent using TSO.  With TSO the TCP header is the same
 	 * (except for the sequence number) for all generated packets.  This
 	 * makes it impossible to transmit any options which vary per
 	 * generated segment or packet.
 	 *
 	 * IPv4 handling has a clear separation of ip options and ip header
 	 * flags while IPv6 combines both in in6p_outputopts. ip6_optlen()
 	 * does the right thing below to provide length of just ip options
 	 * and thus checking for ipoptlen is enough to decide if ip options
 	 * are present.
 	 */
 #ifdef INET6
 	if (isipv6)
 		ipoptlen = ip6_optlen(inp);
 	else
 #endif
 	if (inp->inp_options)
 		ipoptlen = inp->inp_options->m_len -
 		    offsetof(struct ipoption, ipopt_list);
 	else
 		ipoptlen = 0;
 #if defined(IPSEC) || defined(IPSEC_SUPPORT)
 	/*
 	 * Pre-calculate here as we save another lookup into the darknesses
 	 * of IPsec that way and can actually decide if TSO is ok.
 	 */
 #ifdef INET6
 	if (isipv6 && IPSEC_ENABLED(ipv6))
 		ipsec_optlen = IPSEC_HDRSIZE(ipv6, inp);
 #ifdef INET
 	else
 #endif
 #endif				/* INET6 */
 #ifdef INET
 	if (IPSEC_ENABLED(ipv4))
 		ipsec_optlen = IPSEC_HDRSIZE(ipv4, inp);
 #endif				/* INET */
 #endif				/* IPSEC */
 #if defined(IPSEC) || defined(IPSEC_SUPPORT)
 	ipoptlen += ipsec_optlen;
 #endif
 	if ((tp->t_flags & TF_TSO) && V_tcp_do_tso &&
 	    (len > maxseg) &&
 	    (tp->t_port == 0) &&
 	    ((tp->t_flags & TF_SIGNATURE) == 0) &&
 	    tp->rcv_numsacks == 0 &&
 	    ipoptlen == 0)
 		tso = 1;
 
 	recwin = lmin(lmax(sbspace(&so->so_rcv), 0),
 	    (long)TCP_MAXWIN << tp->rcv_scale);
 	/*
 	 * Sender silly window avoidance.   We transmit under the following
 	 * conditions when len is non-zero:
 	 *
 	 * - We have a full segment (or more with TSO) - This is the last
 	 * buffer in a write()/send() and we are either idle or running
 	 * NODELAY - we've timed out (e.g. persist timer) - we have more
 	 * then 1/2 the maximum send window's worth of data (receiver may be
 	 * limited the window size) - we need to retransmit
 	 */
 	if (rsm)
 		goto send;
 	if (len) {
 		if (sack_rxmit)
 			goto send;
 		if (len >= p_maxseg)
 			goto send;
 		/*
 		 * NOTE! on localhost connections an 'ack' from the remote
 		 * end may occur synchronously with the output and cause us
 		 * to flush a buffer queued with moretocome.  XXX
 		 *
 		 */
 		if (((tp->t_flags & TF_MORETOCOME) == 0) &&	/* normal case */
 		    ((tp->t_flags & TF_NODELAY) ||
 		    ((uint32_t)len + (uint32_t)sb_offset) >= sbavail(&so->so_snd)) &&
 		    (tp->t_flags & TF_NOPUSH) == 0) {
 			goto send;
 		}
 		if ((tp->snd_una == tp->snd_max) && len) {	/* Nothing outstanding */
 			goto send;
 		}
 		if (len >= tp->max_sndwnd / 2 && tp->max_sndwnd > 0) {
 			goto send;
 		}
 	}
 	/*
 	 * Sending of standalone window updates.
 	 *
 	 * Window updates are important when we close our window due to a
 	 * full socket buffer and are opening it again after the application
 	 * reads data from it.  Once the window has opened again and the
 	 * remote end starts to send again the ACK clock takes over and
 	 * provides the most current window information.
 	 *
 	 * We must avoid the silly window syndrome whereas every read from
 	 * the receive buffer, no matter how small, causes a window update
 	 * to be sent.  We also should avoid sending a flurry of window
 	 * updates when the socket buffer had queued a lot of data and the
 	 * application is doing small reads.
 	 *
 	 * Prevent a flurry of pointless window updates by only sending an
 	 * update when we can increase the advertized window by more than
 	 * 1/4th of the socket buffer capacity.  When the buffer is getting
 	 * full or is very small be more aggressive and send an update
 	 * whenever we can increase by two mss sized segments. In all other
 	 * situations the ACK's to new incoming data will carry further
 	 * window increases.
 	 *
 	 * Don't send an independent window update if a delayed ACK is
 	 * pending (it will get piggy-backed on it) or the remote side
 	 * already has done a half-close and won't send more data.  Skip
 	 * this if the connection is in T/TCP half-open state.
 	 */
 	if (recwin > 0 && !(tp->t_flags & TF_NEEDSYN) &&
 	    !(tp->t_flags & TF_DELACK) &&
 	    !TCPS_HAVERCVDFIN(tp->t_state)) {
 		/* Check to see if we should do a window update */
 		if (bbr_window_update_needed(tp, so, recwin, maxseg))
 			goto send;
 	}
 	/*
 	 * Send if we owe the peer an ACK, RST, SYN.  ACKNOW
 	 * is also a catch-all for the retransmit timer timeout case.
 	 */
 	if (tp->t_flags & TF_ACKNOW) {
 		goto send;
 	}
 	if (flags & TH_RST) {
 		/* Always send a RST if one is due */
 		goto send;
 	}
 	if ((flags & TH_SYN) && (tp->t_flags & TF_NEEDSYN) == 0) {
 		goto send;
 	}
 	/*
 	 * If our state indicates that FIN should be sent and we have not
 	 * yet done so, then we need to send.
 	 */
 	if (flags & TH_FIN &&
 	    ((tp->t_flags & TF_SENTFIN) == 0)) {
 		goto send;
 	}
 	/*
 	 * No reason to send a segment, just return.
 	 */
 just_return:
 	SOCKBUF_UNLOCK(sb);
 just_return_nolock:
 	if (tot_len)
 		slot = bbr_get_pacing_delay(bbr, bbr->r_ctl.rc_bbr_hptsi_gain, tot_len, cts, 0);
 	if (bbr->rc_no_pacing)
 		slot = 0;
 	if (tot_len == 0) {
 		if ((ctf_outstanding(tp) + min((bbr->r_ctl.rc_high_rwnd/2), bbr_minseg(bbr))) >=
 		    tp->snd_wnd) {
 			BBR_STAT_INC(bbr_rwnd_limited);
 			app_limited = BBR_JR_RWND_LIMITED;
 			bbr_cwnd_limiting(tp, bbr, ctf_outstanding(tp));
 			if ((bbr->rc_in_persist == 0) &&
 			    TCPS_HAVEESTABLISHED(tp->t_state) &&
 			    (tp->snd_max == tp->snd_una) &&
 			    sbavail(&so->so_snd)) {
 				/* No send window.. we must enter persist */
 				bbr_enter_persist(tp, bbr, bbr->r_ctl.rc_rcvtime, __LINE__);
 			}
 		} else if (ctf_outstanding(tp) >= sbavail(sb)) {
 			BBR_STAT_INC(bbr_app_limited);
 			app_limited = BBR_JR_APP_LIMITED;
 			bbr_cwnd_limiting(tp, bbr, ctf_outstanding(tp));
 		} else if ((ctf_flight_size(tp, (bbr->r_ctl.rc_sacked +
 						 bbr->r_ctl.rc_lost_bytes)) + p_maxseg) >= tp->snd_cwnd) {
 			BBR_STAT_INC(bbr_cwnd_limited);
  			app_limited = BBR_JR_CWND_LIMITED;
 			bbr_cwnd_limiting(tp, bbr, ctf_flight_size(tp, (bbr->r_ctl.rc_sacked +
 									bbr->r_ctl.rc_lost_bytes)));
 			bbr->rc_cwnd_limited = 1;
 		} else {
 			BBR_STAT_INC(bbr_app_limited);
 			app_limited = BBR_JR_APP_LIMITED;
 			bbr_cwnd_limiting(tp, bbr, ctf_outstanding(tp));
 		}
 		bbr->r_ctl.rc_hptsi_agg_delay = 0;
 		bbr->r_agg_early_set = 0;
 		bbr->r_ctl.rc_agg_early = 0;
 		bbr->r_ctl.rc_last_delay_val = 0;
 	} else if (bbr->rc_use_google == 0)
 		bbr_check_bbr_for_state(bbr, cts, __LINE__, 0);
 	/* Are we app limited? */
 	if ((app_limited == BBR_JR_APP_LIMITED) ||
 	    (app_limited == BBR_JR_RWND_LIMITED)) {
 		/**
 		 * We are application limited.
 		 */
 		bbr->r_ctl.r_app_limited_until = (ctf_flight_size(tp, (bbr->r_ctl.rc_sacked +
 								       bbr->r_ctl.rc_lost_bytes)) + bbr->r_ctl.rc_delivered);
 	}
 	if (tot_len == 0)
 		counter_u64_add(bbr_out_size[TCP_MSS_ACCT_JUSTRET], 1);
 	/* Dont update the time if we did not send */
 	bbr->r_ctl.rc_last_delay_val = 0;
 	bbr->rc_output_starts_timer = 1;
 	bbr_start_hpts_timer(bbr, tp, cts, 9, slot, tot_len);
 	bbr_log_type_just_return(bbr, cts, tot_len, hpts_calling, app_limited, p_maxseg, len);
 	if (SEQ_LT(tp->snd_nxt, tp->snd_max)) {
 		/* Make sure snd_nxt is drug up */
 		tp->snd_nxt = tp->snd_max;
 	}
 	return (error);
 
 send:
 	if (doing_tlp == 0) {
 		/*
 		 * Data not a TLP, and its not the rxt firing. If it is the
 		 * rxt firing, we want to leave the tlp_in_progress flag on
 		 * so we don't send another TLP. It has to be a rack timer
 		 * or normal send (response to acked data) to clear the tlp
 		 * in progress flag.
 		 */
 		bbr->rc_tlp_in_progress = 0;
 		bbr->rc_tlp_rtx_out = 0;
 	} else {
 		/*
 		 * Its a TLP.
 		 */
 		bbr->rc_tlp_in_progress = 1;
 	}
 	bbr_timer_cancel(bbr, __LINE__, cts);
 	if (rsm == NULL) {
 		if (sbused(sb) > 0) {
 			/*
 			 * This is sub-optimal. We only send a stand alone
 			 * FIN on its own segment.
 			 */
 			if (flags & TH_FIN) {
 				flags &= ~TH_FIN;
 				if ((len == 0) && ((tp->t_flags & TF_ACKNOW) == 0)) {
 					/* Lets not send this */
 					slot = 0;
 					goto just_return;
 				}
 			}
 		}
 	} else {
 		/*
 		 * We do *not* send a FIN on a retransmit if it has data.
 		 * The if clause here where len > 1 should never come true.
 		 */
 		if ((len > 0) &&
 		    (((rsm->r_flags & BBR_HAS_FIN) == 0) &&
 		    (flags & TH_FIN))) {
 			flags &= ~TH_FIN;
 			len--;
 		}
 	}
 	SOCKBUF_LOCK_ASSERT(sb);
 	if (len > 0) {
 		if ((tp->snd_una == tp->snd_max) &&
 		    (bbr_calc_time(cts, bbr->r_ctl.rc_went_idle_time) >= bbr_rtt_probe_time)) {
 			/*
 			 * This qualifies as a RTT_PROBE session since we
 			 * drop the data outstanding to nothing and waited
 			 * more than bbr_rtt_probe_time.
 			 */
 			bbr_log_rtt_shrinks(bbr, cts, 0, 0, __LINE__, BBR_RTTS_WASIDLE, 0);
 			bbr_set_reduced_rtt(bbr, cts, __LINE__);
 		}
 		if (len >= maxseg)
 			tp->t_flags2 |= TF2_PLPMTU_MAXSEGSNT;
 		else
 			tp->t_flags2 &= ~TF2_PLPMTU_MAXSEGSNT;
 	}
 	/*
 	 * Before ESTABLISHED, force sending of initial options unless TCP
 	 * set not to do any options. NOTE: we assume that the IP/TCP header
 	 * plus TCP options always fit in a single mbuf, leaving room for a
 	 * maximum link header, i.e. max_linkhdr + sizeof (struct tcpiphdr)
 	 * + optlen <= MCLBYTES
 	 */
 	optlen = 0;
 #ifdef INET6
 	if (isipv6)
 		hdrlen = sizeof(struct ip6_hdr) + sizeof(struct tcphdr);
 	else
 #endif
 		hdrlen = sizeof(struct tcpiphdr);
 
 	/*
 	 * Compute options for segment. We only have to care about SYN and
 	 * established connection segments.  Options for SYN-ACK segments
 	 * are handled in TCP syncache.
 	 */
 	to.to_flags = 0;
 	local_options = 0;
 	if ((tp->t_flags & TF_NOOPT) == 0) {
 		/* Maximum segment size. */
 		if (flags & TH_SYN) {
 			to.to_mss = tcp_mssopt(&inp->inp_inc);
 			if (tp->t_port)
 				to.to_mss -= V_tcp_udp_tunneling_overhead;
 			to.to_flags |= TOF_MSS;
 			/*
 			 * On SYN or SYN|ACK transmits on TFO connections,
 			 * only include the TFO option if it is not a
 			 * retransmit, as the presence of the TFO option may
 			 * have caused the original SYN or SYN|ACK to have
 			 * been dropped by a middlebox.
 			 */
 			if (IS_FASTOPEN(tp->t_flags) &&
 			    (tp->t_rxtshift == 0)) {
 				if (tp->t_state == TCPS_SYN_RECEIVED) {
 					to.to_tfo_len = TCP_FASTOPEN_COOKIE_LEN;
 					to.to_tfo_cookie =
 					    (u_int8_t *)&tp->t_tfo_cookie.server;
 					to.to_flags |= TOF_FASTOPEN;
 					wanted_cookie = 1;
 				} else if (tp->t_state == TCPS_SYN_SENT) {
 					to.to_tfo_len =
 					    tp->t_tfo_client_cookie_len;
 					to.to_tfo_cookie =
 					    tp->t_tfo_cookie.client;
 					to.to_flags |= TOF_FASTOPEN;
 					wanted_cookie = 1;
 				}
 			}
 		}
 		/* Window scaling. */
 		if ((flags & TH_SYN) && (tp->t_flags & TF_REQ_SCALE)) {
 			to.to_wscale = tp->request_r_scale;
 			to.to_flags |= TOF_SCALE;
 		}
 		/* Timestamps. */
 		if ((tp->t_flags & TF_RCVD_TSTMP) ||
 		    ((flags & TH_SYN) && (tp->t_flags & TF_REQ_TSTMP))) {
 			to.to_tsval = 	tcp_tv_to_mssectick(&bbr->rc_tv) + tp->ts_offset;
 			to.to_tsecr = tp->ts_recent;
 			to.to_flags |= TOF_TS;
 			local_options += TCPOLEN_TIMESTAMP + 2;
 		}
 		/* Set receive buffer autosizing timestamp. */
 		if (tp->rfbuf_ts == 0 &&
 		    (so->so_rcv.sb_flags & SB_AUTOSIZE))
 			tp->rfbuf_ts = 	tcp_tv_to_mssectick(&bbr->rc_tv);
 		/* Selective ACK's. */
 		if (flags & TH_SYN)
 			to.to_flags |= TOF_SACKPERM;
 		else if (TCPS_HAVEESTABLISHED(tp->t_state) &&
 		    tp->rcv_numsacks > 0) {
 			to.to_flags |= TOF_SACK;
 			to.to_nsacks = tp->rcv_numsacks;
 			to.to_sacks = (u_char *)tp->sackblks;
 		}
 #if defined(IPSEC_SUPPORT) || defined(TCP_SIGNATURE)
 		/* TCP-MD5 (RFC2385). */
 		if (tp->t_flags & TF_SIGNATURE)
 			to.to_flags |= TOF_SIGNATURE;
 #endif				/* TCP_SIGNATURE */
 
 		/* Processing the options. */
 		hdrlen += (optlen = tcp_addoptions(&to, opt));
 		/*
 		 * If we wanted a TFO option to be added, but it was unable
 		 * to fit, ensure no data is sent.
 		 */
 		if (IS_FASTOPEN(tp->t_flags) && wanted_cookie &&
 		    !(to.to_flags & TOF_FASTOPEN))
 			len = 0;
 	}
 	if (tp->t_port) {
 		if (V_tcp_udp_tunneling_port == 0) {
 			/* The port was removed?? */
 			SOCKBUF_UNLOCK(&so->so_snd);
 			return (EHOSTUNREACH);
 		}
 		hdrlen += sizeof(struct udphdr);
 	}
 #ifdef INET6
 	if (isipv6)
 		ipoptlen = ip6_optlen(inp);
 	else
 #endif
 	if (inp->inp_options)
 		ipoptlen = inp->inp_options->m_len -
 		    offsetof(struct ipoption, ipopt_list);
 	else
 		ipoptlen = 0;
 	ipoptlen = 0;
 #if defined(IPSEC) || defined(IPSEC_SUPPORT)
 	ipoptlen += ipsec_optlen;
 #endif
 	if (bbr->rc_last_options != local_options) {
 		/*
 		 * Cache the options length this generally does not change
 		 * on a connection. We use this to calculate TSO.
 		 */
 		bbr->rc_last_options = local_options;
 	}
 	maxseg = tp->t_maxseg - (ipoptlen + optlen);
 	p_maxseg = min(maxseg, pace_max_segs);
 	/*
 	 * Adjust data length if insertion of options will bump the packet
 	 * length beyond the t_maxseg length. Clear the FIN bit because we
 	 * cut off the tail of the segment.
 	 */
 	if (len > maxseg) {
 		if (len != 0 && (flags & TH_FIN)) {
 			flags &= ~TH_FIN;
 		}
 		if (tso) {
 			uint32_t moff;
 			int32_t max_len;
 
 			/* extract TSO information */
 			if_hw_tsomax = tp->t_tsomax;
 			if_hw_tsomaxsegcount = tp->t_tsomaxsegcount;
 			if_hw_tsomaxsegsize = tp->t_tsomaxsegsize;
 			KASSERT(ipoptlen == 0,
 			    ("%s: TSO can't do IP options", __func__));
 
 			/*
 			 * Check if we should limit by maximum payload
 			 * length:
 			 */
 			if (if_hw_tsomax != 0) {
 				/* compute maximum TSO length */
 				max_len = (if_hw_tsomax - hdrlen -
 				    max_linkhdr);
 				if (max_len <= 0) {
 					len = 0;
 				} else if (len > max_len) {
 					len = max_len;
 				}
 			}
 			/*
 			 * Prevent the last segment from being fractional
 			 * unless the send sockbuf can be emptied:
 			 */
 			if ((sb_offset + len) < sbavail(sb)) {
 				moff = len % (uint32_t)maxseg;
 				if (moff != 0) {
 					len -= moff;
 				}
 			}
 			/*
 			 * In case there are too many small fragments don't
 			 * use TSO:
 			 */
 			if (len <= maxseg) {
 				len = maxseg;
 				tso = 0;
 			}
 		} else {
 			/* Not doing TSO */
 			if (optlen + ipoptlen >= tp->t_maxseg) {
 				/*
 				 * Since we don't have enough space to put
 				 * the IP header chain and the TCP header in
 				 * one packet as required by RFC 7112, don't
 				 * send it. Also ensure that at least one
 				 * byte of the payload can be put into the
 				 * TCP segment.
 				 */
 				SOCKBUF_UNLOCK(&so->so_snd);
 				error = EMSGSIZE;
 				sack_rxmit = 0;
 				goto out;
 			}
 			len = maxseg;
 		}
 	} else {
 		/* Not doing TSO */
 		if_hw_tsomaxsegcount = 0;
 		tso = 0;
 	}
 	KASSERT(len + hdrlen + ipoptlen <= IP_MAXPACKET,
 	    ("%s: len > IP_MAXPACKET", __func__));
 #ifdef DIAGNOSTIC
 #ifdef INET6
 	if (max_linkhdr + hdrlen > MCLBYTES)
 #else
 	if (max_linkhdr + hdrlen > MHLEN)
 #endif
 		panic("tcphdr too big");
 #endif
 	/*
 	 * This KASSERT is here to catch edge cases at a well defined place.
 	 * Before, those had triggered (random) panic conditions further
 	 * down.
 	 */
 #ifdef BBR_INVARIANTS
 	if (sack_rxmit) {
 		if (SEQ_LT(rsm->r_start, tp->snd_una)) {
 			panic("RSM:%p TP:%p bbr:%p start:%u is < snd_una:%u",
 			    rsm, tp, bbr, rsm->r_start, tp->snd_una);
 		}
 	}
 #endif
 	KASSERT(len >= 0, ("[%s:%d]: len < 0", __func__, __LINE__));
 	if ((len == 0) &&
 	    (flags & TH_FIN) &&
 	    (sbused(sb))) {
 		/*
 		 * We have outstanding data, don't send a fin by itself!.
 		 */
 		slot = 0;
 		goto just_return;
 	}
 	/*
 	 * Grab a header mbuf, attaching a copy of data to be transmitted,
 	 * and initialize the header from the template for sends on this
 	 * connection.
 	 */
 	if (len) {
 		uint32_t moff;
 
 		/*
 		 * We place a limit on sending with hptsi.
 		 */
 		if ((rsm == NULL) && len > pace_max_segs)
 			len = pace_max_segs;
 		if (len <= maxseg)
 			tso = 0;
 #ifdef INET6
 		if (MHLEN < hdrlen + max_linkhdr)
 			m = m_getcl(M_NOWAIT, MT_DATA, M_PKTHDR);
 		else
 #endif
 			m = m_gethdr(M_NOWAIT, MT_DATA);
 
 		if (m == NULL) {
 			BBR_STAT_INC(bbr_failed_mbuf_aloc);
 			bbr_log_enobuf_jmp(bbr, len, cts, __LINE__, len, 0, 0);
 			SOCKBUF_UNLOCK(sb);
 			error = ENOBUFS;
 			sack_rxmit = 0;
 			goto out;
 		}
 		m->m_data += max_linkhdr;
 		m->m_len = hdrlen;
 		/*
 		 * Start the m_copy functions from the closest mbuf to the
 		 * sb_offset in the socket buffer chain.
 		 */
 		if ((sb_offset > sbavail(sb)) || ((len + sb_offset) > sbavail(sb))) {
 #ifdef BBR_INVARIANTS
 			if ((len + sb_offset) > (sbavail(sb) + ((flags & (TH_FIN | TH_SYN)) ? 1 : 0)))
 				panic("tp:%p bbr:%p len:%u sb_offset:%u sbavail:%u rsm:%p %u:%u:%u",
 				    tp, bbr, len, sb_offset, sbavail(sb), rsm,
 				    doing_retran_from,
 				    picked_up_retran,
 				    doing_tlp);
 
 #endif
 			/*
 			 * In this messed up situation we have two choices,
 			 * a) pretend the send worked, and just start timers
 			 * and what not (not good since that may lead us
 			 * back here a lot). <or> b) Send the lowest segment
 			 * in the map. <or> c) Drop the connection. Lets do
 			 * <b> which if it continues to happen will lead to
 			 * <c> via timeouts.
 			 */
 			BBR_STAT_INC(bbr_offset_recovery);
 			rsm = TAILQ_FIRST(&bbr->r_ctl.rc_map);
 			sb_offset = 0;
 			if (rsm == NULL) {
 				sack_rxmit = 0;
 				len = sbavail(sb);
 			} else {
 				sack_rxmit = 1;
 				if (rsm->r_start != tp->snd_una) {
 					/*
 					 * Things are really messed up, <c>
 					 * is the only thing to do.
 					 */
 					BBR_STAT_INC(bbr_offset_drop);
 					SOCKBUF_UNLOCK(sb);
 					(void)m_free(m);
 					return (-EFAULT); /* tcp_drop() */
 				}
 				len = rsm->r_end - rsm->r_start;
 			}
 			if (len > sbavail(sb))
 				len = sbavail(sb);
 			if (len > maxseg)
 				len = maxseg;
 		}
 		mb = sbsndptr_noadv(sb, sb_offset, &moff);
 		if (len <= MHLEN - hdrlen - max_linkhdr && !hw_tls) {
 			m_copydata(mb, moff, (int)len,
 			    mtod(m, caddr_t)+hdrlen);
 			if (rsm == NULL)
 				sbsndptr_adv(sb, mb, len);
 			m->m_len += len;
 		} else {
 			struct sockbuf *msb;
 
 			if (rsm)
 				msb = NULL;
 			else
 				msb = sb;
 #ifdef BBR_INVARIANTS
 			if ((len + moff) > (sbavail(sb) + ((flags & (TH_FIN | TH_SYN)) ? 1 : 0))) {
 				if (rsm) {
 					panic("tp:%p bbr:%p len:%u moff:%u sbavail:%u rsm:%p snd_una:%u rsm_start:%u flg:%x %u:%u:%u sr:%d ",
 					    tp, bbr, len, moff,
 					    sbavail(sb), rsm,
 					    tp->snd_una, rsm->r_flags, rsm->r_start,
 					    doing_retran_from,
 					    picked_up_retran,
 					    doing_tlp, sack_rxmit);
 				} else {
 					panic("tp:%p bbr:%p len:%u moff:%u sbavail:%u sb_offset:%u snd_una:%u",
 					    tp, bbr, len, moff, sbavail(sb), sb_offset, tp->snd_una);
 				}
 			}
 #endif
 			m->m_next = tcp_m_copym(
 				mb, moff, &len,
 				if_hw_tsomaxsegcount,
 				if_hw_tsomaxsegsize, msb,
 				((rsm == NULL) ? hw_tls : 0)
 #ifdef NETFLIX_COPY_ARGS
 				, NULL, NULL
 #endif
 				);
 			if (len <= maxseg) {
 				/*
 				 * Must have ran out of mbufs for the copy
 				 * shorten it to no longer need tso. Lets
 				 * not put on sendalot since we are low on
 				 * mbufs.
 				 */
 				tso = 0;
 			}
 			if (m->m_next == NULL) {
 				SOCKBUF_UNLOCK(sb);
 				(void)m_free(m);
 				error = ENOBUFS;
 				sack_rxmit = 0;
 				goto out;
 			}
 		}
 #ifdef BBR_INVARIANTS
 		if (tso && len < maxseg) {
 			panic("tp:%p tso on, but len:%d < maxseg:%d",
 			    tp, len, maxseg);
 		}
 		if (tso && if_hw_tsomaxsegcount) {
 			int32_t seg_cnt = 0;
 			struct mbuf *foo;
 
 			foo = m;
 			while (foo) {
 				seg_cnt++;
 				foo = foo->m_next;
 			}
 			if (seg_cnt > if_hw_tsomaxsegcount) {
 				panic("seg_cnt:%d > max:%d", seg_cnt, if_hw_tsomaxsegcount);
 			}
 		}
 #endif
 		/*
 		 * If we're sending everything we've got, set PUSH. (This
 		 * will keep happy those implementations which only give
 		 * data to the user when a buffer fills or a PUSH comes in.)
 		 */
 		if (sb_offset + len == sbused(sb) &&
 		    sbused(sb) &&
 		    !(flags & TH_SYN)) {
 			flags |= TH_PUSH;
 		}
 		SOCKBUF_UNLOCK(sb);
 	} else {
 		SOCKBUF_UNLOCK(sb);
 		if (tp->t_flags & TF_ACKNOW)
 			KMOD_TCPSTAT_INC(tcps_sndacks);
 		else if (flags & (TH_SYN | TH_FIN | TH_RST))
 			KMOD_TCPSTAT_INC(tcps_sndctrl);
 		else
 			KMOD_TCPSTAT_INC(tcps_sndwinup);
 
 		m = m_gethdr(M_NOWAIT, MT_DATA);
 		if (m == NULL) {
 			BBR_STAT_INC(bbr_failed_mbuf_aloc);
 			bbr_log_enobuf_jmp(bbr, len, cts, __LINE__, len, 0, 0);
 			error = ENOBUFS;
 			/* Fudge the send time since we could not send */
 			sack_rxmit = 0;
 			goto out;
 		}
 #ifdef INET6
 		if (isipv6 && (MHLEN < hdrlen + max_linkhdr) &&
 		    MHLEN >= hdrlen) {
 			M_ALIGN(m, hdrlen);
 		} else
 #endif
 			m->m_data += max_linkhdr;
 		m->m_len = hdrlen;
 	}
 	SOCKBUF_UNLOCK_ASSERT(sb);
 	m->m_pkthdr.rcvif = (struct ifnet *)0;
 #ifdef MAC
 	mac_inpcb_create_mbuf(inp, m);
 #endif
 #ifdef INET6
 	if (isipv6) {
 		ip6 = mtod(m, struct ip6_hdr *);
 		if (tp->t_port) {
 			udp = (struct udphdr *)((caddr_t)ip6 + sizeof(struct ip6_hdr));
 			udp->uh_sport = htons(V_tcp_udp_tunneling_port);
 			udp->uh_dport = tp->t_port;
 			ulen = hdrlen + len - sizeof(struct ip6_hdr);
 			udp->uh_ulen = htons(ulen);
 			th = (struct tcphdr *)(udp + 1);
 		} else {
 			th = (struct tcphdr *)(ip6 + 1);
 		}
 		tcpip_fillheaders(inp, tp->t_port, ip6, th);
 	} else
 #endif				/* INET6 */
 	{
 		ip = mtod(m, struct ip *);
 		if (tp->t_port) {
 			udp = (struct udphdr *)((caddr_t)ip + sizeof(struct ip));
 			udp->uh_sport = htons(V_tcp_udp_tunneling_port);
 			udp->uh_dport = tp->t_port;
 			ulen = hdrlen + len - sizeof(struct ip);
 			udp->uh_ulen = htons(ulen);
 			th = (struct tcphdr *)(udp + 1);
 		} else {
 			th = (struct tcphdr *)(ip + 1);
 		}
 		tcpip_fillheaders(inp, tp->t_port, ip, th);
 	}
 	/*
 	 * If we are doing retransmissions, then snd_nxt will not reflect
 	 * the first unsent octet.  For ACK only packets, we do not want the
 	 * sequence number of the retransmitted packet, we want the sequence
 	 * number of the next unsent octet.  So, if there is no data (and no
 	 * SYN or FIN), use snd_max instead of snd_nxt when filling in
 	 * ti_seq.  But if we are in persist state, snd_max might reflect
 	 * one byte beyond the right edge of the window, so use snd_nxt in
 	 * that case, since we know we aren't doing a retransmission.
 	 * (retransmit and persist are mutually exclusive...)
 	 */
 	if (sack_rxmit == 0) {
 		if (len && ((flags & (TH_FIN | TH_SYN | TH_RST)) == 0)) {
 			/* New data (including new persists) */
 			th->th_seq = htonl(tp->snd_max);
 			bbr_seq = tp->snd_max;
 		} else if (flags & TH_SYN) {
 			/* Syn's always send from iss */
 			th->th_seq = htonl(tp->iss);
 			bbr_seq = tp->iss;
 		} else if (flags & TH_FIN) {
 			if (flags & TH_FIN && tp->t_flags & TF_SENTFIN) {
 				/*
 				 * If we sent the fin already its 1 minus
 				 * snd_max
 				 */
 				th->th_seq = (htonl(tp->snd_max - 1));
 				bbr_seq = (tp->snd_max - 1);
 			} else {
 				/* First time FIN use snd_max */
 				th->th_seq = htonl(tp->snd_max);
 				bbr_seq = tp->snd_max;
 			}
 		} else {
 			/*
 			 * len == 0 and not persist we use snd_max, sending
 			 * an ack unless we have sent the fin then its 1
 			 * minus.
 			 */
 			/*
 			 * XXXRRS Question if we are in persists and we have
 			 * nothing outstanding to send and we have not sent
 			 * a FIN, we will send an ACK. In such a case it
 			 * might be better to send (tp->snd_una - 1) which
 			 * would force the peer to ack.
 			 */
 			if (tp->t_flags & TF_SENTFIN) {
 				th->th_seq = htonl(tp->snd_max - 1);
 				bbr_seq = (tp->snd_max - 1);
 			} else {
 				th->th_seq = htonl(tp->snd_max);
 				bbr_seq = tp->snd_max;
 			}
 		}
 	} else {
 		/* All retransmits use the rsm to guide the send */
 		th->th_seq = htonl(rsm->r_start);
 		bbr_seq = rsm->r_start;
 	}
 	th->th_ack = htonl(tp->rcv_nxt);
 	if (optlen) {
 		bcopy(opt, th + 1, optlen);
 		th->th_off = (sizeof(struct tcphdr) + optlen) >> 2;
 	}
 	tcp_set_flags(th, flags);
 	/*
 	 * Calculate receive window.  Don't shrink window, but avoid silly
 	 * window syndrome.
 	 */
 	if ((flags & TH_RST) || ((recwin < (so->so_rcv.sb_hiwat / 4) &&
 				  recwin < maxseg)))
 		recwin = 0;
 	if (SEQ_GT(tp->rcv_adv, tp->rcv_nxt) &&
 	    recwin < (tp->rcv_adv - tp->rcv_nxt))
 		recwin = (tp->rcv_adv - tp->rcv_nxt);
 	if (recwin > TCP_MAXWIN << tp->rcv_scale)
 		recwin = TCP_MAXWIN << tp->rcv_scale;
 
 	/*
 	 * According to RFC1323 the window field in a SYN (i.e., a <SYN> or
 	 * <SYN,ACK>) segment itself is never scaled.  The <SYN,ACK> case is
 	 * handled in syncache.
 	 */
 	if (flags & TH_SYN)
 		th->th_win = htons((u_short)
 		    (min(sbspace(&so->so_rcv), TCP_MAXWIN)));
 	else {
 		/* Avoid shrinking window with window scaling. */
 		recwin = roundup2(recwin, 1 << tp->rcv_scale);
 		th->th_win = htons((u_short)(recwin >> tp->rcv_scale));
 	}
 	/*
 	 * Adjust the RXWIN0SENT flag - indicate that we have advertised a 0
 	 * window.  This may cause the remote transmitter to stall.  This
 	 * flag tells soreceive() to disable delayed acknowledgements when
 	 * draining the buffer.  This can occur if the receiver is
 	 * attempting to read more data than can be buffered prior to
 	 * transmitting on the connection.
 	 */
 	if (th->th_win == 0) {
 		tp->t_sndzerowin++;
 		tp->t_flags |= TF_RXWIN0SENT;
 	} else
 		tp->t_flags &= ~TF_RXWIN0SENT;
 	/*
 	 * We don't support urgent data, but drag along
 	 * the pointer in case of a stack switch.
 	 */
 	tp->snd_up = tp->snd_una;
 
 #if defined(IPSEC_SUPPORT) || defined(TCP_SIGNATURE)
 	if (to.to_flags & TOF_SIGNATURE) {
 		/*
 		 * Calculate MD5 signature and put it into the place
 		 * determined before. NOTE: since TCP options buffer doesn't
 		 * point into mbuf's data, calculate offset and use it.
 		 */
 		if (!TCPMD5_ENABLED() || TCPMD5_OUTPUT(m, th,
 		    (u_char *)(th + 1) + (to.to_signature - opt)) != 0) {
 			/*
 			 * Do not send segment if the calculation of MD5
 			 * digest has failed.
 			 */
 			goto out;
 		}
 	}
 #endif
 
 	/*
 	 * Put TCP length in extended header, and then checksum extended
 	 * header and data.
 	 */
 	m->m_pkthdr.len = hdrlen + len;	/* in6_cksum() need this */
 #ifdef INET6
 	if (isipv6) {
 		/*
 		 * ip6_plen is not need to be filled now, and will be filled
 		 * in ip6_output.
 		 */
 		if (tp->t_port) {
 			m->m_pkthdr.csum_flags = CSUM_UDP_IPV6;
 			m->m_pkthdr.csum_data = offsetof(struct udphdr, uh_sum);
 			udp->uh_sum = in6_cksum_pseudo(ip6, ulen, IPPROTO_UDP, 0);
 			th->th_sum = htons(0);
 			UDPSTAT_INC(udps_opackets);
 		} else {
 			csum_flags = m->m_pkthdr.csum_flags = CSUM_TCP_IPV6;
 			m->m_pkthdr.csum_data = offsetof(struct tcphdr, th_sum);
 			th->th_sum = in6_cksum_pseudo(ip6, sizeof(struct tcphdr) +
 			    optlen + len, IPPROTO_TCP, 0);
 		}
 	}
 #endif
 #if defined(INET6) && defined(INET)
 	else
 #endif
 #ifdef INET
 	{
 		if (tp->t_port) {
 			m->m_pkthdr.csum_flags = CSUM_UDP;
 			m->m_pkthdr.csum_data = offsetof(struct udphdr, uh_sum);
 			udp->uh_sum = in_pseudo(ip->ip_src.s_addr,
 			    ip->ip_dst.s_addr, htons(ulen + IPPROTO_UDP));
 			th->th_sum = htons(0);
 			UDPSTAT_INC(udps_opackets);
 		} else {
 			csum_flags = m->m_pkthdr.csum_flags = CSUM_TCP;
 			m->m_pkthdr.csum_data = offsetof(struct tcphdr, th_sum);
 			th->th_sum = in_pseudo(ip->ip_src.s_addr,
 			    ip->ip_dst.s_addr, htons(sizeof(struct tcphdr) +
 			    IPPROTO_TCP + len + optlen));
 		}
 		/* IP version must be set here for ipv4/ipv6 checking later */
 		KASSERT(ip->ip_v == IPVERSION,
 		    ("%s: IP version incorrect: %d", __func__, ip->ip_v));
 	}
 #endif
 
 	/*
 	 * Enable TSO and specify the size of the segments. The TCP pseudo
 	 * header checksum is always provided. XXX: Fixme: This is currently
 	 * not the case for IPv6.
 	 */
 	if (tso) {
 		KASSERT(len > maxseg,
 		    ("%s: len:%d <= tso_segsz:%d", __func__, len, maxseg));
 		m->m_pkthdr.csum_flags |= CSUM_TSO;
 		csum_flags |= CSUM_TSO;
 		m->m_pkthdr.tso_segsz = maxseg;
 	}
 	KASSERT(len + hdrlen == m_length(m, NULL),
 	    ("%s: mbuf chain different than expected: %d + %u != %u",
 	    __func__, len, hdrlen, m_length(m, NULL)));
 
 #ifdef TCP_HHOOK
 	/* Run HHOOK_TC_ESTABLISHED_OUT helper hooks. */
 	hhook_run_tcp_est_out(tp, th, &to, len, tso);
 #endif
 
 	/* Log to the black box */
 	if (tcp_bblogging_on(tp)) {
 		union tcp_log_stackspecific log;
 
 		bbr_fill_in_logging_data(bbr, &log.u_bbr, cts);
 		/* Record info on type of transmission */
 		log.u_bbr.flex1 = bbr->r_ctl.rc_hptsi_agg_delay;
 		log.u_bbr.flex2 = (bbr->r_recovery_bw << 3);
 		log.u_bbr.flex3 = maxseg;
 		log.u_bbr.flex4 = delay_calc;
 		log.u_bbr.flex5 = bbr->rc_past_init_win;
 		log.u_bbr.flex5 <<= 1;
 		log.u_bbr.flex5 |= bbr->rc_no_pacing;
 		log.u_bbr.flex5 <<= 29;
 		log.u_bbr.flex5 |= tp->t_maxseg;
 		log.u_bbr.flex6 = bbr->r_ctl.rc_pace_max_segs;
 		log.u_bbr.flex7 = (bbr->rc_bbr_state << 8) | bbr_state_val(bbr);
 		/* lets poke in the low and the high here for debugging */
 		log.u_bbr.pkts_out = bbr->rc_tp->t_maxseg;
 		if (rsm || sack_rxmit) {
 			if (doing_tlp)
 				log.u_bbr.flex8 = 2;
 			else
 				log.u_bbr.flex8 = 1;
 		} else {
 			log.u_bbr.flex8 = 0;
 		}
 		lgb = tcp_log_event(tp, th, &so->so_rcv, &so->so_snd, TCP_LOG_OUT, ERRNO_UNK,
 		    len, &log, false, NULL, NULL, 0, tv);
 	} else {
 		lgb = NULL;
 	}
 	/*
 	 * Fill in IP length and desired time to live and send to IP level.
 	 * There should be a better way to handle ttl and tos; we could keep
 	 * them in the template, but need a way to checksum without them.
 	 */
 	/*
 	 * m->m_pkthdr.len should have been set before cksum calcuration,
 	 * because in6_cksum() need it.
 	 */
 #ifdef INET6
 	if (isipv6) {
 		/*
 		 * we separately set hoplimit for every segment, since the
 		 * user might want to change the value via setsockopt. Also,
 		 * desired default hop limit might be changed via Neighbor
 		 * Discovery.
 		 */
 		ip6->ip6_hlim = in6_selecthlim(inp, NULL);
 
 		/*
 		 * Set the packet size here for the benefit of DTrace
 		 * probes. ip6_output() will set it properly; it's supposed
 		 * to include the option header lengths as well.
 		 */
 		ip6->ip6_plen = htons(m->m_pkthdr.len - sizeof(*ip6));
 
 		if (V_path_mtu_discovery && maxseg > V_tcp_minmss)
 			tp->t_flags2 |= TF2_PLPMTU_PMTUD;
 		else
 			tp->t_flags2 &= ~TF2_PLPMTU_PMTUD;
 
 		if (tp->t_state == TCPS_SYN_SENT)
 			TCP_PROBE5(connect__request, NULL, tp, ip6, tp, th);
 
 		TCP_PROBE5(send, NULL, tp, ip6, tp, th);
 		/* TODO: IPv6 IP6TOS_ECT bit on */
 		error = ip6_output(m, inp->in6p_outputopts,
 		    &inp->inp_route6,
 		    ((rsm || sack_rxmit) ? IP_NO_SND_TAG_RL : 0),
 		    NULL, NULL, inp);
 
 		if (error == EMSGSIZE && inp->inp_route6.ro_nh != NULL)
 			mtu = inp->inp_route6.ro_nh->nh_mtu;
 	}
 #endif				/* INET6 */
 #if defined(INET) && defined(INET6)
 	else
 #endif
 #ifdef INET
 	{
 		ip->ip_len = htons(m->m_pkthdr.len);
 #ifdef INET6
 		if (isipv6)
 			ip->ip_ttl = in6_selecthlim(inp, NULL);
 #endif				/* INET6 */
 		/*
 		 * If we do path MTU discovery, then we set DF on every
 		 * packet. This might not be the best thing to do according
 		 * to RFC3390 Section 2. However the tcp hostcache migitates
 		 * the problem so it affects only the first tcp connection
 		 * with a host.
 		 *
 		 * NB: Don't set DF on small MTU/MSS to have a safe
 		 * fallback.
 		 */
 		if (V_path_mtu_discovery && tp->t_maxseg > V_tcp_minmss) {
 			tp->t_flags2 |= TF2_PLPMTU_PMTUD;
 			if (tp->t_port == 0 || len < V_tcp_minmss) {
 				ip->ip_off |= htons(IP_DF);
 			}
 		} else {
 			tp->t_flags2 &= ~TF2_PLPMTU_PMTUD;
 		}
 
 		if (tp->t_state == TCPS_SYN_SENT)
 			TCP_PROBE5(connect__request, NULL, tp, ip, tp, th);
 
 		TCP_PROBE5(send, NULL, tp, ip, tp, th);
 
 		error = ip_output(m, inp->inp_options, &inp->inp_route,
 		    ((rsm || sack_rxmit) ? IP_NO_SND_TAG_RL : 0), 0,
 		    inp);
 		if (error == EMSGSIZE && inp->inp_route.ro_nh != NULL)
 			mtu = inp->inp_route.ro_nh->nh_mtu;
 	}
 #endif				/* INET */
 out:
 
 	if (lgb) {
 		lgb->tlb_errno = error;
 		lgb = NULL;
 	}
 	/*
 	 * In transmit state, time the transmission and arrange for the
 	 * retransmit.  In persist state, just set snd_max.
 	 */
 	if (error == 0) {
 		tcp_account_for_send(tp, len, (rsm != NULL), doing_tlp, hw_tls);
 		if (TCPS_HAVEESTABLISHED(tp->t_state) &&
 		    (tp->t_flags & TF_SACK_PERMIT) &&
 		    tp->rcv_numsacks > 0)
 			tcp_clean_dsack_blocks(tp);
 		/* We sent an ack clear the bbr_segs_rcvd count */
 		bbr->output_error_seen = 0;
 		bbr->oerror_cnt = 0;
 		bbr->bbr_segs_rcvd = 0;
 		if (len == 0)
 			counter_u64_add(bbr_out_size[TCP_MSS_ACCT_SNDACK], 1);
 		/* Do accounting for new sends */
 		if ((len > 0) && (rsm == NULL)) {
 			int idx;
 			if (tp->snd_una == tp->snd_max) {
 				/*
 				 * Special case to match google, when
 				 * nothing is in flight the delivered
 				 * time does get updated to the current
 				 * time (see tcp_rate_bsd.c).
 				 */
 				bbr->r_ctl.rc_del_time = cts;
 			}
 			if (len >= maxseg) {
 				idx = (len / maxseg) + 3;
 				if (idx >= TCP_MSS_ACCT_ATIMER)
 					counter_u64_add(bbr_out_size[(TCP_MSS_ACCT_ATIMER - 1)], 1);
 				else
 					counter_u64_add(bbr_out_size[idx], 1);
 			} else {
 				/* smaller than a MSS */
 				idx = len / (bbr_hptsi_bytes_min - bbr->rc_last_options);
 				if (idx >= TCP_MSS_SMALL_MAX_SIZE_DIV)
 					idx = (TCP_MSS_SMALL_MAX_SIZE_DIV - 1);
 				counter_u64_add(bbr_out_size[(idx + TCP_MSS_SMALL_SIZE_OFF)], 1);
 			}
 		}
 	}
 	abandon = 0;
 	/*
 	 * We must do the send accounting before we log the output,
 	 * otherwise the state of the rsm could change and we account to the
 	 * wrong bucket.
 	 */
 	if (len > 0) {
 		bbr_do_send_accounting(tp, bbr, rsm, len, error);
 		if (error == 0) {
 			if (tp->snd_una == tp->snd_max)
 				bbr->r_ctl.rc_tlp_rxt_last_time = cts;
 		}
 	}
 	bbr_log_output(bbr, tp, &to, len, bbr_seq, (uint8_t) flags, error,
 	    cts, mb, &abandon, rsm, 0, sb);
 	if (abandon) {
 		/*
 		 * If bbr_log_output destroys the TCB or sees a TH_RST being
 		 * sent we should hit this condition.
 		 */
 		return (0);
 	}
 	if (bbr->rc_in_persist == 0) {
 		/*
 		 * Advance snd_nxt over sequence space of this segment.
 		 */
 		if (error)
 			/* We don't log or do anything with errors */
 			goto skip_upd;
 
 		if (tp->snd_una == tp->snd_max &&
 		    (len || (flags & (TH_SYN | TH_FIN)))) {
 			/*
 			 * Update the time we just added data since none was
 			 * outstanding.
 			 */
 			bbr_log_progress_event(bbr, tp, ticks, PROGRESS_START, __LINE__);
 			bbr->rc_tp->t_acktime  = ticks;
 		}
 		if (flags & (TH_SYN | TH_FIN) && (rsm == NULL)) {
 			if (flags & TH_SYN) {
 				/*
 				 * Smack the snd_max to iss + 1
 				 * if its a FO we will add len below.
 				 */
 				tp->snd_max = tp->iss + 1;
 			}
 			if ((flags & TH_FIN) && ((tp->t_flags & TF_SENTFIN) == 0)) {
 				tp->snd_max++;
 				tp->t_flags |= TF_SENTFIN;
 			}
 		}
 		if (sack_rxmit == 0)
 			tp->snd_max += len;
 skip_upd:
 		if ((error == 0) && len)
 			tot_len += len;
 	} else {
 		/* Persists case */
 		int32_t xlen = len;
 
 		if (error)
 			goto nomore;
 
 		if (flags & TH_SYN)
 			++xlen;
 		if ((flags & TH_FIN) && ((tp->t_flags & TF_SENTFIN) == 0)) {
 			++xlen;
 			tp->t_flags |= TF_SENTFIN;
 		}
 		if (xlen && (tp->snd_una == tp->snd_max)) {
 			/*
 			 * Update the time we just added data since none was
 			 * outstanding.
 			 */
 			bbr_log_progress_event(bbr, tp, ticks, PROGRESS_START, __LINE__);
 			bbr->rc_tp->t_acktime = ticks;
 		}
 		if (sack_rxmit == 0)
 			tp->snd_max += xlen;
 		tot_len += (len + optlen + ipoptlen);
 	}
 nomore:
 	if (error) {
 		/*
 		 * Failures do not advance the seq counter above. For the
 		 * case of ENOBUFS we will fall out and become ack-clocked.
 		 * capping the cwnd at the current flight.
 		 * Everything else will just have to retransmit with the timer
 		 * (no pacer).
 		 */
 		SOCKBUF_UNLOCK_ASSERT(sb);
 		BBR_STAT_INC(bbr_saw_oerr);
 		/* Clear all delay/early tracks */
 		bbr->r_ctl.rc_hptsi_agg_delay = 0;
 		bbr->r_ctl.rc_agg_early = 0;
 		bbr->r_agg_early_set = 0;
 		bbr->output_error_seen = 1;
 		if (bbr->oerror_cnt < 0xf)
 			bbr->oerror_cnt++;
 		if (bbr_max_net_error_cnt && (bbr->oerror_cnt >= bbr_max_net_error_cnt)) {
 			/* drop the session */
 			return (-ENETDOWN);
 		}
 		switch (error) {
 		case ENOBUFS:
 			/*
 			 * Make this guy have to get ack's to send
 			 * more but lets make sure we don't
 			 * slam him below a T-O (1MSS).
 			 */
 			if (bbr->rc_bbr_state != BBR_STATE_PROBE_RTT) {
 				tp->snd_cwnd = ctf_flight_size(tp, (bbr->r_ctl.rc_sacked +
 								    bbr->r_ctl.rc_lost_bytes)) - maxseg;
 				if (tp->snd_cwnd < maxseg)
 					tp->snd_cwnd = maxseg;
 			}
 			slot = (bbr_error_base_paceout + 1) << bbr->oerror_cnt;
 			BBR_STAT_INC(bbr_saw_enobuf);
 			if (bbr->bbr_hdrw_pacing)
 				counter_u64_add(bbr_hdwr_pacing_enobuf, 1);
 			else
 				counter_u64_add(bbr_nohdwr_pacing_enobuf, 1);
 			/*
 			 * Here even in the enobuf's case we want to do our
 			 * state update. The reason being we may have been
 			 * called by the input function. If so we have had
 			 * things change.
 			 */
 			error = 0;
 			goto enobufs;
 		case EMSGSIZE:
 			/*
 			 * For some reason the interface we used initially
 			 * to send segments changed to another or lowered
 			 * its MTU. If TSO was active we either got an
 			 * interface without TSO capabilits or TSO was
 			 * turned off. If we obtained mtu from ip_output()
 			 * then update it and try again.
 			 */
 			/* Turn on tracing (or try to) */
 			{
 				int old_maxseg;
 
 				old_maxseg = tp->t_maxseg;
 				BBR_STAT_INC(bbr_saw_emsgsiz);
 				bbr_log_msgsize_fail(bbr, tp, len, maxseg, mtu, csum_flags, tso, cts);
 				if (mtu != 0)
 					tcp_mss_update(tp, -1, mtu, NULL, NULL);
 				if (old_maxseg <= tp->t_maxseg) {
 					/* Huh it did not shrink? */
 					tp->t_maxseg = old_maxseg - 40;
 					bbr_log_msgsize_fail(bbr, tp, len, maxseg, mtu, 0, tso, cts);
 				}
 				/*
 				 * Nuke all other things that can interfere
 				 * with slot
 				 */
 				if ((tot_len + len) && (len >= tp->t_maxseg)) {
 					slot = bbr_get_pacing_delay(bbr,
 					    bbr->r_ctl.rc_bbr_hptsi_gain,
 					    (tot_len + len), cts, 0);
 					if (slot < bbr_error_base_paceout)
 						slot = (bbr_error_base_paceout + 2) << bbr->oerror_cnt;
 				} else
 					slot = (bbr_error_base_paceout + 2) << bbr->oerror_cnt;
 				bbr->rc_output_starts_timer = 1;
 				bbr_start_hpts_timer(bbr, tp, cts, 10, slot,
 				    tot_len);
 				return (error);
 			}
 		case EPERM:
 			tp->t_softerror = error;
-			/* Fall through */
+			/* FALLTHROUGH */
 		case EHOSTDOWN:
 		case EHOSTUNREACH:
 		case ENETDOWN:
 		case ENETUNREACH:
 			if (TCPS_HAVERCVDSYN(tp->t_state)) {
 				tp->t_softerror = error;
 			}
 			/* FALLTHROUGH */
 		default:
 			slot = (bbr_error_base_paceout + 3) << bbr->oerror_cnt;
 			bbr->rc_output_starts_timer = 1;
 			bbr_start_hpts_timer(bbr, tp, cts, 11, slot, 0);
 			return (error);
 		}
 #ifdef STATS
 	} else if (((tp->t_flags & TF_GPUTINPROG) == 0) &&
 		    len &&
 		    (rsm == NULL) &&
 	    (bbr->rc_in_persist == 0)) {
 		tp->gput_seq = bbr_seq;
 		tp->gput_ack = bbr_seq +
 		    min(sbavail(&so->so_snd) - sb_offset, sendwin);
 		tp->gput_ts = cts;
 		tp->t_flags |= TF_GPUTINPROG;
 #endif
 	}
 	KMOD_TCPSTAT_INC(tcps_sndtotal);
 	if ((bbr->bbr_hdw_pace_ena) &&
 	    (bbr->bbr_attempt_hdwr_pace == 0) &&
 	    (bbr->rc_past_init_win) &&
 	    (bbr->rc_bbr_state != BBR_STATE_STARTUP) &&
 	    (get_filter_value(&bbr->r_ctl.rc_delrate)) &&
 	    (inp->inp_route.ro_nh &&
 	     inp->inp_route.ro_nh->nh_ifp)) {
 		/*
 		 * We are past the initial window and
 		 * have at least one measurement so we
 		 * could use hardware pacing if its available.
 		 * We have an interface and we have not attempted
 		 * to setup hardware pacing, lets try to now.
 		 */
 		uint64_t rate_wanted;
 		int err = 0;
 
 		rate_wanted = bbr_get_hardware_rate(bbr);
 		bbr->bbr_attempt_hdwr_pace = 1;
 		bbr->r_ctl.crte = tcp_set_pacing_rate(bbr->rc_tp,
 						      inp->inp_route.ro_nh->nh_ifp,
 						      rate_wanted,
 						      (RS_PACING_GEQ|RS_PACING_SUB_OK),
 						      &err, NULL);
 		if (bbr->r_ctl.crte) {
 			bbr_type_log_hdwr_pacing(bbr,
 						 bbr->r_ctl.crte->ptbl->rs_ifp,
 						 rate_wanted,
 						 bbr->r_ctl.crte->rate,
 						 __LINE__, cts, err);
 			BBR_STAT_INC(bbr_hdwr_rl_add_ok);
 			counter_u64_add(bbr_flows_nohdwr_pacing, -1);
 			counter_u64_add(bbr_flows_whdwr_pacing, 1);
 			bbr->bbr_hdrw_pacing = 1;
 			/* Now what is our gain status? */
 			if (bbr->r_ctl.crte->rate < rate_wanted) {
 				/* We have a problem */
 				bbr_setup_less_of_rate(bbr, cts,
 						       bbr->r_ctl.crte->rate, rate_wanted);
 			} else {
 				/* We are good */
 				bbr->gain_is_limited = 0;
 				bbr->skip_gain = 0;
 			}
 			tcp_bbr_tso_size_check(bbr, cts);
 		} else {
 			bbr_type_log_hdwr_pacing(bbr,
 						 inp->inp_route.ro_nh->nh_ifp,
 						 rate_wanted,
 						 0,
 						 __LINE__, cts, err);
 			BBR_STAT_INC(bbr_hdwr_rl_add_fail);
 		}
 	}
 	if (bbr->bbr_hdrw_pacing) {
 		/*
 		 * Worry about cases where the route
 		 * changes or something happened that we
 		 * lost our hardware pacing possibly during
 		 * the last ip_output call.
 		 */
 		if (inp->inp_snd_tag == NULL) {
 			/* A change during ip output disabled hw pacing? */
 			bbr->bbr_hdrw_pacing = 0;
 		} else if ((inp->inp_route.ro_nh == NULL) ||
 		    (inp->inp_route.ro_nh->nh_ifp != inp->inp_snd_tag->ifp)) {
 			/*
 			 * We had an interface or route change,
 			 * detach from the current hdwr pacing
 			 * and setup to re-attempt next go
 			 * round.
 			 */
 			bbr->bbr_hdrw_pacing = 0;
 			bbr->bbr_attempt_hdwr_pace = 0;
 			tcp_rel_pacing_rate(bbr->r_ctl.crte, bbr->rc_tp);
 			tcp_bbr_tso_size_check(bbr, cts);
 		}
 	}
 	/*
 	 * Data sent (as far as we can tell). If this advertises a larger
 	 * window than any other segment, then remember the size of the
 	 * advertised window. Any pending ACK has now been sent.
 	 */
 	if (SEQ_GT(tp->rcv_nxt + recwin, tp->rcv_adv))
 		tp->rcv_adv = tp->rcv_nxt + recwin;
 
 	tp->last_ack_sent = tp->rcv_nxt;
 	if ((error == 0) &&
 	    (bbr->r_ctl.rc_pace_max_segs > tp->t_maxseg) &&
 	    (doing_tlp == 0) &&
 	    (tso == 0) &&
 	    (len > 0) &&
 	    ((flags & TH_RST) == 0) &&
 	    ((flags & TH_SYN) == 0) &&
 	    (IN_RECOVERY(tp->t_flags) == 0) &&
 	    (bbr->rc_in_persist == 0) &&
 	    (tot_len < bbr->r_ctl.rc_pace_max_segs)) {
 		/*
 		 * For non-tso we need to goto again until we have sent out
 		 * enough data to match what we are hptsi out every hptsi
 		 * interval.
 		 */
 		if (SEQ_LT(tp->snd_nxt, tp->snd_max)) {
 			/* Make sure snd_nxt is drug up */
 			tp->snd_nxt = tp->snd_max;
 		}
 		if (rsm != NULL) {
 			rsm = NULL;
 			goto skip_again;
 		}
 		rsm = NULL;
 		sack_rxmit = 0;
 		tp->t_flags &= ~(TF_ACKNOW | TF_DELACK);
 		goto again;
 	}
 skip_again:
 	if ((error == 0) && (flags & TH_FIN))
 		tcp_log_end_status(tp, TCP_EI_STATUS_SERVER_FIN);
 	if ((error == 0) && (flags & TH_RST))
 		tcp_log_end_status(tp, TCP_EI_STATUS_SERVER_RST);
 	if (((flags & (TH_RST | TH_SYN | TH_FIN)) == 0) && tot_len) {
 		/*
 		 * Calculate/Re-Calculate the hptsi slot in usecs based on
 		 * what we have sent so far
 		 */
 		slot = bbr_get_pacing_delay(bbr, bbr->r_ctl.rc_bbr_hptsi_gain, tot_len, cts, 0);
 		if (bbr->rc_no_pacing)
 			slot = 0;
 	}
 	tp->t_flags &= ~(TF_ACKNOW | TF_DELACK);
 enobufs:
 	if (bbr->rc_use_google == 0)
 		bbr_check_bbr_for_state(bbr, cts, __LINE__, 0);
 	bbr_cwnd_limiting(tp, bbr, ctf_flight_size(tp, (bbr->r_ctl.rc_sacked +
 							bbr->r_ctl.rc_lost_bytes)));
 	bbr->rc_output_starts_timer = 1;
 	if (bbr->bbr_use_rack_cheat &&
 	    (more_to_rxt ||
 	     ((bbr->r_ctl.rc_resend = bbr_check_recovery_mode(tp, bbr, cts)) != NULL))) {
 		/* Rack cheats and shotguns out all rxt's 1ms apart */
 		if (slot > 1000)
 			slot = 1000;
 	}
 	if (bbr->bbr_hdrw_pacing && (bbr->hw_pacing_set == 0)) {
 		/*
 		 * We don't change the tso size until some number of sends
 		 * to give the hardware commands time to get down
 		 * to the interface.
 		 */
 		bbr->r_ctl.bbr_hdwr_cnt_noset_snt++;
 		if (bbr->r_ctl.bbr_hdwr_cnt_noset_snt >= bbr_hdwr_pacing_delay_cnt) {
 			bbr->hw_pacing_set = 1;
 			tcp_bbr_tso_size_check(bbr, cts);
 		}
 	}
 	bbr_start_hpts_timer(bbr, tp, cts, 12, slot, tot_len);
 	if (SEQ_LT(tp->snd_nxt, tp->snd_max)) {
 		/* Make sure snd_nxt is drug up */
 		tp->snd_nxt = tp->snd_max;
 	}
 	return (error);
 
 }
 
 /*
  * See bbr_output_wtime() for return values.
  */
 static int
 bbr_output(struct tcpcb *tp)
 {
 	int32_t ret;
 	struct timeval tv;
 
 	NET_EPOCH_ASSERT();
 
 	INP_WLOCK_ASSERT(tptoinpcb(tp));
 	(void)tcp_get_usecs(&tv);
 	ret = bbr_output_wtime(tp, &tv);
 	return (ret);
 }
 
 /*
  * MTU-change hook.  Two things happen:
  *   a) the SACK filter is cleared, and
  *   b) every un-acked send-map entry larger than the current segment size
  *      (t_maxseg less the last option length) is flagged BBR_SACK_PASSED so
  *      that it gets retransmitted; entries bbr_is_lost() agrees are lost are
  *      also accounted as lost.
  * The first oversized entry found becomes the next thing to resend.
  */
 static void
 bbr_mtu_chg(struct tcpcb *tp)
 {
 	struct tcp_bbr *bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	struct bbr_sendmap *rsm;
 	struct bbr_sendmap *first_oversized = NULL;
 	uint32_t seg_limit;
 
 	seg_limit = tp->t_maxseg - bbr->rc_last_options;
 	sack_filter_clear(&bbr->r_ctl.bbr_sf, tp->snd_una);
 
 	TAILQ_FOREACH(rsm, &bbr->r_ctl.rc_map, r_next) {
 		/* Leave anything already acked (e.g. via SACK) alone. */
 		if (rsm->r_flags & BBR_ACKED)
 			continue;
 		/* Entries that still fit in one segment need no action. */
 		if ((rsm->r_end - rsm->r_start) <= seg_limit)
 			continue;
 
 		/* Too big for the new MTU: force a retransmit. */
 		rsm->r_flags |= BBR_SACK_PASSED;
 		if (!(rsm->r_flags & BBR_MARKED_LOST) &&
 		    bbr_is_lost(bbr, rsm, bbr->r_ctl.rc_rcvtime)) {
 			bbr->r_ctl.rc_lost_bytes += rsm->r_end - rsm->r_start;
 			bbr->r_ctl.rc_lost += rsm->r_end - rsm->r_start;
 			rsm->r_flags |= BBR_MARKED_LOST;
 		}
 		if (first_oversized == NULL)
 			first_oversized = rsm;
 	}
 
 	if (first_oversized != NULL)
 		bbr->r_ctl.rc_resend = first_oversized;
 }
 
 /*
  * pru-options hook: out-of-band requests (PRUS_OOB) are refused with
  * EOPNOTSUPP; every other flag combination is accepted (0).
  */
 static int
 bbr_pru_options(struct tcpcb *tp, int flags)
 {
 	return ((flags & PRUS_OOB) != 0 ? EOPNOTSUPP : 0);
 }
 
 static void
 bbr_switch_failed(struct tcpcb *tp)
 {
 	/*
 	 * If a switch fails we only need to
 	 * make sure mbuf_queuing is still in place.
 	 * We also need to make sure we are still in
 	 * ticks granularity (though we should probably
 	 * change bbr to go to USECs).
 	 *
 	 * For timers we need to see if we are still in the
 	 * pacer (if our flags are up) if so we are good, if
 	 * not we need to get back into the pacer.
 	 */
 	struct timeval tv;
 	uint32_t cts;
 	uint32_t toval;
 	struct tcp_bbr *bbr;
 	struct hpts_diag diag;
 
 	tp->t_flags2 |= TF2_CANNOT_DO_ECN;
 	tp->t_flags2 |= TF2_SUPPORTS_MBUFQ;
 	tcp_change_time_units(tp, TCP_TMR_GRANULARITY_TICKS);
 	if (tp->t_in_hpts > IHPTS_NONE) {
 		return;
 	}
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	cts = tcp_get_usecs(&tv);
 	if (bbr->r_ctl.rc_hpts_flags & PACE_PKT_OUTPUT) {
 		if (TSTMP_GT(bbr->rc_pacer_started, cts)) {
 			toval = bbr->rc_pacer_started - cts;
 		} else {
 			/* one slot please */
 			toval = HPTS_TICKS_PER_SLOT;
 		}
 	} else if (bbr->r_ctl.rc_hpts_flags & PACE_TMR_MASK) {
 		if (TSTMP_GT(bbr->r_ctl.rc_timer_exp, cts)) {
 			toval = bbr->r_ctl.rc_timer_exp - cts;
 		} else {
 			/* one slot please */
 			toval = HPTS_TICKS_PER_SLOT;
 		}
 	} else
 		toval = HPTS_TICKS_PER_SLOT;
 	(void)tcp_hpts_insert_diag(tp, HPTS_USEC_TO_SLOTS(toval),
 				   __LINE__, &diag);
 	bbr_log_hpts_diag(bbr, cts, &diag);
 }
 
 /*
  * Function block describing this stack to the TCP stack-switching
  * framework.  Entries are grouped by role; designated initializers make
  * the ordering irrelevant to the resulting object.
  */
 struct tcp_function_block __tcp_bbr = {
 	/* Identity and capabilities. */
 	.tfb_tcp_block_name = __XSTRING(STACKNAME),
 	.tfb_flags = TCP_FUNC_OUTPUT_CANDROP,
 
 	/* Lifecycle and stack switching. */
 	.tfb_tcp_fb_init = bbr_init,
 	.tfb_tcp_fb_fini = bbr_fini,
 	.tfb_tcp_handoff_ok = bbr_handoff_ok,
 	.tfb_switch_failed = bbr_switch_failed,
 
 	/* Data path. */
 	.tfb_tcp_output = bbr_output,
 	.tfb_tcp_do_segment = bbr_do_segment,
 	.tfb_do_segment_nounlock = bbr_do_segment_nounlock,
 	.tfb_do_queued_segments = ctf_do_queued_segments,
 
 	/* Timers. */
 	.tfb_tcp_timer_stop_all = bbr_stopall,
 	.tfb_tcp_rexmit_tmr = bbr_remxt_tmr,
 
 	/* Control path. */
 	.tfb_tcp_ctloutput = bbr_ctloutput,
 	.tfb_pru_options = bbr_pru_options,
 	.tfb_tcp_mtu_chg = bbr_mtu_chg,
 };
 
 /*
  * Handle a SOPT_SET request for this stack.
  *
  * Options at the IP/IPv6 level, and TCP options this stack does not own,
  * are forwarded to tcp_default_ctloutput().  For the options handled here
  * the function is entered with the inpcb write-locked; it drops that lock
  * around sooptcopyin() and, after re-acquiring it, revalidates that the
  * connection has not been dropped and is still using this stack before
  * touching any BBR state.  Every path through this function itself
  * releases the inpcb lock before returning.
  *
  * All options are a single int32_t.  Range checks that only test an upper
  * bound also reject negative values: optval is signed, so without that a
  * negative value would pass the check and then be multiplied, stored into
  * a control field, or tested as a bit mask.
  *
  * Returns 0 on success or an errno value (EINVAL for out-of-range values,
  * EBUSY, ECONNRESET, ENOPROTOOPT, or a copyin failure).
  */
 static int
 bbr_set_sockopt(struct tcpcb *tp, struct sockopt *sopt)
 {
 	struct epoch_tracker et;
 	struct inpcb *inp = tptoinpcb(tp);
 	struct tcp_bbr *bbr;
 	int32_t error = 0, optval;
 
 	switch (sopt->sopt_level) {
 	case IPPROTO_IPV6:
 	case IPPROTO_IP:
 		return (tcp_default_ctloutput(tp, sopt));
 	}
 
 	/* First pass: decide whether the option is ours at all. */
 	switch (sopt->sopt_name) {
 	case TCP_RACK_PACE_MAX_SEG:
 	case TCP_RACK_MIN_TO:
 	case TCP_RACK_REORD_THRESH:
 	case TCP_RACK_REORD_FADE:
 	case TCP_RACK_TLP_THRESH:
 	case TCP_RACK_PKT_DELAY:
 	case TCP_BBR_ALGORITHM:
 	case TCP_BBR_TSLIMITS:
 	case TCP_BBR_IWINTSO:
 	case TCP_BBR_RECFORCE:
 	case TCP_BBR_STARTUP_PG:
 	case TCP_BBR_DRAIN_PG:
 	case TCP_BBR_RWND_IS_APP:
 	case TCP_BBR_PROBE_RTT_INT:
 	case TCP_BBR_PROBE_RTT_GAIN:
 	case TCP_BBR_PROBE_RTT_LEN:
 	case TCP_BBR_STARTUP_LOSS_EXIT:
 	case TCP_BBR_USEDEL_RATE:
 	case TCP_BBR_MIN_RTO:
 	case TCP_BBR_MAX_RTO:
 	case TCP_BBR_PACE_PER_SEC:
 	case TCP_DELACK:
 	case TCP_BBR_PACE_DEL_TAR:
 	case TCP_BBR_SEND_IWND_IN_TSO:
 	case TCP_BBR_EXTRA_STATE:
 	case TCP_BBR_UTTER_MAX_TSO:
 	case TCP_BBR_MIN_TOPACEOUT:
 	case TCP_BBR_FLOOR_MIN_TSO:
 	case TCP_BBR_TSTMP_RAISES:
 	case TCP_BBR_POLICER_DETECT:
 	case TCP_BBR_USE_RACK_CHEAT:
 	case TCP_DATA_AFTER_CLOSE:
 	case TCP_BBR_HDWR_PACE:
 	case TCP_BBR_PACE_SEG_MAX:
 	case TCP_BBR_PACE_SEG_MIN:
 	case TCP_BBR_PACE_CROSS:
 	case TCP_BBR_PACE_OH:
 	case TCP_BBR_TMR_PACE_OH:
 	case TCP_BBR_RACK_RTT_USE:
 	case TCP_BBR_RETRAN_WTSO:
 		break;
 	default:
 		return (tcp_default_ctloutput(tp, sopt));
 	}
 	/* The copyin may fault/sleep, so it is done without the inpcb lock. */
 	INP_WUNLOCK(inp);
 	error = sooptcopyin(sopt, &optval, sizeof(optval), sizeof(optval));
 	if (error)
 		return (error);
 	INP_WLOCK(inp);
 	/* Revalidate: the connection may have changed while unlocked. */
 	if (inp->inp_flags & INP_DROPPED) {
 		INP_WUNLOCK(inp);
 		return (ECONNRESET);
 	}
 	if (tp->t_fb != &__tcp_bbr) {
 		INP_WUNLOCK(inp);
 		return (ENOPROTOOPT);
 	}
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	switch (sopt->sopt_name) {
 	case TCP_BBR_PACE_PER_SEC:
 		BBR_OPTS_INC(tcp_bbr_pace_per_sec);
 		bbr->r_ctl.bbr_hptsi_per_second = optval;
 		break;
 	case TCP_BBR_PACE_DEL_TAR:
 		BBR_OPTS_INC(tcp_bbr_pace_del_tar);
 		bbr->r_ctl.bbr_hptsi_segments_delay_tar = optval;
 		break;
 	case TCP_BBR_PACE_SEG_MAX:
 		BBR_OPTS_INC(tcp_bbr_pace_seg_max);
 		bbr->r_ctl.bbr_hptsi_segments_max = optval;
 		break;
 	case TCP_BBR_PACE_SEG_MIN:
 		BBR_OPTS_INC(tcp_bbr_pace_seg_min);
 		bbr->r_ctl.bbr_hptsi_bytes_min = optval;
 		break;
 	case TCP_BBR_PACE_CROSS:
 		BBR_OPTS_INC(tcp_bbr_pace_cross);
 		bbr->r_ctl.bbr_cross_over = optval;
 		break;
 	case TCP_BBR_ALGORITHM:
 		BBR_OPTS_INC(tcp_bbr_algorithm);
 		if (optval && (bbr->rc_use_google == 0)) {
 			/* Turn on the google mode */
 			bbr_google_mode_on(bbr);
 			if ((optval > 3) && (optval < 500)) {
 				/*
 				 * Must be at least greater than .3%
 				 * and must be less than 50.0%.
 				 */
 				bbr->r_ctl.bbr_google_discount = optval;
 			}
 		} else if ((optval == 0) && (bbr->rc_use_google == 1)) {
 			/* Turn off the google mode */
 			bbr_google_mode_off(bbr);
 		}
 		break;
 	case TCP_BBR_TSLIMITS:
 		BBR_OPTS_INC(tcp_bbr_tslimits);
 		if (optval == 1)
 			bbr->rc_use_ts_limit = 1;
 		else if (optval == 0)
 			bbr->rc_use_ts_limit = 0;
 		else
 			error = EINVAL;
 		break;
 
 	case TCP_BBR_IWINTSO:
 		BBR_OPTS_INC(tcp_bbr_iwintso);
 		if ((optval >= 0) && (optval < 128)) {
 			uint32_t twin;
 
 			bbr->rc_init_win = optval;
 			twin = bbr_initial_cwnd(bbr, tp);
 			/* Only ever grow cwnd, and only before the initial window is passed. */
 			if ((bbr->rc_past_init_win == 0) && (twin > tp->snd_cwnd))
 				tp->snd_cwnd = twin;
 			else
 				error = EBUSY;
 		} else
 			error = EINVAL;
 		break;
 	case TCP_BBR_STARTUP_PG:
 		BBR_OPTS_INC(tcp_bbr_startup_pg);
 		if ((optval > 0) && (optval < BBR_MAX_GAIN_VALUE)) {
 			bbr->r_ctl.rc_startup_pg = optval;
 			if (bbr->rc_bbr_state == BBR_STATE_STARTUP) {
 				bbr->r_ctl.rc_bbr_hptsi_gain = optval;
 			}
 		} else
 			error = EINVAL;
 		break;
 	case TCP_BBR_DRAIN_PG:
 		BBR_OPTS_INC(tcp_bbr_drain_pg);
 		if ((optval > 0) && (optval < BBR_MAX_GAIN_VALUE))
 			bbr->r_ctl.rc_drain_pg = optval;
 		else
 			error = EINVAL;
 		break;
 	case TCP_BBR_PROBE_RTT_LEN:
 		BBR_OPTS_INC(tcp_bbr_probertt_len);
 		/*
 		 * Reject negatives: they would otherwise pass the <= 1 test
 		 * and overflow the multiplication below.
 		 */
 		if ((optval >= 0) && (optval <= 1))
 			reset_time_small(&bbr->r_ctl.rc_rttprop, (optval * USECS_IN_SECOND));
 		else
 			error = EINVAL;
 		break;
 	case TCP_BBR_PROBE_RTT_GAIN:
 		BBR_OPTS_INC(tcp_bbr_probertt_gain);
 		/* A negative gain is never valid. */
 		if ((optval >= 0) && (optval <= BBR_UNIT))
 			bbr->r_ctl.bbr_rttprobe_gain_val = optval;
 		else
 			error = EINVAL;
 		break;
 	case TCP_BBR_PROBE_RTT_INT:
 		BBR_OPTS_INC(tcp_bbr_probe_rtt_int);
 		if (optval > 1000)
 			bbr->r_ctl.rc_probertt_int = optval;
 		else
 			error = EINVAL;
 		break;
 	case TCP_BBR_MIN_TOPACEOUT:
 		BBR_OPTS_INC(tcp_bbr_topaceout);
 		if (optval == 0) {
 			bbr->no_pacing_until = 0;
 			bbr->rc_no_pacing = 0;
 		} else if ((optval > 0) && (optval <= 0x00ff)) {
 			bbr->no_pacing_until = optval;
 			if ((bbr->r_ctl.rc_pkt_epoch < bbr->no_pacing_until) &&
 			    (bbr->rc_bbr_state == BBR_STATE_STARTUP)){
 				/* Turn on no pacing */
 				bbr->rc_no_pacing = 1;
 			}
 		} else
 			error = EINVAL;
 		break;
 	case TCP_BBR_STARTUP_LOSS_EXIT:
 		BBR_OPTS_INC(tcp_bbr_startup_loss_exit);
 		bbr->rc_loss_exit = optval;
 		break;
 	case TCP_BBR_USEDEL_RATE:
 		/* Recognized but not settable. */
 		error = EINVAL;
 		break;
 	case TCP_BBR_MIN_RTO:
 		BBR_OPTS_INC(tcp_bbr_min_rto);
 		bbr->r_ctl.rc_min_rto_ms = optval;
 		break;
 	case TCP_BBR_MAX_RTO:
 		BBR_OPTS_INC(tcp_bbr_max_rto);
 		bbr->rc_max_rto_sec = optval;
 		break;
 	case TCP_RACK_MIN_TO:
 		/* Minimum time between rack t-o's in ms */
 		BBR_OPTS_INC(tcp_rack_min_to);
 		bbr->r_ctl.rc_min_to = optval;
 		break;
 	case TCP_RACK_REORD_THRESH:
 		/* RACK reorder threshold (shift amount) */
 		BBR_OPTS_INC(tcp_rack_reord_thresh);
 		if ((optval > 0) && (optval < 31))
 			bbr->r_ctl.rc_reorder_shift = optval;
 		else
 			error = EINVAL;
 		break;
 	case TCP_RACK_REORD_FADE:
 		/* Does reordering fade after ms time */
 		BBR_OPTS_INC(tcp_rack_reord_fade);
 		bbr->r_ctl.rc_reorder_fade = optval;
 		break;
 	case TCP_RACK_TLP_THRESH:
 		/* RACK TLP threshold i.e. srtt+(srtt/N) */
 		BBR_OPTS_INC(tcp_rack_tlp_thresh);
 		if (optval)
 			bbr->rc_tlp_threshold = optval;
 		else
 			error = EINVAL;
 		break;
 	case TCP_BBR_USE_RACK_CHEAT:
 		BBR_OPTS_INC(tcp_use_rackcheat);
 		if (bbr->rc_use_google) {
 			error = EINVAL;
 			break;
 		}
 		BBR_OPTS_INC(tcp_rack_cheat);
 		if (optval)
 			bbr->bbr_use_rack_cheat = 1;
 		else
 			bbr->bbr_use_rack_cheat = 0;
 		break;
 	case TCP_BBR_FLOOR_MIN_TSO:
 		/* NOTE(review): shares the tcp_utter_max_tso counter with the case below -- confirm intended. */
 		BBR_OPTS_INC(tcp_utter_max_tso);
 		if ((optval >= 0) && (optval < 40))
 			bbr->r_ctl.bbr_hptsi_segments_floor = optval;
 		else
 			error = EINVAL;
 		break;
 	case TCP_BBR_UTTER_MAX_TSO:
 		BBR_OPTS_INC(tcp_utter_max_tso);
 		if ((optval >= 0) && (optval < 0xffff))
 			bbr->r_ctl.bbr_utter_max = optval;
 		else
 			error = EINVAL;
 		break;
 
 	case TCP_BBR_EXTRA_STATE:
 		BBR_OPTS_INC(tcp_extra_state);
 		if (optval)
 			bbr->rc_use_idle_restart = 1;
 		else
 			bbr->rc_use_idle_restart = 0;
 		break;
 	case TCP_BBR_SEND_IWND_IN_TSO:
 		BBR_OPTS_INC(tcp_iwnd_tso);
 		if (optval) {
 			bbr->bbr_init_win_cheat = 1;
 			if (bbr->rc_past_init_win == 0) {
 				uint32_t cts;
 				cts = tcp_get_usecs(&bbr->rc_tv);
 				tcp_bbr_tso_size_check(bbr, cts);
 			}
 		} else
 			bbr->bbr_init_win_cheat = 0;
 		break;
 	case TCP_BBR_HDWR_PACE:
 		BBR_OPTS_INC(tcp_hdwr_pacing);
 		if (optval){
 			bbr->bbr_hdw_pace_ena = 1;
 			bbr->bbr_attempt_hdwr_pace = 0;
 		} else {
 			bbr->bbr_hdw_pace_ena = 0;
 #ifdef RATELIMIT
 			/* Give back any pacing rate still held. */
 			if (bbr->r_ctl.crte != NULL) {
 				tcp_rel_pacing_rate(bbr->r_ctl.crte, tp);
 				bbr->r_ctl.crte = NULL;
 			}
 #endif
 		}
 		break;
 
 	case TCP_DELACK:
 		BBR_OPTS_INC(tcp_delack);
 		/* Valid range is 0..99; negatives must not slip past the upper bound. */
 		if ((optval >= 0) && (optval < 100)) {
 			if (optval == 0) /* off */
 				tp->t_delayed_ack = 0;
 			else if (optval == 1) /* on which is 2 */
 				tp->t_delayed_ack = 2;
 			else /* higher than 2 and less than 100 */
 				tp->t_delayed_ack = optval;
 			if (tp->t_flags & TF_DELACK) {
 				/* A delayed ack is pending: send it now. */
 				tp->t_flags &= ~TF_DELACK;
 				tp->t_flags |= TF_ACKNOW;
 				NET_EPOCH_ENTER(et);
 				/*
 				 * NOTE(review): the return value is ignored
 				 * here although the stack advertises
 				 * TCP_FUNC_OUTPUT_CANDROP -- confirm tp is
 				 * still valid afterwards.
 				 */
 				bbr_output(tp);
 				NET_EPOCH_EXIT(et);
 			}
 		} else
 			error = EINVAL;
 		break;
 	case TCP_RACK_PKT_DELAY:
 		/* RACK added ms i.e. rack-rtt + reord + N */
 		BBR_OPTS_INC(tcp_rack_pkt_delay);
 		bbr->r_ctl.rc_pkt_delay = optval;
 		break;
 
 	case TCP_BBR_RETRAN_WTSO:
 		BBR_OPTS_INC(tcp_retran_wtso);
 		if (optval)
 			bbr->rc_resends_use_tso = 1;
 		else
 			bbr->rc_resends_use_tso = 0;
 		break;
 	case TCP_DATA_AFTER_CLOSE:
 		BBR_OPTS_INC(tcp_data_ac);
 		if (optval)
 			bbr->rc_allow_data_af_clo = 1;
 		else
 			bbr->rc_allow_data_af_clo = 0;
 		break;
 	case TCP_BBR_POLICER_DETECT:
 		BBR_OPTS_INC(tcp_policer_det);
 		if (bbr->rc_use_google == 0)
 			error = EINVAL;
 		else if (optval)
 			bbr->r_use_policer = 1;
 		else
 			bbr->r_use_policer = 0;
 		break;
 
 	case TCP_BBR_TSTMP_RAISES:
 		BBR_OPTS_INC(tcp_ts_raises);
 		if (optval)
 			bbr->ts_can_raise = 1;
 		else
 			bbr->ts_can_raise = 0;
 		break;
 	case TCP_BBR_TMR_PACE_OH:
 		BBR_OPTS_INC(tcp_pacing_oh_tmr);
 		if (bbr->rc_use_google) {
 			error = EINVAL;
 		} else {
 			if (optval)
 				bbr->r_ctl.rc_incr_tmrs = 1;
 			else
 				bbr->r_ctl.rc_incr_tmrs = 0;
 		}
 		break;
 	case TCP_BBR_PACE_OH:
 		BBR_OPTS_INC(tcp_pacing_oh);
 		if (bbr->rc_use_google) {
 			error = EINVAL;
 		} else {
 			/* optval is a mask of the three overhead flags; nothing else is valid. */
 			if ((optval < 0) ||
 			    (optval > (BBR_INCL_TCP_OH|
 				       BBR_INCL_IP_OH|
 				       BBR_INCL_ENET_OH))) {
 				error = EINVAL;
 				break;
 			}
 			if (optval & BBR_INCL_TCP_OH)
 				bbr->r_ctl.rc_inc_tcp_oh = 1;
 			else
 				bbr->r_ctl.rc_inc_tcp_oh = 0;
 			if (optval & BBR_INCL_IP_OH)
 				bbr->r_ctl.rc_inc_ip_oh = 1;
 			else
 				bbr->r_ctl.rc_inc_ip_oh = 0;
 			if (optval & BBR_INCL_ENET_OH)
 				bbr->r_ctl.rc_inc_enet_oh = 1;
 			else
 				bbr->r_ctl.rc_inc_enet_oh = 0;
 		}
 		break;
 	default:
 		/* Accepted by the first switch but has no handler here: use the default path. */
 		return (tcp_default_ctloutput(tp, sopt));
 	}
 	tcp_log_socket_option(tp, sopt->sopt_name, optval, error);
 	INP_WUNLOCK(inp);
 	return (error);
 }
 
 /*
  * return 0 on success, error-num on failure
  */
 static int
 bbr_get_sockopt(struct tcpcb *tp, struct sockopt *sopt)
 {
 	struct inpcb *inp = tptoinpcb(tp);
 	struct tcp_bbr *bbr;
 	int32_t error, optval;
 
 	bbr = (struct tcp_bbr *)tp->t_fb_ptr;
 	if (bbr == NULL) {
 		INP_WUNLOCK(inp);
 		return (EINVAL);
 	}
 	/*
 	 * Because all our options are either boolean or an int, we can just
 	 * pull everything into optval and then unlock and copy. If we ever
 	 * add a option that is not a int, then this will have quite an
 	 * impact to this routine.
 	 */
 	switch (sopt->sopt_name) {
 	case TCP_BBR_PACE_PER_SEC:
 		optval = bbr->r_ctl.bbr_hptsi_per_second;
 		break;
 	case TCP_BBR_PACE_DEL_TAR:
 		optval = bbr->r_ctl.bbr_hptsi_segments_delay_tar;
 		break;
 	case TCP_BBR_PACE_SEG_MAX:
 		optval = bbr->r_ctl.bbr_hptsi_segments_max;
 		break;
 	case TCP_BBR_MIN_TOPACEOUT:
 		optval = bbr->no_pacing_until;
 		break;
 	case TCP_BBR_PACE_SEG_MIN:
 		optval = bbr->r_ctl.bbr_hptsi_bytes_min;
 		break;
 	case TCP_BBR_PACE_CROSS:
 		optval = bbr->r_ctl.bbr_cross_over;
 		break;
 	case TCP_BBR_ALGORITHM:
 		optval = bbr->rc_use_google;
 		break;
 	case TCP_BBR_TSLIMITS:
 		optval = bbr->rc_use_ts_limit;
 		break;
 	case TCP_BBR_IWINTSO:
 		optval = bbr->rc_init_win;
 		break;
 	case TCP_BBR_STARTUP_PG:
 		optval = bbr->r_ctl.rc_startup_pg;
 		break;
 	case TCP_BBR_DRAIN_PG:
 		optval = bbr->r_ctl.rc_drain_pg;
 		break;
 	case TCP_BBR_PROBE_RTT_INT:
 		optval = bbr->r_ctl.rc_probertt_int;
 		break;
 	case TCP_BBR_PROBE_RTT_LEN:
 		optval = (bbr->r_ctl.rc_rttprop.cur_time_limit / USECS_IN_SECOND);
 		break;
 	case TCP_BBR_PROBE_RTT_GAIN:
 		optval = bbr->r_ctl.bbr_rttprobe_gain_val;
 		break;
 	case TCP_BBR_STARTUP_LOSS_EXIT:
 		optval = bbr->rc_loss_exit;
 		break;
 	case TCP_BBR_USEDEL_RATE:
 		error = EINVAL;
 		break;
 	case TCP_BBR_MIN_RTO:
 		optval = bbr->r_ctl.rc_min_rto_ms;
 		break;
 	case TCP_BBR_MAX_RTO:
 		optval = bbr->rc_max_rto_sec;
 		break;
 	case TCP_RACK_PACE_MAX_SEG:
 		/* Max segments in a pace */
 		optval = bbr->r_ctl.rc_pace_max_segs;
 		break;
 	case TCP_RACK_MIN_TO:
 		/* Minimum time between rack t-o's in ms */
 		optval = bbr->r_ctl.rc_min_to;
 		break;
 	case TCP_RACK_REORD_THRESH:
 		/* RACK reorder threshold (shift amount) */
 		optval = bbr->r_ctl.rc_reorder_shift;
 		break;
 	case TCP_RACK_REORD_FADE:
 		/* Does reordering fade after ms time */
 		optval = bbr->r_ctl.rc_reorder_fade;
 		break;
 	case TCP_BBR_USE_RACK_CHEAT:
 		/* Do we use the rack cheat for rxt */
 		optval = bbr->bbr_use_rack_cheat;
 		break;
 	case TCP_BBR_FLOOR_MIN_TSO:
 		optval = bbr->r_ctl.bbr_hptsi_segments_floor;
 		break;
 	case TCP_BBR_UTTER_MAX_TSO:
 		optval = bbr->r_ctl.bbr_utter_max;
 		break;
 	case TCP_BBR_SEND_IWND_IN_TSO:
 		/* Do we send TSO size segments initially */
 		optval = bbr->bbr_init_win_cheat;
 		break;
 	case TCP_BBR_EXTRA_STATE:
 		optval = bbr->rc_use_idle_restart;
 		break;
 	case TCP_RACK_TLP_THRESH:
 		/* RACK TLP theshold i.e. srtt+(srtt/N) */
 		optval = bbr->rc_tlp_threshold;
 		break;
 	case TCP_RACK_PKT_DELAY:
 		/* RACK added ms i.e. rack-rtt + reord + N */
 		optval = bbr->r_ctl.rc_pkt_delay;
 		break;
 	case TCP_BBR_RETRAN_WTSO:
 		optval = bbr->rc_resends_use_tso;
 		break;
 	case TCP_DATA_AFTER_CLOSE:
 		optval = bbr->rc_allow_data_af_clo;
 		break;
 	case TCP_DELACK:
 		optval = tp->t_delayed_ack;
 		break;
 	case TCP_BBR_HDWR_PACE:
 		optval = bbr->bbr_hdw_pace_ena;
 		break;
 	case TCP_BBR_POLICER_DETECT:
 		optval = bbr->r_use_policer;
 		break;
 	case TCP_BBR_TSTMP_RAISES:
 		optval = bbr->ts_can_raise;
 		break;
 	case TCP_BBR_TMR_PACE_OH:
 		optval = bbr->r_ctl.rc_incr_tmrs;
 		break;
 	case TCP_BBR_PACE_OH:
 		optval = 0;
 		if (bbr->r_ctl.rc_inc_tcp_oh)
 			optval |= BBR_INCL_TCP_OH;
 		if (bbr->r_ctl.rc_inc_ip_oh)
 			optval |= BBR_INCL_IP_OH;
 		if (bbr->r_ctl.rc_inc_enet_oh)
 			optval |= BBR_INCL_ENET_OH;
 		break;
 	default:
 		return (tcp_default_ctloutput(tp, sopt));
 		break;
 	}
 	INP_WUNLOCK(inp);
 	error = sooptcopyout(sopt, &optval, sizeof optval);
 	return (error);
 }
 
 /*
  * Socket-option entry point for the stack: route the request by direction
  * to the set or get handler.  Any other direction is a programming error
  * and panics.
  *
  * Returns 0 on success, an errno value on failure.
  */
 static int
 bbr_ctloutput(struct tcpcb *tp, struct sockopt *sopt)
 {
 	switch (sopt->sopt_dir) {
 	case SOPT_SET:
 		return (bbr_set_sockopt(tp, sopt));
 	case SOPT_GET:
 		return (bbr_get_sockopt(tp, sopt));
 	default:
 		panic("%s: sopt_dir $%d", __func__, sopt->sopt_dir);
 	}
 }
 
 /*
  * Names under which the stack is registered: always STACKNAME, plus
  * STACKALIAS when the build defines one.
  */
 static const char *bbr_stack_names[] = {
 	__XSTRING(STACKNAME),
 #ifdef STACKALIAS
 	__XSTRING(STACKALIAS),
 #endif
 };
 
 /* Set once MOD_LOAD has fully succeeded; gates the teardown in MOD_UNLOAD. */
 static bool bbr_mod_inited = false;
 
 /*
  * Module event handler.
  *
  * MOD_LOAD:    create the UMA zones and the sysctl tree, then register the
  *              stack under its name(s); on any failure undo what was set up
  *              and return the error.
  * MOD_QUIESCE: ask the framework whether the stack can be deregistered.
  * MOD_UNLOAD:  deregister (EBUSY is passed back untouched) and, if the load
  *              had completed, release zones, sysctls and counters.
  * Any other event yields EOPNOTSUPP.
  */
 static int
 tcp_addbbr(module_t mod, int32_t type, void *data)
 {
 	int32_t err = 0;
 	int num_stacks;
 
 	switch (type) {
 	case MOD_LOAD:
 		/* Handled below the switch. */
 		break;
 	case MOD_QUIESCE:
 		return (deregister_tcp_functions(&__tcp_bbr, true, false));
 	case MOD_UNLOAD:
 		if (deregister_tcp_functions(&__tcp_bbr, false, true) == EBUSY)
 			return (EBUSY);
 		if (bbr_mod_inited) {
 			uma_zdestroy(bbr_zone);
 			uma_zdestroy(bbr_pcb_zone);
 			sysctl_ctx_free(&bbr_sysctl_ctx);
 			bbr_counter_destroy();
 			printf(__XSTRING(MODNAME)
 			    " is now no longer available\n");
 			bbr_mod_inited = false;
 		}
 		tcp_lro_dereg_mbufq();
 		/* Any deregistration result other than EBUSY counts as success. */
 		return (0);
 	default:
 		return (EOPNOTSUPP);
 	}
 
 	/* MOD_LOAD from here on. */
 	printf("Attempting to load " __XSTRING(MODNAME) "\n");
 	bbr_zone = uma_zcreate(__XSTRING(MODNAME) "_map",
 	    sizeof(struct bbr_sendmap),
 	    NULL, NULL, NULL, NULL, UMA_ALIGN_PTR, 0);
 	bbr_pcb_zone = uma_zcreate(__XSTRING(MODNAME) "_pcb",
 	    sizeof(struct tcp_bbr),
 	    NULL, NULL, NULL, NULL, UMA_ALIGN_CACHE, 0);
 
 	/* The sysctl node is named after the alias when one is configured. */
 	sysctl_ctx_init(&bbr_sysctl_ctx);
 	bbr_sysctl_root = SYSCTL_ADD_NODE(&bbr_sysctl_ctx,
 	    SYSCTL_STATIC_CHILDREN(_net_inet_tcp),
 	    OID_AUTO,
 #ifdef STACKALIAS
 	    __XSTRING(STACKALIAS),
 #else
 	    __XSTRING(STACKNAME),
 #endif
 	    CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
 	    "");
 	if (bbr_sysctl_root == NULL) {
 		printf("Failed to add sysctl node\n");
 		err = EFAULT;
 		goto free_uma;
 	}
 	bbr_init_sysctls();
 
 	num_stacks = nitems(bbr_stack_names);
 	err = register_tcp_functions_as_names(&__tcp_bbr, M_WAITOK,
 	    bbr_stack_names, &num_stacks);
 	if (err != 0) {
 		printf("Failed to register %s stack name for "
 		    "%s module\n", bbr_stack_names[num_stacks],
 		    __XSTRING(MODNAME));
 		sysctl_ctx_free(&bbr_sysctl_ctx);
 		goto free_uma;
 	}
 
 	tcp_lro_reg_mbufq();
 	bbr_mod_inited = true;
 	printf(__XSTRING(MODNAME) " is now available\n");
 	return (err);
 
 free_uma:
 	/* Shared failure tail for the load path. */
 	uma_zdestroy(bbr_zone);
 	uma_zdestroy(bbr_pcb_zone);
 	bbr_counter_destroy();
 	printf("Failed to register " __XSTRING(MODNAME)
 	    " module err:%d\n", err);
 	return (err);
 }
 
 /* Module descriptor: events go to tcp_addbbr(); no private data is attached. */
 static moduledata_t tcp_bbr = {
 	.name = __XSTRING(MODNAME),
 	.evhand = tcp_addbbr,
 	.priv = 0,
 };
 
 /*
  * Module glue: publish version 1 of the module, hook the tcp_bbr descriptor
  * in at SI_SUB_PROTO_DOMAIN / SI_ORDER_ANY, and declare the dependency on
  * the tcphpts module (minimum, preferred and maximum version all 1).
  */
 MODULE_VERSION(MODNAME, 1);
 DECLARE_MODULE(MODNAME, tcp_bbr, SI_SUB_PROTO_DOMAIN, SI_ORDER_ANY);
 MODULE_DEPEND(MODNAME, tcphpts, 1, 1, 1);