diff --git a/sbin/dump/tape.c b/sbin/dump/tape.c
index 45ad0ee50487..c123f7fa9404 100644
--- a/sbin/dump/tape.c
+++ b/sbin/dump/tape.c
@@ -1,887 +1,901 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 1980, 1991, 1993
  *	The Regents of the University of California.  All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #ifndef lint
 #if 0
 static char sccsid[] = "@(#)tape.c	8.4 (Berkeley) 5/1/95";
 #endif
 static const char rcsid[] =
   "$FreeBSD$";
 #endif /* not lint */
 
 #include <sys/param.h>
 #include <sys/socket.h>
 #include <sys/wait.h>
 #include <sys/stat.h>
 
 #include <ufs/ufs/dinode.h>
 #include <ufs/ffs/fs.h>
 
 #include <protocols/dumprestore.h>
 
 #include <assert.h>
 #include <errno.h>
 #include <fcntl.h>
 #include <limits.h>
 #include <setjmp.h>
 #include <signal.h>
 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 #include <time.h>
 #include <unistd.h>
 
 #include "dump.h"
 
 ino_t	curino;			/* current inumber; used globally */
 int	newtape;		/* new tape flag */
 union	u_spcl u_spcl;		/* mapping of variables in a control block */
 
 static	int tapefd;		/* tape file descriptor */
 static	long asize;		/* number of 0.1" units written on cur tape */
 static	int writesize;		/* size of malloc()ed buffer for tape */
 static	int64_t lastspclrec = -1; /* tape block number of last written header */
 static	int trecno = 0;		/* next record to write in current block */
 static	long blocksthisvol;	/* number of blocks on current output file */
 static	char *nexttape;
 static	FILE *popenfp = NULL;
 
-static	int atomic(ssize_t (*)(), int, char *, int);
+static	int atomic_read(int, void *, int);
+static	int atomic_write(int, const void *, int);
 static	void worker(int, int);
 static	void create_workers(void);
 static	void flushtape(void);
 static	void killall(void);
 static	void rollforward(void);
 
 /*
  * Concurrent dump mods (Caltech) - disk block reading and tape writing
  * are exported to several worker processes.  While one worker writes the
  * tape, the others read disk blocks; they pass control of the tape in
  * a ring via signals. The parent process traverses the file system and
  * sends writeheader()'s and lists of daddr's to the workers via pipes.
  * The following structure defines the instruction packets sent to workers.
  */
 struct req {
 	ufs2_daddr_t dblk;
 	int count;
 };
 static int reqsiz;
 
 #define WORKERS 3		/* 1 worker writing, 1 reading, 1 for slack */
 static struct worker {
 	int64_t tapea;		/* header number at start of this chunk */
 	int64_t firstrec;	/* record number of this block */
 	int count;		/* count to next header (used for TS_TAPE */
 				/* after EOT) */
 	int inode;		/* inode that we are currently dealing with */
 	int fd;			/* FD for this worker */
 	int pid;		/* PID for this worker */
 	int sent;		/* 1 == we've sent this worker requests */
 	char (*tblock)[TP_BSIZE]; /* buffer for data blocks */
 	struct req *req;	/* buffer for requests */
 } workers[WORKERS+1];
 static struct worker *wp;
 
 static char	(*nextblock)[TP_BSIZE];
 
 static int master;	/* pid of master, for sending error signals */
 static int tenths;	/* length of tape used per block written */
 static volatile sig_atomic_t caught; /* have we caught the signal to proceed? */
 static volatile sig_atomic_t ready; /* reached the lock point without having */
 			/* received the SIGUSR2 signal from the prev worker? */
 static jmp_buf jmpbuf;	/* where to jump to if we are ready when the */
 			/* SIGUSR2 arrives from the previous worker */
 
 int
 alloctape(void)
 {
 	int pgoff = getpagesize() - 1;
 	char *buf;
 	int i;
 
 	writesize = ntrec * TP_BSIZE;
 	reqsiz = (ntrec + 1) * sizeof(struct req);
 	/*
 	 * CDC 92181's and 92185's make 0.8" gaps in 1600-bpi start/stop mode
 	 * (see DEC TU80 User's Guide).  The shorter gaps of 6250-bpi require
 	 * repositioning after stopping, i.e, streaming mode, where the gap is
 	 * variable, 0.30" to 0.45".  The gap is maximal when the tape stops.
 	 */
 	if (blocksperfile == 0 && !unlimited)
 		tenths = writesize / density +
 		    (cartridge ? 16 : density == 625 ? 5 : 8);
 	/*
 	 * Allocate tape buffer contiguous with the array of instruction
 	 * packets, so flushtape() can write them together with one write().
 	 * Align tape buffer on page boundary to speed up tape write().
 	 */
 	for (i = 0; i <= WORKERS; i++) {
 		buf = (char *)
 		    malloc((unsigned)(reqsiz + writesize + pgoff + TP_BSIZE));
 		if (buf == NULL)
 			return(0);
 		workers[i].tblock = (char (*)[TP_BSIZE])
 		    (((long)&buf[ntrec + 1] + pgoff) &~ pgoff);
 		workers[i].req = (struct req *)workers[i].tblock - ntrec - 1;
 	}
 	wp = &workers[0];
 	wp->count = 1;
 	wp->tapea = 0;
 	wp->firstrec = 0;
 	nextblock = wp->tblock;
 	return(1);
 }
 
 void
 writerec(char *dp, int isspcl)
 {
 
 	wp->req[trecno].dblk = (ufs2_daddr_t)0;
 	wp->req[trecno].count = 1;
 	/* Can't do a structure assignment due to alignment problems */
 	bcopy(dp, *(nextblock)++, sizeof (union u_spcl));
 	if (isspcl)
 		lastspclrec = spcl.c_tapea;
 	trecno++;
 	spcl.c_tapea++;
 	if (trecno >= ntrec)
 		flushtape();
 }
 
 void
 dumpblock(ufs2_daddr_t blkno, int size)
 {
 	int avail, tpblks;
 	ufs2_daddr_t dblkno;
 
 	dblkno = fsbtodb(sblock, blkno);
 	tpblks = size >> tp_bshift;
 	while ((avail = MIN(tpblks, ntrec - trecno)) > 0) {
 		wp->req[trecno].dblk = dblkno;
 		wp->req[trecno].count = avail;
 		trecno += avail;
 		spcl.c_tapea += avail;
 		if (trecno >= ntrec)
 			flushtape();
 		dblkno += avail << (tp_bshift - dev_bshift);
 		tpblks -= avail;
 	}
 }
 
 int	nogripe = 0;
 
 void
 tperror(int signo __unused)
 {
 
 	if (pipeout) {
 		msg("write error on %s\n", tape);
 		quit("Cannot recover\n");
 		/* NOTREACHED */
 	}
 	msg("write error %ld blocks into volume %d\n", blocksthisvol, tapeno);
 	broadcast("DUMP WRITE ERROR!\n");
 	if (!query("Do you want to restart?"))
 		dumpabort(0);
 	msg("Closing this volume.  Prepare to restart with new media;\n");
 	msg("this dump volume will be rewritten.\n");
 	killall();
 	nogripe = 1;
 	close_rewind();
 	Exit(X_REWRITE);
 }
 
 void
 sigpipe(int signo __unused)
 {
 
 	quit("Broken pipe\n");
 }
 
 static void
 flushtape(void)
 {
 	int i, blks, got;
 	int64_t lastfirstrec;
 
 	int siz = (char *)nextblock - (char *)wp->req;
 
 	wp->req[trecno].count = 0;			/* Sentinel */
 
-	if (atomic(write, wp->fd, (char *)wp->req, siz) != siz)
+	if (atomic_write(wp->fd, (const void *)wp->req, siz) != siz)
 		quit("error writing command pipe: %s\n", strerror(errno));
 	wp->sent = 1; /* we sent a request, read the response later */
 
 	lastfirstrec = wp->firstrec;
 
 	if (++wp >= &workers[WORKERS])
 		wp = &workers[0];
 
 	/* Read results back from next worker */
 	if (wp->sent) {
-		if (atomic(read, wp->fd, (char *)&got, sizeof got)
+		if (atomic_read(wp->fd, (void *)&got, sizeof got)
 		    != sizeof got) {
 			perror("  DUMP: error reading command pipe in master");
 			dumpabort(0);
 		}
 		wp->sent = 0;
 
 		/* Check for end of tape */
 		if (got < writesize) {
 			msg("End of tape detected\n");
 
 			/*
 			 * Drain the results, don't care what the values were.
 			 * If we read them here then trewind won't...
 			 */
 			for (i = 0; i < WORKERS; i++) {
 				if (workers[i].sent) {
-					if (atomic(read, workers[i].fd,
-					    (char *)&got, sizeof got)
+					if (atomic_read(workers[i].fd,
+					    (void *)&got, sizeof got)
 					    != sizeof got) {
 						perror("  DUMP: error reading command pipe in master");
 						dumpabort(0);
 					}
 					workers[i].sent = 0;
 				}
 			}
 
 			close_rewind();
 			rollforward();
 			return;
 		}
 	}
 
 	blks = 0;
 	if (spcl.c_type != TS_END && spcl.c_type != TS_CLRI &&
 	    spcl.c_type != TS_BITS) {
 		assert(spcl.c_count <= TP_NINDIR);
 		for (i = 0; i < spcl.c_count; i++)
 			if (spcl.c_addr[i] != 0)
 				blks++;
 	}
 	wp->count = lastspclrec + blks + 1 - spcl.c_tapea;
 	wp->tapea = spcl.c_tapea;
 	wp->firstrec = lastfirstrec + ntrec;
 	wp->inode = curino;
 	nextblock = wp->tblock;
 	trecno = 0;
 	asize += tenths;
 	blockswritten += ntrec;
 	blocksthisvol += ntrec;
 	if (!pipeout && !unlimited && (blocksperfile ?
 	    (blocksthisvol >= blocksperfile) : (asize > tsize))) {
 		close_rewind();
 		startnewtape(0);
 	}
 	timeest();
 }
 
 void
 trewind(void)
 {
 	struct stat sb;
 	int f;
 	int got;
 
 	for (f = 0; f < WORKERS; f++) {
 		/*
 		 * Drain the results, but unlike EOT we DO (or should) care
 		 * what the return values were, since if we detect EOT after
 		 * we think we've written the last blocks to the tape anyway,
 		 * we have to replay those blocks with rollforward.
 		 *
 		 * fixme: punt for now.
 		 */
 		if (workers[f].sent) {
-			if (atomic(read, workers[f].fd, (char *)&got, sizeof got)
+			if (atomic_read(workers[f].fd, (void *)&got, sizeof got)
 			    != sizeof got) {
 				perror("  DUMP: error reading command pipe in master");
 				dumpabort(0);
 			}
 			workers[f].sent = 0;
 			if (got != writesize) {
 				msg("EOT detected in last 2 tape records!\n");
 				msg("Use a longer tape, decrease the size estimate\n");
 				quit("or use no size estimate at all.\n");
 			}
 		}
 		(void) close(workers[f].fd);
 	}
 	while (wait((int *)NULL) >= 0)	/* wait for any signals from workers */
 		/* void */;
 
 	if (pipeout)
 		return;
 
 	msg("Closing %s\n", tape);
 
 	if (popenout) {
 		tapefd = -1;
 		(void)pclose(popenfp);
 		popenfp = NULL;
 		return;
 	}
 #ifdef RDUMP
 	if (host) {
 		rmtclose();
 		while (rmtopen(tape, 0) < 0)
 			sleep(10);
 		rmtclose();
 		return;
 	}
 #endif
 	if (fstat(tapefd, &sb) == 0 && S_ISFIFO(sb.st_mode)) {
 		(void)close(tapefd);
 		return;
 	}
 	(void) close(tapefd);
 	while ((f = open(tape, 0)) < 0)
 		sleep (10);
 	(void) close(f);
 }
 
 void
 close_rewind()
 {
 	time_t tstart_changevol, tend_changevol;
 
 	trewind();
 	if (nexttape)
 		return;
 	(void)time((time_t *)&(tstart_changevol));
 	if (!nogripe) {
 		msg("Change Volumes: Mount volume #%d\n", tapeno+1);
 		broadcast("CHANGE DUMP VOLUMES!\a\a\n");
 	}
 	while (!query("Is the new volume mounted and ready to go?"))
 		if (query("Do you want to abort?")) {
 			dumpabort(0);
 			/*NOTREACHED*/
 		}
 	(void)time((time_t *)&(tend_changevol));
 	if ((tstart_changevol != (time_t)-1) && (tend_changevol != (time_t)-1))
 		tstart_writing += (tend_changevol - tstart_changevol);
 }
 
 void
 rollforward(void)
 {
 	struct req *p, *q, *prev;
 	struct worker *twp;
 	int i, size, got;
 	int64_t savedtapea;
 	union u_spcl *ntb, *otb;
 	twp = &workers[WORKERS];
 	ntb = (union u_spcl *)twp->tblock[1];
 
 	/*
 	 * Each of the N workers should have requests that need to
 	 * be replayed on the next tape.  Use the extra worker buffers
 	 * (workers[WORKERS]) to construct request lists to be sent to
 	 * each worker in turn.
 	 */
 	for (i = 0; i < WORKERS; i++) {
 		q = &twp->req[1];
 		otb = (union u_spcl *)wp->tblock;
 
 		/*
 		 * For each request in the current worker, copy it to twp.
 		 */
 
 		prev = NULL;
 		for (p = wp->req; p->count > 0; p += p->count) {
 			*q = *p;
 			if (p->dblk == 0)
 				*ntb++ = *otb++; /* copy the datablock also */
 			prev = q;
 			q += q->count;
 		}
 		if (prev == NULL)
 			quit("rollforward: protocol botch");
 		if (prev->dblk != 0)
 			prev->count -= 1;
 		else
 			ntb--;
 		q -= 1;
 		q->count = 0;
 		q = &twp->req[0];
 		if (i == 0) {
 			q->dblk = 0;
 			q->count = 1;
 			trecno = 0;
 			nextblock = twp->tblock;
 			savedtapea = spcl.c_tapea;
 			spcl.c_tapea = wp->tapea;
 			startnewtape(0);
 			spcl.c_tapea = savedtapea;
 			lastspclrec = savedtapea - 1;
 		}
 		size = (char *)ntb - (char *)q;
-		if (atomic(write, wp->fd, (char *)q, size) != size) {
+		if (atomic_write(wp->fd, (const void *)q, size) != size) {
 			perror("  DUMP: error writing command pipe");
 			dumpabort(0);
 		}
 		wp->sent = 1;
 		if (++wp >= &workers[WORKERS])
 			wp = &workers[0];
 
 		q->count = 1;
 
 		if (prev->dblk != 0) {
 			/*
 			 * If the last one was a disk block, make the
 			 * first of this one be the last bit of that disk
 			 * block...
 			 */
 			q->dblk = prev->dblk +
 				prev->count * (TP_BSIZE / DEV_BSIZE);
 			ntb = (union u_spcl *)twp->tblock;
 		} else {
 			/*
 			 * It wasn't a disk block.  Copy the data to its
 			 * new location in the buffer.
 			 */
 			q->dblk = 0;
 			*((union u_spcl *)twp->tblock) = *ntb;
 			ntb = (union u_spcl *)twp->tblock[1];
 		}
 	}
 	wp->req[0] = *q;
 	nextblock = wp->tblock;
 	if (q->dblk == 0)
 		nextblock++;
 	trecno = 1;
 
 	/*
 	 * Clear the first workers' response.  One hopes that it
 	 * worked ok, otherwise the tape is much too short!
 	 */
 	if (wp->sent) {
-		if (atomic(read, wp->fd, (char *)&got, sizeof got)
+		if (atomic_read(wp->fd, (void *)&got, sizeof got)
 		    != sizeof got) {
 			perror("  DUMP: error reading command pipe in master");
 			dumpabort(0);
 		}
 		wp->sent = 0;
 
 		if (got != writesize) {
 			quit("EOT detected at start of the tape!\n");
 		}
 	}
 }
 
 /*
  * We implement taking and restoring checkpoints on the tape level.
  * When each tape is opened, a new process is created by forking; this
  * saves all of the necessary context in the parent.  The child
  * continues the dump; the parent waits around, saving the context.
  * If the child returns X_REWRITE, then it had problems writing that tape;
  * this causes the parent to fork again, duplicating the context, and
  * everything continues as if nothing had happened.
  */
 void
 startnewtape(int top)
 {
 	int	parentpid;
 	int	childpid;
 	int	status;
 	char	*p;
 	sig_t	interrupt_save;
 
 	interrupt_save = signal(SIGINT, SIG_IGN);
 	parentpid = getpid();
 
 restore_check_point:
 	(void)signal(SIGINT, interrupt_save);
 	/*
 	 *	All signals are inherited...
 	 */
 	setproctitle(NULL);	/* Restore the proctitle. */
 	childpid = fork();
 	if (childpid < 0) {
 		msg("Context save fork fails in parent %d\n", parentpid);
 		Exit(X_ABORT);
 	}
 	if (childpid != 0) {
 		/*
 		 *	PARENT:
 		 *	save the context by waiting
 		 *	until the child doing all of the work returns.
 		 *	don't catch the interrupt
 		 */
 		signal(SIGINT, SIG_IGN);
 #ifdef TDEBUG
 		msg("Tape: %d; parent process: %d child process %d\n",
 			tapeno+1, parentpid, childpid);
 #endif /* TDEBUG */
 		if (waitpid(childpid, &status, 0) == -1)
 			msg("Waiting for child %d: %s\n", childpid,
 			    strerror(errno));
 		if (status & 0xFF) {
 			msg("Child %d returns LOB status %o\n",
 				childpid, status&0xFF);
 		}
 		status = (status >> 8) & 0xFF;
 #ifdef TDEBUG
 		switch(status) {
 			case X_FINOK:
 				msg("Child %d finishes X_FINOK\n", childpid);
 				break;
 			case X_ABORT:
 				msg("Child %d finishes X_ABORT\n", childpid);
 				break;
 			case X_REWRITE:
 				msg("Child %d finishes X_REWRITE\n", childpid);
 				break;
 			default:
 				msg("Child %d finishes unknown %d\n",
 					childpid, status);
 				break;
 		}
 #endif /* TDEBUG */
 		switch(status) {
 			case X_FINOK:
 				Exit(X_FINOK);
 			case X_ABORT:
 				Exit(X_ABORT);
 			case X_REWRITE:
 				goto restore_check_point;
 			default:
 				msg("Bad return code from dump: %d\n", status);
 				Exit(X_ABORT);
 		}
 		/*NOTREACHED*/
 	} else {	/* we are the child; just continue */
 #ifdef TDEBUG
 		sleep(4);	/* allow time for parent's message to get out */
 		msg("Child on Tape %d has parent %d, my pid = %d\n",
 			tapeno+1, parentpid, getpid());
 #endif /* TDEBUG */
 		/*
 		 * If we have a name like "/dev/rmt0,/dev/rmt1",
 		 * use the name before the comma first, and save
 		 * the remaining names for subsequent volumes.
 		 */
 		tapeno++;               /* current tape sequence */
 		if (nexttape || strchr(tape, ',')) {
 			if (nexttape && *nexttape)
 				tape = nexttape;
 			if ((p = strchr(tape, ',')) != NULL) {
 				*p = '\0';
 				nexttape = p + 1;
 			} else
 				nexttape = NULL;
 			msg("Dumping volume %d on %s\n", tapeno, tape);
 		}
 		if (pipeout) {
 			tapefd = STDOUT_FILENO;
 		} else if (popenout) {
 			char volno[sizeof("2147483647")];
 
 			(void)sprintf(volno, "%d", spcl.c_volume + 1);
 			if (setenv("DUMP_VOLUME", volno, 1) == -1) {
 				msg("Cannot set $DUMP_VOLUME.\n");
 				dumpabort(0);
 			}
 			popenfp = popen(popenout, "w");
 			if (popenfp == NULL) {
 				msg("Cannot open output pipeline \"%s\".\n",
 				    popenout);
 				dumpabort(0);
 			}
 			tapefd = fileno(popenfp);
 		} else {
 #ifdef RDUMP
 			while ((tapefd = (host ? rmtopen(tape, 2) :
 				open(tape, O_WRONLY|O_CREAT, 0666))) < 0)
 #else
 			while ((tapefd =
 			    open(tape, O_WRONLY|O_CREAT, 0666)) < 0)
 #endif
 			    {
 				msg("Cannot open output \"%s\".\n", tape);
 				if (!query("Do you want to retry the open?"))
 					dumpabort(0);
 			}
 		}
 
 		create_workers();  /* Share open tape file descriptor with workers */
 		if (popenout)
 			close(tapefd);	/* Give up our copy of it. */
 		signal(SIGINFO, infosch);
 
 		asize = 0;
 		blocksthisvol = 0;
 		if (top)
 			newtape++;		/* new tape signal */
 		spcl.c_count = wp->count;
 		/*
 		 * measure firstrec in TP_BSIZE units since restore doesn't
 		 * know the correct ntrec value...
 		 */
 		spcl.c_firstrec = wp->firstrec;
 		spcl.c_volume++;
 		spcl.c_type = TS_TAPE;
 		writeheader((ino_t)wp->inode);
 		if (tapeno > 1)
 			msg("Volume %d begins with blocks from inode %d\n",
 				tapeno, wp->inode);
 	}
 }
 
 void
 dumpabort(int signo __unused)
 {
 
 	if (master != 0 && master != getpid())
 		/* Signals master to call dumpabort */
 		(void) kill(master, SIGTERM);
 	else {
 		killall();
 		msg("The ENTIRE dump is aborted.\n");
 	}
 #ifdef RDUMP
 	rmtclose();
 #endif
 	Exit(X_ABORT);
 }
 
 void
-Exit(status)
-	int status;
+Exit(int status)
 {
 
 #ifdef TDEBUG
 	msg("pid = %d exits with status %d\n", getpid(), status);
 #endif /* TDEBUG */
 	exit(status);
 }
 
 /*
  * proceed - handler for SIGUSR2, used to synchronize IO between the workers.
  */
 void
 proceed(int signo __unused)
 {
 
 	if (ready)
 		longjmp(jmpbuf, 1);
 	caught++;
 }
 
 void
 create_workers(void)
 {
 	int cmd[2];
 	int i, j;
 
 	master = getpid();
 
 	signal(SIGTERM, dumpabort);  /* Worker sends SIGTERM on dumpabort() */
 	signal(SIGPIPE, sigpipe);
 	signal(SIGUSR1, tperror);    /* Worker sends SIGUSR1 on tape errors */
 	signal(SIGUSR2, proceed);    /* Worker sends SIGUSR2 to next worker */
 
 	for (i = 0; i < WORKERS; i++) {
 		if (i == wp - &workers[0]) {
 			caught = 1;
 		} else {
 			caught = 0;
 		}
 
 		if (socketpair(AF_UNIX, SOCK_STREAM, 0, cmd) < 0 ||
 		    (workers[i].pid = fork()) < 0)
 			quit("too many workers, %d (recompile smaller): %s\n",
 			    i, strerror(errno));
 
 		workers[i].fd = cmd[1];
 		workers[i].sent = 0;
 		if (workers[i].pid == 0) { 	    /* Worker starts up here */
 			for (j = 0; j <= i; j++)
 			        (void) close(workers[j].fd);
 			signal(SIGINT, SIG_IGN);    /* Master handles this */
 			worker(cmd[0], i);
 			Exit(X_FINOK);
 		}
 	}
 
 	for (i = 0; i < WORKERS; i++)
-		(void) atomic(write, workers[i].fd,
-			      (char *) &workers[(i + 1) % WORKERS].pid,
+		(void) atomic_write(workers[i].fd,
+			      (const void *) &workers[(i + 1) % WORKERS].pid,
 		              sizeof workers[0].pid);
 
 	master = 0;
 }
 
 void
 killall(void)
 {
 	int i;
 
 	for (i = 0; i < WORKERS; i++)
 		if (workers[i].pid > 0) {
 			(void) kill(workers[i].pid, SIGKILL);
 			workers[i].sent = 0;
 		}
 }
 
 /*
  * Synchronization - each process has a lockfile, and shares file
  * descriptors to the following process's lockfile.  When our write
  * completes, we release our lock on the following process's lock-
  * file, allowing the following process to lock it and proceed. We
  * get the lock back for the next cycle by swapping descriptors.
  */
 static void
 worker(int cmd, int worker_number)
 {
 	int nread;
 	int nextworker, size, wrote, eot_count;
 
 	/*
 	 * Need our own seek pointer.
 	 */
 	(void) close(diskfd);
 	if ((diskfd = open(disk, O_RDONLY)) < 0)
 		quit("worker couldn't reopen disk: %s\n", strerror(errno));
 
 	/*
 	 * Need the pid of the next worker in the loop...
 	 */
-	if ((nread = atomic(read, cmd, (char *)&nextworker, sizeof nextworker))
+	if ((nread = atomic_read(cmd, (void *)&nextworker, sizeof nextworker))
 	    != sizeof nextworker) {
 		quit("master/worker protocol botched - didn't get pid of next worker.\n");
 	}
 
 	/*
 	 * Get list of blocks to dump, read the blocks into tape buffer
 	 */
-	while ((nread = atomic(read, cmd, (char *)wp->req, reqsiz)) == reqsiz) {
+	while ((nread = atomic_read(cmd, (void *)wp->req, reqsiz)) == reqsiz) {
 		struct req *p = wp->req;
 
 		for (trecno = 0; trecno < ntrec;
 		     trecno += p->count, p += p->count) {
 			if (p->dblk) {
 				blkread(p->dblk, wp->tblock[trecno],
 					p->count * TP_BSIZE);
 			} else {
-				if (p->count != 1 || atomic(read, cmd,
-				    (char *)wp->tblock[trecno],
+				if (p->count != 1 || atomic_read(cmd,
+				    (void *)wp->tblock[trecno],
 				    TP_BSIZE) != TP_BSIZE)
 				       quit("master/worker protocol botched.\n");
 			}
 		}
 		if (setjmp(jmpbuf) == 0) {
 			ready = 1;
 			if (!caught)
 				(void) pause();
 		}
 		ready = 0;
 		caught = 0;
 
 		/* Try to write the data... */
 		eot_count = 0;
 		size = 0;
 
 		wrote = 0;
 		while (eot_count < 10 && size < writesize) {
 #ifdef RDUMP
 			if (host)
 				wrote = rmtwrite(wp->tblock[0]+size,
 				    writesize-size);
 			else
 #endif
 				wrote = write(tapefd, wp->tblock[0]+size,
 				    writesize-size);
 #ifdef WRITEDEBUG
 			printf("worker %d wrote %d\n", worker_number, wrote);
 #endif
 			if (wrote < 0)
 				break;
 			if (wrote == 0)
 				eot_count++;
 			size += wrote;
 		}
 
 #ifdef WRITEDEBUG
 		if (size != writesize)
 		 printf("worker %d only wrote %d out of %d bytes and gave up.\n",
 		     worker_number, size, writesize);
 #endif
 
 		/*
 		 * Handle ENOSPC as an EOT condition.
 		 */
 		if (wrote < 0 && errno == ENOSPC) {
 			wrote = 0;
 			eot_count++;
 		}
 
 		if (eot_count > 0)
 			size = 0;
 
 		if (wrote < 0) {
 			(void) kill(master, SIGUSR1);
 			for (;;)
 				(void) sigpause(0);
 		} else {
 			/*
 			 * pass size of write back to master
 			 * (for EOT handling)
 			 */
-			(void) atomic(write, cmd, (char *)&size, sizeof size);
+			(void)atomic_write(cmd, (const void *)&size,
+			    sizeof size);
 		}
 
 		/*
 		 * If partial write, don't want next worker to go.
 		 * Also jolts him awake.
 		 */
 		(void) kill(nextworker, SIGUSR2);
 	}
 	if (nread != 0)
 		quit("error reading command pipe: %s\n", strerror(errno));
 }
 
 /*
  * Since a read from a pipe may not return all we asked for,
- * or a write may not write all we ask if we get a signal,
- * loop until the count is satisfied (or error).
+ * loop until count bytes are read, EOF (short count), or error (< 0).
  */
 static int
-atomic(ssize_t (*func)(), int fd, char *buf, int count)
+atomic_read(int fd, void *buf, int count)
 {
 	int got, need = count;
 
-	while ((got = (*func)(fd, buf, need)) > 0 && (need -= got) > 0)
+	while ((got = read(fd, buf, need)) > 0 && (need -= got) > 0)
+		buf = (char *)buf + got;	/* ISO C: no void * arithmetic */
+	return (got < 0 ? got : count - need);
+}
+
+/*
+ * Loop on write() until count bytes are written; a signal may cut a write
+ * short.  Returns bytes written, or write()'s negative result on error.
+ */
+static int
+atomic_write(int fd, const void *buf, int count)
+{
+	int got, need = count;
+
+	while ((got = write(fd, buf, need)) > 0 && (need -= got) > 0)
-		buf += got;
+		buf = (const char *)buf + got;	/* ISO C: no void * math */
 	return (got < 0 ? got : count - need);
 }
diff --git a/sbin/fsck_ffs/dir.c b/sbin/fsck_ffs/dir.c
index 18229ab96fb6..64e477c66ed8 100644
--- a/sbin/fsck_ffs/dir.c
+++ b/sbin/fsck_ffs/dir.c
@@ -1,928 +1,933 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 1980, 1986, 1993
  *	The Regents of the University of California.  All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #if 0
 #ifndef lint
 static const char sccsid[] = "@(#)dir.c	8.8 (Berkeley) 4/28/95";
 #endif /* not lint */
 #endif
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/time.h>
 #include <sys/types.h>
 #include <sys/sysctl.h>
 
 #include <ufs/ufs/dinode.h>
 #include <ufs/ufs/dir.h>
 #include <ufs/ffs/fs.h>
 
 #include <err.h>
 #include <string.h>
 
 #include "fsck.h"
 
 static struct	dirtemplate emptydir = {
 	0, DIRBLKSIZ, DT_UNKNOWN, 0, "",
 	0, 0, DT_UNKNOWN, 0, ""
 };
 static struct	dirtemplate dirhead = {
 	0, 12, DT_DIR, 1, ".",
 	0, DIRBLKSIZ - 12, DT_DIR, 2, ".."
 };
 
 static int chgino(struct inodesc *);
 static int dircheck(struct inodesc *, struct bufarea *, struct direct *);
 static int expanddir(struct inode *ip, char *name);
 static struct direct *fsck_readdir(struct inodesc *);
 static struct bufarea *getdirblk(ufs2_daddr_t blkno, long size);
 static int lftempname(char *bufp, ino_t ino);
 static int mkentry(struct inodesc *);
 
 /*
  * Propagate connected state through the tree.
  */
 void
 propagate(void)
 {
 	struct inoinfo **inpp, *inp;
 	struct inoinfo **inpend;
 	long change;
 
 	inpend = &inpsort[inplast];
 	do {
 		change = 0;
 		for (inpp = inpsort; inpp < inpend; inpp++) {
 			inp = *inpp;
 			if (inp->i_parent == 0)
 				continue;
 			if (inoinfo(inp->i_parent)->ino_state == DFOUND &&
 			    INO_IS_DUNFOUND(inp->i_number)) {
 				inoinfo(inp->i_number)->ino_state = DFOUND;
 				change++;
 			}
 		}
 	} while (change > 0);
 }
 
 /*
  * Scan each entry in a directory block.
  */
 int
 dirscan(struct inodesc *idesc)
 {
 	struct direct *dp;
 	struct bufarea *bp;
 	u_int dsize, n;
 	long blksiz;
 	char dbuf[DIRBLKSIZ];
 
 	if (idesc->id_type != DATA)
 		errx(EEXIT, "wrong type to dirscan %d", idesc->id_type);
 	if (idesc->id_entryno == 0 &&
 	    (idesc->id_filesize & (DIRBLKSIZ - 1)) != 0)
 		idesc->id_filesize = roundup(idesc->id_filesize, DIRBLKSIZ);
 	blksiz = idesc->id_numfrags * sblock.fs_fsize;
 	if (chkrange(idesc->id_blkno, idesc->id_numfrags)) {
 		idesc->id_filesize -= blksiz;
 		return (SKIP);
 	}
 	idesc->id_loc = 0;
 	for (dp = fsck_readdir(idesc); dp != NULL; dp = fsck_readdir(idesc)) {
 		dsize = dp->d_reclen;
 		if (dsize > sizeof(dbuf))
 			dsize = sizeof(dbuf);
 		memmove(dbuf, dp, (size_t)dsize);
 		idesc->id_dirp = (struct direct *)dbuf;
 		if ((n = (*idesc->id_func)(idesc)) & ALTERED) {
 			bp = getdirblk(idesc->id_blkno, blksiz);
 			if (bp->b_errs != 0)
 				return (STOP);
 			memmove(bp->b_un.b_buf + idesc->id_loc - dsize, dbuf,
 			    (size_t)dsize);
 			dirty(bp);
 			sbdirty();
 		}
 		if (n & STOP)
 			return (n);
 	}
 	return (idesc->id_filesize > 0 ? KEEPON : STOP);
 }
 
 /*
  * Get and verify the next entry in a directory.
  * We also verify that if there is another entry in the block that it is
  * valid, so if it is not valid it can be subsumed into the current entry. 
  */
 static struct direct *
 fsck_readdir(struct inodesc *idesc)
 {
 	struct direct *dp, *ndp;
 	struct bufarea *bp;
 	long size, blksiz, subsume_ndp;
 
 	subsume_ndp = 0;
 	blksiz = idesc->id_numfrags * sblock.fs_fsize;
 	if (idesc->id_filesize <= 0 || idesc->id_loc >= blksiz)
 		return (NULL);
 	bp = getdirblk(idesc->id_blkno, blksiz);
 	if (bp->b_errs != 0)
 		return (NULL);
 	dp = (struct direct *)(bp->b_un.b_buf + idesc->id_loc);
 	/*
 	 * Only need to check current entry if it is the first in the
 	 * the block, as later entries will have been checked in the
 	 * previous call to this function.
 	 */
 	if (idesc->id_loc % DIRBLKSIZ != 0 || dircheck(idesc, bp, dp) != 0) {
 		/*
 		 * Current entry is good, update to point at next.
 		 */
 		idesc->id_loc += dp->d_reclen;
 		idesc->id_filesize -= dp->d_reclen;
 		/*
 		 * If at end of directory block, just return this entry.
 		 */
 		if (idesc->id_filesize <= 0 || idesc->id_loc >= blksiz ||
 		    idesc->id_loc % DIRBLKSIZ == 0)
 			return (dp);
 		/*
 		 * If the next entry good, return this entry.
 		 */
 		ndp = (struct direct *)(bp->b_un.b_buf + idesc->id_loc);
 		if (dircheck(idesc, bp, ndp) != 0)
 			return (dp);
 		/*
 		 * The next entry is bad, so subsume it and the remainder
 		 * of this directory block into this entry.
 		 */
 		subsume_ndp = 1;
 	}
 	/*
 	 * Current or next entry is bad. Zap current entry or
 	 * subsume next entry into current entry as appropriate.
 	 */
 	size = DIRBLKSIZ - (idesc->id_loc % DIRBLKSIZ);
 	idesc->id_loc += size;
 	idesc->id_filesize -= size;
 	if (idesc->id_fix == IGNORE)
 		return (NULL);
 	if (subsume_ndp) {
 		memset(ndp, 0, size);
 		dp->d_reclen += size;
 	} else {
 		memset(dp, 0, size);
 		dp->d_reclen = size;
 	}
 	if (dofix(idesc, "DIRECTORY CORRUPTED"))
 		dirty(bp);
 	return (dp);
 }
 
 /*
  * Verify that a directory entry is valid.
  * This is a superset of the checks made in the kernel.
  * Also optionally clears padding and unused directory space.
  *
  * Returns 0 if the entry is bad, 1 if the entry is good.
  */
 static int
 dircheck(struct inodesc *idesc, struct bufarea *bp, struct direct *dp)
 {
 	size_t size;
 	char *cp;
 	u_int8_t namlen;
 	int spaceleft, modified, unused;
 
 	spaceleft = DIRBLKSIZ - (idesc->id_loc % DIRBLKSIZ);
 	size = DIRSIZ(0, dp);
 	if (dp->d_reclen == 0 ||
 	    dp->d_reclen > spaceleft ||
 	    dp->d_reclen < size ||
 	    idesc->id_filesize < size ||
 	    (dp->d_reclen & (DIR_ROUNDUP - 1)) != 0)
 		goto bad;
 	modified = 0;
 	if (dp->d_ino == 0) {
 		if (!zflag || fswritefd < 0)
 			return (1);
 		/*
 		 * Special case of an unused directory entry. Normally only
 		 * occurs at the beginning of a directory block when the block
 		 * contains no entries. Other than the first entry in a
 		 * directory block, the kernel coalesces unused space with
 		 * the previous entry by extending its d_reclen. However,
 		 * when cleaning up a directory, fsck may set d_ino to zero
 		 * in the middle of a directory block. If we're clearing out
 		 * directory cruft (-z flag), then make sure that all directory
 		 * space in entries with d_ino == 0 gets fully cleared.
 		 */
 		if (dp->d_type != 0) {
 			dp->d_type = 0;
 			modified = 1;
 		}
 		if (dp->d_namlen != 0) {
 			dp->d_namlen = 0;
 			modified = 1;
 		}
 		unused = dp->d_reclen - __offsetof(struct direct, d_name);
 		for (cp = dp->d_name; unused > 0; unused--, cp++) {
 			if (*cp != '\0') {
 				*cp = '\0';
 				modified = 1;
 			}
 		}
 		if (modified)
 			dirty(bp);
 		return (1);
 	}
 	/*
 	 * The d_type field should not be tested here. A bad type is an error
 	 * in the entry itself but is not a corruption of the directory
 	 * structure itself. So blowing away all the remaining entries in the
 	 * directory block is inappropriate. Rather the type error should be
 	 * checked in pass1 and fixed there.
 	 *
 	 * The name validation should also be done in pass1 although the
 	 * check to see if the name is longer than fits in the space
 	 * allocated for it (i.e., the *cp != '\0' fails after exiting the
 	 * loop below) then it really is a structural error that requires
 	 * the stronger action taken here.
 	 */
 	namlen = dp->d_namlen;
 	if (namlen == 0 || dp->d_type > 15)
 		goto bad;
 	for (cp = dp->d_name, size = 0; size < namlen; size++) {
 		if (*cp == '\0' || *cp++ == '/')
 			goto bad;
 	}
 	if (*cp != '\0')
 		goto bad;
 	if (zflag && fswritefd >= 0) {
 		/*
 		 * Clear unused directory entry space, including the d_name
 		 * padding.
 		 */
 		/* First figure the number of pad bytes. */
 		unused = roundup2(namlen + 1, DIR_ROUNDUP) - (namlen + 1);
 
 		/* Add in the free space to the end of the record. */
 		unused += dp->d_reclen - DIRSIZ(0, dp);
 
 		/*
 		 * Now clear out the unused space, keeping track if we actually
 		 * changed anything.
 		 */
 		for (cp = &dp->d_name[namlen + 1]; unused > 0; unused--, cp++) {
 			if (*cp != '\0') {
 				*cp = '\0';
 				modified = 1;
 			}
 		}
 		
 		if (modified)
 			dirty(bp);
 	}
 	return (1);
 
 bad:
 	if (debug)
 		printf("Bad dir: ino %d reclen %d namlen %d type %d name %s\n",
 		    dp->d_ino, dp->d_reclen, dp->d_namlen, dp->d_type,
 		    dp->d_name);
 	return (0);
 }
 
 void
 direrror(ino_t ino, const char *errmesg)
 {
 
 	fileerror(ino, ino, errmesg);
 }
 
 void
 fileerror(ino_t cwd, ino_t ino, const char *errmesg)
 {
 	struct inode ip;
 	union dinode *dp;
 	char pathbuf[MAXPATHLEN + 1];
 
 	pwarn("%s ", errmesg);
 	if (ino < UFS_ROOTINO || ino > maxino) {
 		pfatal("out-of-range inode number %ju", (uintmax_t)ino);
 		return;
 	}
 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	prtinode(&ip);
 	printf("\n");
 	getpathname(pathbuf, cwd, ino);
 	if (ftypeok(dp))
 		pfatal("%s=%s\n",
 		    (DIP(dp, di_mode) & IFMT) == IFDIR ? "DIR" : "FILE",
 		    pathbuf);
 	else
 		pfatal("NAME=%s\n", pathbuf);
 	irelse(&ip);
 }
 
 void
 adjust(struct inodesc *idesc, int lcnt)
 {
 	struct inode ip;
 	union dinode *dp;
 	int saveresolved;
 
 	ginode(idesc->id_number, &ip);
 	dp = ip.i_dp;
 	if (DIP(dp, di_nlink) == lcnt) {
 		/*
 		 * If we have not hit any unresolved problems, are running
 		 * in preen mode, and are on a file system using soft updates,
 		 * then just toss any partially allocated files.
 		 */
 		if (resolved && (preen || bkgrdflag) && usedsoftdep) {
 			clri(idesc, "UNREF", 1);
 			irelse(&ip);
 			return;
 		} else {
 			/*
 			 * The file system can be marked clean even if
 			 * a file is not linked up, but is cleared.
 			 * Hence, resolved should not be cleared when
 			 * linkup is answered no, but clri is answered yes.
 			 */
 			saveresolved = resolved;
 			if (linkup(idesc->id_number, (ino_t)0, NULL) == 0) {
 				resolved = saveresolved;
 				clri(idesc, "UNREF", 0);
 				irelse(&ip);
 				return;
 			}
 			/*
 			 * Account for the new reference created by linkup().
 			 */
 			lcnt--;
 		}
 	}
 	if (lcnt != 0) {
 		pwarn("LINK COUNT %s", (lfdir == idesc->id_number) ? lfname :
 			((DIP(dp, di_mode) & IFMT) == IFDIR ? "DIR" : "FILE"));
 		prtinode(&ip);
 		printf(" COUNT %d SHOULD BE %d",
 			DIP(dp, di_nlink), DIP(dp, di_nlink) - lcnt);
 		if (preen || usedsoftdep) {
 			if (lcnt < 0) {
 				printf("\n");
 				pfatal("LINK COUNT INCREASING");
 			}
 			if (preen)
 				printf(" (ADJUSTED)\n");
 		}
 		if (preen || reply("ADJUST") == 1) {
 			if (bkgrdflag == 0) {
 				DIP_SET(dp, di_nlink, DIP(dp, di_nlink) - lcnt);
 				inodirty(&ip);
 			} else {
 				cmd.value = idesc->id_number;
 				cmd.size = -lcnt;
 				if (debug)
 					printf("adjrefcnt ino %ld amt %lld\n",
 					    (long)cmd.value,
 					    (long long)cmd.size);
 				if (sysctl(adjrefcnt, MIBSIZE, 0, 0,
 				    &cmd, sizeof cmd) == -1)
 					rwerror("ADJUST INODE", cmd.value);
 			}
 		}
 	}
 	irelse(&ip);
 }
 
 static int
 mkentry(struct inodesc *idesc)
 {
 	struct direct *dirp = idesc->id_dirp;
 	struct direct newent;
 	int newlen, oldlen;
 
 	newent.d_namlen = strlen(idesc->id_name);
 	newlen = DIRSIZ(0, &newent);
 	if (dirp->d_ino != 0)
 		oldlen = DIRSIZ(0, dirp);
 	else
 		oldlen = 0;
 	if (dirp->d_reclen - oldlen < newlen)
 		return (KEEPON);
 	newent.d_reclen = dirp->d_reclen - oldlen;
 	dirp->d_reclen = oldlen;
 	dirp = (struct direct *)(((char *)dirp) + oldlen);
 	dirp->d_ino = idesc->id_parent;	/* ino to be entered is in id_parent */
 	dirp->d_reclen = newent.d_reclen;
 	dirp->d_type = inoinfo(idesc->id_parent)->ino_type;
 	dirp->d_namlen = newent.d_namlen;
 	memmove(dirp->d_name, idesc->id_name, (size_t)newent.d_namlen + 1);
 	return (ALTERED|STOP);
 }
 
 static int
 chgino(struct inodesc *idesc)
 {
 	struct direct *dirp = idesc->id_dirp;
 
 	if (memcmp(dirp->d_name, idesc->id_name, (int)dirp->d_namlen + 1))
 		return (KEEPON);
 	dirp->d_ino = idesc->id_parent;
 	dirp->d_type = inoinfo(idesc->id_parent)->ino_type;
 	return (ALTERED|STOP);
 }
 
 int
 linkup(ino_t orphan, ino_t parentdir, char *name)
 {
 	struct inode ip;
 	union dinode *dp;
 	int lostdir;
 	ino_t oldlfdir;
 	struct inoinfo *inp;
 	struct inodesc idesc;
 	char tempname[BUFSIZ];
 
 	memset(&idesc, 0, sizeof(struct inodesc));
 	ginode(orphan, &ip);
 	dp = ip.i_dp;
 	lostdir = (DIP(dp, di_mode) & IFMT) == IFDIR;
 	pwarn("UNREF %s ", lostdir ? "DIR" : "FILE");
 	prtinode(&ip);
 	printf("\n");
 	if (preen && DIP(dp, di_size) == 0) {
 		irelse(&ip);
 		return (0);
 	}
 	irelse(&ip);
 	if (cursnapshot != 0) {
 		pfatal("FILE LINKUP IN SNAPSHOT");
 		return (0);
 	}
 	if (preen)
 		printf(" (RECONNECTED)\n");
 	else if (reply("RECONNECT") == 0)
 		return (0);
 	if (lfdir == 0) {
 		ginode(UFS_ROOTINO, &ip);
 		idesc.id_name = strdup(lfname);
 		idesc.id_type = DATA;
 		idesc.id_func = findino;
 		idesc.id_number = UFS_ROOTINO;
 		if ((ckinode(ip.i_dp, &idesc) & FOUND) != 0) {
 			lfdir = idesc.id_parent;
 		} else {
 			pwarn("NO lost+found DIRECTORY");
 			if (preen || reply("CREATE")) {
 				lfdir = allocdir(UFS_ROOTINO, (ino_t)0, lfmode);
 				if (lfdir != 0) {
 					if (makeentry(UFS_ROOTINO, lfdir,
 					    lfname) != 0) {
 						numdirs++;
 						if (preen)
 							printf(" (CREATED)\n");
 					} else {
 						freedirino(lfdir, UFS_ROOTINO);
 						lfdir = 0;
 						if (preen)
 							printf("\n");
 					}
 				}
 			}
 		}
 		irelse(&ip);
+		free(idesc.id_name);
 		if (lfdir == 0) {
 			pfatal("SORRY. CANNOT CREATE lost+found DIRECTORY");
 			printf("\n\n");
 			return (0);
 		}
 	}
 	ginode(lfdir, &ip);
 	dp = ip.i_dp;
 	if ((DIP(dp, di_mode) & IFMT) != IFDIR) {
 		pfatal("lost+found IS NOT A DIRECTORY");
 		if (reply("REALLOCATE") == 0) {
 			irelse(&ip);
 			return (0);
 		}
 		oldlfdir = lfdir;
 		if ((lfdir = allocdir(UFS_ROOTINO, (ino_t)0, lfmode)) == 0) {
 			pfatal("SORRY. CANNOT CREATE lost+found DIRECTORY\n\n");
 			irelse(&ip);
 			return (0);
 		}
 		if ((changeino(UFS_ROOTINO, lfname, lfdir) & ALTERED) == 0) {
 			pfatal("SORRY. CANNOT CREATE lost+found DIRECTORY\n\n");
 			irelse(&ip);
 			return (0);
 		}
 		idesc.id_type = inoinfo(oldlfdir)->ino_idtype;
 		idesc.id_func = freeblock;
 		idesc.id_number = oldlfdir;
 		adjust(&idesc, inoinfo(oldlfdir)->ino_linkcnt + 1);
 		inoinfo(oldlfdir)->ino_linkcnt = 0;
 		inodirty(&ip);
 		irelse(&ip);
 		ginode(lfdir, &ip);
 		dp = ip.i_dp;
 	}
 	if (inoinfo(lfdir)->ino_state != DFOUND) {
 		pfatal("SORRY. NO lost+found DIRECTORY\n\n");
 		irelse(&ip);
 		return (0);
 	}
 	(void)lftempname(tempname, orphan);
 	if (makeentry(lfdir, orphan, (name ? name : tempname)) == 0) {
 		pfatal("SORRY. NO SPACE IN lost+found DIRECTORY");
 		printf("\n\n");
 		irelse(&ip);
 		return (0);
 	}
 	inoinfo(orphan)->ino_linkcnt--;
 	if (lostdir) {
 		if ((changeino(orphan, "..", lfdir) & ALTERED) == 0 &&
 		    parentdir != (ino_t)-1)
 			(void)makeentry(orphan, lfdir, "..");
 		DIP_SET(dp, di_nlink, DIP(dp, di_nlink) + 1);
 		inodirty(&ip);
 		inoinfo(lfdir)->ino_linkcnt++;
 		pwarn("DIR I=%lu CONNECTED. ", (u_long)orphan);
 		inp = getinoinfo(parentdir);
 		if (parentdir != (ino_t)-1 && inp != NULL) {
 			printf("PARENT WAS I=%lu\n", (u_long)parentdir);
 			/*
 			 * If the parent directory did not have to
 			 * be replaced then because of the ordering
 			 * guarantees, has had the link count incremented
 			 * for the child, but no entry was made.  This
 			 * fixes the parent link count so that fsck does
 			 * not need to be rerun.
 			 */
 			if ((inp->i_flags & INFO_NEW) != 0)
 				inoinfo(parentdir)->ino_linkcnt++;
 		}
 		if (preen == 0)
 			printf("\n");
 	}
 	irelse(&ip);
 	return (1);
 }
 
 /*
  * fix an entry in a directory.
  */
 int
 changeino(ino_t dir, const char *name, ino_t newnum)
 {
 	struct inodesc idesc;
 	struct inode ip;
 	int error;
 
 	memset(&idesc, 0, sizeof(struct inodesc));
 	idesc.id_type = DATA;
 	idesc.id_func = chgino;
 	idesc.id_number = dir;
 	idesc.id_fix = DONTKNOW;
 	idesc.id_name = strdup(name);
 	idesc.id_parent = newnum;	/* new value for name */
 	ginode(dir, &ip);
 	error = ckinode(ip.i_dp, &idesc);
+	free(idesc.id_name);
 	irelse(&ip);
 	return (error);
 }
 
 /*
  * make an entry in a directory
  */
 int
 makeentry(ino_t parent, ino_t ino, const char *name)
 {
 	struct inode ip;
 	union dinode *dp;
 	struct inodesc idesc;
 	int retval;
 	char pathbuf[MAXPATHLEN + 1];
 
 	if (parent < UFS_ROOTINO || parent >= maxino ||
 	    ino < UFS_ROOTINO || ino >= maxino)
 		return (0);
 	memset(&idesc, 0, sizeof(struct inodesc));
 	idesc.id_type = DATA;
 	idesc.id_func = mkentry;
 	idesc.id_number = parent;
 	idesc.id_parent = ino;	/* this is the inode to enter */
 	idesc.id_fix = DONTKNOW;
 	idesc.id_name = strdup(name);
 	ginode(parent, &ip);
 	dp = ip.i_dp;
 	if (DIP(dp, di_size) % DIRBLKSIZ) {
 		DIP_SET(dp, di_size, roundup(DIP(dp, di_size), DIRBLKSIZ));
 		inodirty(&ip);
 	}
 	if ((ckinode(dp, &idesc) & ALTERED) != 0) {
 		irelse(&ip);
+		free(idesc.id_name);
 		return (1);
 	}
 	getpathname(pathbuf, parent, parent);
 	if (expanddir(&ip, pathbuf) == 0) {
 		irelse(&ip);
+		free(idesc.id_name);
 		return (0);
 	}
 	retval = ckinode(dp, &idesc) & ALTERED;
 	irelse(&ip);
+	free(idesc.id_name);
 	return (retval);
 }
 
 /*
  * Attempt to expand the size of a directory
  */
 static int
 expanddir(struct inode *ip, char *name)
 {
 	ufs2_daddr_t lastlbn, oldblk, newblk, indirblk;
 	size_t filesize, lastlbnsize;
 	struct bufarea *bp, *nbp;
 	struct inodesc idesc;
 	union dinode *dp;
 	long cg, indiralloced;
 	char *cp;
 
 	nbp = NULL;
 	indiralloced = newblk = indirblk = 0;
 	memset(&idesc, 0, sizeof(struct inodesc));
 	idesc.id_type = ADDR;
 	pwarn("NO SPACE LEFT IN %s", name);
 	if (!preen && reply("EXPAND") == 0)
 		return (0);
 	cg = ino_to_cg(&sblock, ip->i_number);
 	dp = ip->i_dp;
 	filesize = DIP(dp, di_size);
 	lastlbn = lblkno(&sblock, filesize);
 	/*
 	 * We only expand lost+found to a single indirect block.
 	 */
 	if ((DIP(dp, di_mode) & IFMT) != IFDIR || filesize == 0 ||
 	    lastlbn >= UFS_NDADDR + NINDIR(&sblock))
 		goto bad;
 	/*
 	 * If last block is a fragment, expand it to a full size block.
 	 */
 	lastlbnsize = sblksize(&sblock, filesize, lastlbn);
 	if (lastlbnsize > 0 && lastlbnsize < sblock.fs_bsize) {
 		oldblk = DIP(dp, di_db[lastlbn]);
 		bp = getdirblk(oldblk, lastlbnsize);
 		if (bp->b_errs)
 			goto bad;
 		newblk = allocblk(cg, sblock.fs_frag, std_checkblkavail);
 		if (newblk == 0)
 			goto bad;
 		nbp = getdatablk(newblk, sblock.fs_bsize, BT_DIRDATA);
 		if (nbp->b_errs)
 			goto bad;
 		DIP_SET(dp, di_db[lastlbn], newblk);
 		DIP_SET(dp, di_size, filesize + sblock.fs_bsize - lastlbnsize);
 		DIP_SET(dp, di_blocks, DIP(dp, di_blocks) +
 		    btodb(sblock.fs_bsize - lastlbnsize));
 		inodirty(ip);
 		memmove(nbp->b_un.b_buf, bp->b_un.b_buf, lastlbnsize);
 		memset(&nbp->b_un.b_buf[lastlbnsize], 0,
 		    sblock.fs_bsize - lastlbnsize);
 		for (cp = &nbp->b_un.b_buf[lastlbnsize];
 		     cp < &nbp->b_un.b_buf[sblock.fs_bsize];
 		     cp += DIRBLKSIZ)
 			memmove(cp, &emptydir, sizeof emptydir);
 		dirty(nbp);
 		brelse(nbp);
 		binval(bp);
 		idesc.id_blkno = oldblk;
 		idesc.id_numfrags = numfrags(&sblock, lastlbnsize);
 		(void)freeblock(&idesc);
 		if (preen)
 			printf(" (EXPANDED)\n");
 		return (1);
 	}
 	if ((newblk = allocblk(cg, sblock.fs_frag, std_checkblkavail)) == 0)
 		goto bad;
 	bp = getdirblk(newblk, sblock.fs_bsize);
 	if (bp->b_errs)
 		goto bad;
 	memset(bp->b_un.b_buf, 0, sblock.fs_bsize);
 	for (cp = bp->b_un.b_buf;
 	     cp < &bp->b_un.b_buf[sblock.fs_bsize];
 	     cp += DIRBLKSIZ)
 		memmove(cp, &emptydir, sizeof emptydir);
 	dirty(bp);
 	if (lastlbn < UFS_NDADDR) {
 		DIP_SET(dp, di_db[lastlbn], newblk);
 	} else {
 		/*
 		 * Allocate indirect block if needed.
 		 */
 		if ((indirblk = DIP(dp, di_ib[0])) == 0) {
 			indirblk = allocblk(cg, sblock.fs_frag,
 			    std_checkblkavail);
 			if (indirblk == 0) {
 				binval(bp);
 				goto bad;
 			}
 			indiralloced = 1;
 		}
 		nbp = getdatablk(indirblk, sblock.fs_bsize, BT_LEVEL1);
 		if (nbp->b_errs)
 			goto bad;
 		if (indiralloced) {
 			memset(nbp->b_un.b_buf, 0, sblock.fs_bsize);
 			DIP_SET(dp, di_ib[0], indirblk);
 			DIP_SET(dp, di_blocks,
 			    DIP(dp, di_blocks) + btodb(sblock.fs_bsize));
 		}
 		IBLK_SET(nbp, lastlbn - UFS_NDADDR, newblk);
 		dirty(nbp);
 		brelse(nbp);
 	}
 	DIP_SET(dp, di_size, filesize + sblock.fs_bsize);
 	DIP_SET(dp, di_blocks, DIP(dp, di_blocks) + btodb(sblock.fs_bsize));
 	inodirty(ip);
 	if (preen)
 		printf(" (EXPANDED)\n");
 	return (1);
 bad:
 	pfatal(" (EXPANSION FAILED)\n");
 	if (nbp != NULL) {
 		binval(bp);
 		brelse(nbp);
 	}
 	if (newblk != 0) {
 		idesc.id_blkno = newblk;
 		idesc.id_numfrags = sblock.fs_frag;
 		(void)freeblock(&idesc);
 	}
 	if (indiralloced) {
 		idesc.id_blkno = indirblk;
 		idesc.id_numfrags = sblock.fs_frag;
 		(void)freeblock(&idesc);
 	}
 	return (0);
 }
 
 /*
  * allocate a new directory
  */
 ino_t
 allocdir(ino_t parent, ino_t request, int mode)
 {
 	ino_t ino;
 	char *cp;
 	struct inode ip;
 	union dinode *dp;
 	struct bufarea *bp;
 	struct inoinfo *inp;
 	struct dirtemplate *dirp;
 
 	ino = allocino(request, IFDIR|mode);
 	if (ino == 0)
 		return (0);
 	dirp = &dirhead;
 	dirp->dot_ino = ino;
 	dirp->dotdot_ino = parent;
 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	bp = getdirblk(DIP(dp, di_db[0]), sblock.fs_fsize);
 	if (bp->b_errs) {
 		freeino(ino);
 		irelse(&ip);
 		return (0);
 	}
 	memmove(bp->b_un.b_buf, dirp, sizeof(struct dirtemplate));
 	for (cp = &bp->b_un.b_buf[DIRBLKSIZ];
 	     cp < &bp->b_un.b_buf[sblock.fs_fsize];
 	     cp += DIRBLKSIZ)
 		memmove(cp, &emptydir, sizeof emptydir);
 	dirty(bp);
 	DIP_SET(dp, di_nlink, 2);
 	inodirty(&ip);
 	if (ino == UFS_ROOTINO) {
 		inp = cacheino(dp, ino);
 		inp->i_parent = parent;
 		inp->i_dotdot = parent;
 		inp->i_flags |= INFO_NEW;
 		inoinfo(ino)->ino_type = DT_DIR;
 		inoinfo(ino)->ino_linkcnt = DIP(dp, di_nlink);
 		irelse(&ip);
 		return(ino);
 	}
 	if (!INO_IS_DVALID(parent)) {
 		freeino(ino);
 		irelse(&ip);
 		return (0);
 	}
 	inp = cacheino(dp, ino);
 	inp->i_parent = parent;
 	inp->i_dotdot = parent;
 	inp->i_flags |= INFO_NEW;
 	inoinfo(ino)->ino_type = DT_DIR;
 	inoinfo(ino)->ino_state = inoinfo(parent)->ino_state;
 	if (inoinfo(ino)->ino_state == DSTATE) {
 		inoinfo(ino)->ino_linkcnt = DIP(dp, di_nlink);
 		inoinfo(parent)->ino_linkcnt++;
 	}
 	irelse(&ip);
 	ginode(parent, &ip);
 	dp = ip.i_dp;
 	DIP_SET(dp, di_nlink, DIP(dp, di_nlink) + 1);
 	inodirty(&ip);
 	irelse(&ip);
 	return (ino);
 }
 
 /*
  * free a directory inode
  */
 void
 freedirino(ino_t ino, ino_t parent)
 {
 	struct inode ip;
 	union dinode *dp;
 
 	if (ino != parent) {
 		ginode(parent, &ip);
 		dp = ip.i_dp;
 		DIP_SET(dp, di_nlink, DIP(dp, di_nlink) - 1);
 		inodirty(&ip);
 		irelse(&ip);
 	}
 	removecachedino(ino);
 	freeino(ino);
 }
 
 /*
  * generate a temporary name for the lost+found directory.
  */
 static int
 lftempname(char *bufp, ino_t ino)
 {
 	ino_t in;
 	char *cp;
 	int namlen;
 
 	cp = bufp + 2;
 	for (in = maxino; in > 0; in /= 10)
 		cp++;
 	*--cp = 0;
 	namlen = cp - bufp;
 	in = ino;
 	while (cp > bufp) {
 		*--cp = (in % 10) + '0';
 		in /= 10;
 	}
 	*cp = '#';
 	return (namlen);
 }
 
 /*
  * Get a directory block.
  * Insure that it is held until another is requested.
  */
 static struct bufarea *
 getdirblk(ufs2_daddr_t blkno, long size)
 {
 
 	if (pdirbp != NULL && pdirbp->b_errs == 0)
 		brelse(pdirbp);
 	pdirbp = getdatablk(blkno, size, BT_DIRDATA);
 	return (pdirbp);
 }
diff --git a/sbin/fsck_ffs/fsutil.c b/sbin/fsck_ffs/fsutil.c
index d8842e7d41f2..44b3e50da012 100644
--- a/sbin/fsck_ffs/fsutil.c
+++ b/sbin/fsck_ffs/fsutil.c
@@ -1,1469 +1,1469 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 1980, 1986, 1993
  *	The Regents of the University of California.  All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #if 0
 #ifndef lint
 static const char sccsid[] = "@(#)utilities.c	8.6 (Berkeley) 5/19/95";
 #endif /* not lint */
 #endif
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/time.h>
 #include <sys/types.h>
 #include <sys/sysctl.h>
 #include <sys/disk.h>
 #include <sys/disklabel.h>
 #include <sys/ioctl.h>
 #include <sys/stat.h>
 
 #include <ufs/ufs/dinode.h>
 #include <ufs/ufs/dir.h>
 #include <ufs/ffs/fs.h>
 
 #include <err.h>
 #include <errno.h>
 #include <string.h>
 #include <ctype.h>
 #include <fstab.h>
 #include <stdint.h>
 #include <stdio.h>
 #include <stdlib.h>
 #include <time.h>
 #include <unistd.h>
 #include <libufs.h>
 
 #include "fsck.h"
 
 int		sujrecovery = 0;
 
 static struct bufarea *allocbuf(const char *);
 static void cg_write(struct bufarea *);
 static void slowio_start(void);
 static void slowio_end(void);
 static void printIOstats(void);
 
 static long diskreads, totaldiskreads, totalreads; /* Disk cache statistics */
 static struct timespec startpass, finishpass;
 struct timeval slowio_starttime;
 int slowio_delay_usec = 10000;	/* Initial IO delay for background fsck */
 int slowio_pollcnt;
 static struct bufarea cgblk;	/* backup buffer for cylinder group blocks */
 static struct bufarea failedbuf; /* returned by failed getdatablk() */
 static TAILQ_HEAD(bufqueue, bufarea) bufqueuehd; /* head of buffer cache LRU */
 static LIST_HEAD(bufhash, bufarea) bufhashhd[HASHSIZE]; /* buffer hash list */
 static struct bufhash freebufs;	/* unused buffers */
 static int numbufs;		/* size of buffer cache */
 static int cachelookups;	/* number of cache lookups */
 static int cachereads;		/* number of cache reads */
 static int flushtries;		/* number of tries to reclaim memory */
 
 char *buftype[BT_NUMBUFTYPES] = BT_NAMES;
 
 void
 fsutilinit(void)
 {
 	diskreads = totaldiskreads = totalreads = 0;
 	bzero(&startpass, sizeof(struct timespec));
 	bzero(&finishpass, sizeof(struct timespec));
 	bzero(&slowio_starttime, sizeof(struct timeval));
 	slowio_delay_usec = 10000;
 	slowio_pollcnt = 0;
 	flushtries = 0;
 }
 
 int
 ftypeok(union dinode *dp)
 {
 	switch (DIP(dp, di_mode) & IFMT) {
 
 	case IFDIR:
 	case IFREG:
 	case IFBLK:
 	case IFCHR:
 	case IFLNK:
 	case IFSOCK:
 	case IFIFO:
 		return (1);
 
 	default:
 		if (debug)
 			printf("bad file type 0%o\n", DIP(dp, di_mode));
 		return (0);
 	}
 }
 
 int
 reply(const char *question)
 {
 	int persevere;
 	char c;
 
 	if (preen)
 		pfatal("INTERNAL ERROR: GOT TO reply()");
 	persevere = !strcmp(question, "CONTINUE");
 	printf("\n");
 	if (!persevere && (nflag || (fswritefd < 0 && bkgrdflag == 0))) {
 		printf("%s? no\n\n", question);
 		resolved = 0;
 		return (0);
 	}
 	if (yflag || (persevere && nflag)) {
 		printf("%s? yes\n\n", question);
 		return (1);
 	}
 	do	{
 		printf("%s? [yn] ", question);
 		(void) fflush(stdout);
 		c = getc(stdin);
 		while (c != '\n' && getc(stdin) != '\n') {
 			if (feof(stdin)) {
 				resolved = 0;
 				return (0);
 			}
 		}
 	} while (c != 'y' && c != 'Y' && c != 'n' && c != 'N');
 	printf("\n");
 	if (c == 'y' || c == 'Y')
 		return (1);
 	resolved = 0;
 	return (0);
 }
 
 /*
  * Look up state information for an inode.
  */
 struct inostat *
 inoinfo(ino_t inum)
 {
 	static struct inostat unallocated = { USTATE, 0, 0, 0 };
 	struct inostatlist *ilp;
 	int iloff;
 
 	if (inum > maxino)
 		errx(EEXIT, "inoinfo: inumber %ju out of range",
 		    (uintmax_t)inum);
 	ilp = &inostathead[inum / sblock.fs_ipg];
 	iloff = inum % sblock.fs_ipg;
 	if (iloff >= ilp->il_numalloced)
 		return (&unallocated);
 	return (&ilp->il_stat[iloff]);
 }
 
 /*
  * Malloc buffers and set up cache.
  */
 void
 bufinit(void)
 {
 	int i;
 
 	initbarea(&failedbuf, BT_UNKNOWN);
 	failedbuf.b_errs = -1;
 	failedbuf.b_un.b_buf = NULL;
 	if ((cgblk.b_un.b_buf = Malloc((unsigned int)sblock.fs_bsize)) == NULL)
 		errx(EEXIT, "Initial malloc(%d) failed", sblock.fs_bsize);
 	initbarea(&cgblk, BT_CYLGRP);
 	numbufs = cachelookups = cachereads = 0;
 	TAILQ_INIT(&bufqueuehd);
 	LIST_INIT(&freebufs);
 	for (i = 0; i < HASHSIZE; i++)
 		LIST_INIT(&bufhashhd[i]);
 	for (i = 0; i < BT_NUMBUFTYPES; i++) {
 		readtime[i].tv_sec = totalreadtime[i].tv_sec = 0;
 		readtime[i].tv_nsec = totalreadtime[i].tv_nsec = 0;
 		readcnt[i] = totalreadcnt[i] = 0;
 	}
 }
 
 static struct bufarea *
 allocbuf(const char *failreason)
 {
 	struct bufarea *bp;
 	char *bufp;
 
 	bp = (struct bufarea *)Malloc(sizeof(struct bufarea));
 	bufp = Malloc((unsigned int)sblock.fs_bsize);
 	if (bp == NULL || bufp == NULL) {
 		errx(EEXIT, "%s", failreason);
 		/* NOTREACHED */
 	}
 	numbufs++;
 	bp->b_un.b_buf = bufp;
 	TAILQ_INSERT_HEAD(&bufqueuehd, bp, b_list);
 	initbarea(bp, BT_UNKNOWN);
 	return (bp);
 }
 
 /*
  * Cylinder group buffer management.
  *
  * getblk() is used here instead of cgget() because a cylinder group that
  * is corrupted must still be loaded so that it can be repaired.
  */
 static struct bufarea *cgbufs;	/* header for cylinder group cache */
 static int flushtries;		/* number of tries to reclaim memory */
 
 /*
  * Return a buffer holding cylinder group `cg'.
  *
  * Normally each group gets its own entry in the lazily allocated cgbufs
  * array.  Once flushtries is nonzero, or when memory for a new entry
  * cannot be obtained, the shared cgblk buffer is flushed and reloaded with
  * the requested group instead; during journal recovery that situation is
  * fatal.  An out-of-range `cg' is fatal as well.
  */
 struct bufarea *
 cglookup(int cg)
 {
 	struct bufarea *entry;
 	struct cg *mem;
 
 	if ((unsigned) cg >= sblock.fs_ncg)
 		errx(EEXIT, "cglookup: out of range cylinder group %d", cg);
 	if (cgbufs == NULL &&
 	    (cgbufs = calloc(sblock.fs_ncg, sizeof(struct bufarea))) == NULL)
 		errx(EEXIT, "Cannot allocate cylinder group buffers");
 
 	entry = &cgbufs[cg];
 	if (entry->b_un.b_cg != NULL)
 		return (entry);
 
 	mem = NULL;
 	if (flushtries == 0)
 		mem = Malloc((unsigned int)sblock.fs_cgsize);
 	if (mem != NULL) {
 		/* Dedicated buffer for this cylinder group. */
 		entry->b_un.b_cg = mem;
 		initbarea(entry, BT_CYLGRP);
 		getblk(entry, cgtod(&sblock, cg), sblock.fs_cgsize);
 		return (entry);
 	}
 
 	/* No dedicated buffer available: recycle the shared one. */
 	if (sujrecovery)
 		errx(EEXIT,"Ran out of memory during journal recovery");
 	flush(fswritefd, &cgblk);
 	getblk(&cgblk, cgtod(&sblock, cg), sblock.fs_cgsize);
 	return (&cgblk);
 }
 
 /*
  * Flag a cylinder group buffer as modified.  When cylinder group
  * check-hashes are enabled in the superblock the hash stored in the
  * group is recomputed first.
  */
 void
 cgdirty(struct bufarea *cgbp)
 {
 	struct cg *cgp = cgbp->b_un.b_cg;
 	int hashing = (sblock.fs_metackhash & CK_CYLGRP) != 0;
 
 	if (hashing) {
 		/* The hash is computed with the hash field itself zeroed. */
 		cgp->cg_ckhash = 0;
 		cgp->cg_ckhash =
 		    calculate_crc32c(~0L, (void *)cgp, sblock.fs_cgsize);
 	}
 	dirty(cgbp);
 }
 
 /*
  * Try to give back the memory of one cylinder group cache entry.
  *
  * Each call examines the next entry of cgbufs (indexed by flushtries,
  * which is advanced).  Returns 1 if that entry held a buffer, which is
  * then flushed and freed; returns 0 if it was empty, if every entry has
  * already been tried, if there is no cache, or during journal recovery.
  */
 int
 flushentry(void)
 {
 	struct bufarea *victim;
 
 	if (sujrecovery)
 		return (0);
 	if (flushtries == sblock.fs_ncg)
 		return (0);
 	if (cgbufs == NULL)
 		return (0);
 
 	victim = &cgbufs[flushtries];
 	flushtries++;
 	if (victim->b_un.b_cg != NULL) {
 		flush(fswritefd, victim);
 		free(victim->b_un.b_buf);
 		victim->b_un.b_buf = NULL;
 		return (1);
 	}
 	return (0);
 }
 
 /*
  * Manage a cache of filesystem disk blocks.
  *
  * Return a buffer of type `type' holding the `size' bytes of filesystem
  * block `blkno'.  A block already present in the hash table is reused;
  * otherwise a buffer is taken from the free list, newly allocated, or
  * recycled from the tail of the LRU queue, and the block is read into it.
  *
  * On return the buffer sits at the head of the LRU queue and, if it
  * carries no read errors (b_errs == 0), its reference count has been
  * incremented; brelse() drops that reference.  For an out-of-range request
  * (other than for inode blocks) the shared failedbuf is returned instead.
  */
 struct bufarea *
 getdatablk(ufs2_daddr_t blkno, long size, int type)
 {
 	struct bufarea *bp;
 	struct bufhash *bhdp;
 
 	cachelookups++;
 	/*
 	 * If out of range, return empty buffer with b_errs == -1
 	 *
 	 * Skip check for inodes because chkrange() considers
 	 * metadata areas invalid to write data.
 	 */
 	if (type != BT_INODES && chkrange(blkno, size / sblock.fs_fsize))
 		return (&failedbuf);
 	/* Cache hit: unlink from the LRU queue; it is re-queued at foundit. */
 	bhdp = &bufhashhd[HASH(blkno)];
 	LIST_FOREACH(bp, bhdp, b_hash)
 		if (bp->b_bno == fsbtodb(&sblock, blkno)) {
 			if (debug && bp->b_size != size) {
 				prtbuf(bp, "getdatablk: size mismatch");
 				pfatal("getdatablk: b_size %d != size %ld\n",
 				    bp->b_size, size);
 			}
 			TAILQ_REMOVE(&bufqueuehd, bp, b_list);
 			goto foundit;
 		}
 	/*
 	 * Move a long-term busy buffer back to the front of the LRU so we
 	 * do not endlessly inspect it for recycling.
 	 */
 	bp = TAILQ_LAST(&bufqueuehd, bufqueue);
 	if (bp != NULL && bp->b_refcnt != 0) {
 		TAILQ_REMOVE(&bufqueuehd, bp, b_list);
 		TAILQ_INSERT_HEAD(&bufqueuehd, bp, b_list);
 	}
 	/*
 	 * Allocate up to the minimum number of buffers before
 	 * considering recycling any of them.
 	 */
 	if (size > sblock.fs_bsize)
 		errx(EEXIT, "Excessive buffer size %ld > %d\n", size,
 		    sblock.fs_bsize);
 	if ((bp = LIST_FIRST(&freebufs)) != NULL) {
 		/* Reuse a buffer that binval() placed on the free list. */
 		LIST_REMOVE(bp, b_hash);
 	} else if (numbufs < MINBUFS) {
 		bp = allocbuf("cannot create minimal buffer pool");
 	} else if (sujrecovery) {
 		/*
 		 * SUJ recovery does not want anything written until it
 		 * has successfully completed (so it can fail back to
 		 * full fsck). Thus, we can only recycle clean buffers.
 		 */
 		TAILQ_FOREACH_REVERSE(bp, &bufqueuehd, bufqueue, b_list)
 			if ((bp->b_flags & B_DIRTY) == 0 && bp->b_refcnt == 0)
 				break;
 		if (bp == NULL)
 			bp = allocbuf("Ran out of memory during "
 			    "journal recovery");
 		else
 			LIST_REMOVE(bp, b_hash);
 	} else {
 		/*
 		 * Recycle oldest non-busy buffer.
 		 */
 		TAILQ_FOREACH_REVERSE(bp, &bufqueuehd, bufqueue, b_list)
 			if (bp->b_refcnt == 0)
 				break;
 		if (bp == NULL)
 			bp = allocbuf("Ran out of memory for buffers");
 		else
 			LIST_REMOVE(bp, b_hash);
 	}
 	/*
 	 * Write out the previous contents if dirty, then rebind the buffer
 	 * to the requested block and read it in.
 	 */
 	TAILQ_REMOVE(&bufqueuehd, bp, b_list);
 	flush(fswritefd, bp);
 	bp->b_type = type;
 	LIST_INSERT_HEAD(bhdp, bp, b_hash);
 	getblk(bp, blkno, size);
 	cachereads++;
 	/* fall through */
 foundit:
 	TAILQ_INSERT_HEAD(&bufqueuehd, bp, b_list);
 	if (debug && bp->b_type != type) {
 		printf("getdatablk: buffer type changed to %s",
 		    BT_BUFTYPE(type));
 		prtbuf(bp, "");
 	}
 	/* Only buffers without read errors are handed out as referenced. */
 	if (bp->b_errs == 0)
 		bp->b_refcnt++;
 	return (bp);
 }
 
 /*
  * Make `bp' hold the `size' bytes of filesystem block `blk'.
  *
  * If the buffer already maps that disk block nothing is read and only
  * totalreads is bumped.  Otherwise the block is read with blread(), the
  * resulting error count is stored in b_errs, and the buffer's block number
  * and size are updated.  In debug mode the read is counted and timed per
  * buffer type.
  */
 void
 getblk(struct bufarea *bp, ufs2_daddr_t blk, long size)
 {
 	struct timespec began, ended, elapsed;
 	ufs2_daddr_t diskblk;
 
 	diskblk = fsbtodb(&sblock, blk);
 	if (bp->b_bno == diskblk) {
 		totalreads++;
 		return;
 	}
 	if (debug) {
 		readcnt[bp->b_type]++;
 		clock_gettime(CLOCK_REALTIME_PRECISE, &began);
 	}
 	bp->b_errs = blread(fsreadfd, bp->b_un.b_buf, diskblk, size);
 	if (debug) {
 		clock_gettime(CLOCK_REALTIME_PRECISE, &ended);
 		timespecsub(&ended, &began, &elapsed);
 		timespecadd(&readtime[bp->b_type], &elapsed,
 		    &readtime[bp->b_type]);
 	}
 	bp->b_bno = diskblk;
 	bp->b_size = size;
 }
 
 /*
  * Drop one reference on a buffer.  A buffer whose reference count is
  * already zero or negative is reported, but the count is decremented
  * regardless.
  */
 void
 brelse(struct bufarea *bp)
 {
 
 	if (!(bp->b_refcnt > 0))
 		prtbuf(bp, "brelse: buffer with negative reference count");
 	bp->b_refcnt -= 1;
 }
 
 /*
  * Invalidate a buffer: discard any pending modification by clearing its
  * dirty flag, then move it from its hash chain onto the free buffer list.
  */
 void
 binval(struct bufarea *bp)
 {
 
 	bp->b_flags = bp->b_flags & ~B_DIRTY;
 	LIST_REMOVE(bp, b_hash);
 	LIST_INSERT_HEAD(&freebufs, bp, b_hash);
 }
 
 /*
  * Write a buffer back to disk if it is dirty; clean buffers are ignored.
  *
  * The dirty flag is cleared before anything else, so a buffer is not
  * retried after a failed or refused write.  Writing while the filesystem
  * is open read-only (fswritefd < 0) is reported through pfatal().  The
  * write routine is chosen by buffer type: superblocks use sbput(),
  * cylinder groups use cgput() (after recomputing their summaries during
  * journal recovery), and every other type is written with blwrite() after
  * copyonwrite() has been given the chance to preserve the old contents.
  * fsmodified is set when the superblock or cylinder group write succeeds.
  */
 void
 flush(int fd, struct bufarea *bp)
 {
 	struct inode ip;
 
 	if ((bp->b_flags & B_DIRTY) == 0)
 		return;
 	bp->b_flags &= ~B_DIRTY;
 	if (fswritefd < 0) {
 		pfatal("WRITING IN READ_ONLY MODE.\n");
 		return;
 	}
 	/*
 	 * A nonzero b_errs means some or all of the buffer could not be
 	 * read and was zero-filled; warn before overwriting the disk copy.
 	 */
 	if (bp->b_errs != 0)
 		pfatal("WRITING %sZERO'ED BLOCK %lld TO DISK\n",
 		    (bp->b_errs == bp->b_size / dev_bsize) ? "" : "PARTIALLY ",
 		    (long long)bp->b_bno);
 	bp->b_errs = 0;
 	/*
 	 * Write using the appropriate function.
 	 */
 	switch (bp->b_type) {
 	case BT_SUPERBLK:
 		if (bp != &sblk)
 			pfatal("BUFFER %p DOES NOT MATCH SBLK %p\n",
 			    bp, &sblk);
 		/*
 		 * Superblocks are always pre-copied so we do not need
 		 * to check them for copy-on-write.
 		 */
 		if (sbput(fd, bp->b_un.b_fs, 0) == 0)
 			fsmodified = 1;
 		break;
 	case BT_CYLGRP:
 		/*
 		 * Cylinder groups are always pre-copied so we do not
 		 * need to check them for copy-on-write.
 		 */
 		if (sujrecovery)
 			cg_write(bp);
 		/* NOTE(review): this write uses fswritefd, not the fd argument. */
 		if (cgput(fswritefd, &sblock, bp->b_un.b_cg) == 0)
 			fsmodified = 1;
 		break;
 	case BT_INODES:
 		/*
 		 * Debug aid for UFS2: verify the check-hash of every inode in
 		 * the block before it is written and offer to repair it.
 		 */
 		if (debug && sblock.fs_magic == FS_UFS2_MAGIC) {
 			struct ufs2_dinode *dp = bp->b_un.b_dinode2;
 			int i;
 
 			for (i = 0; i < bp->b_size; dp++, i += sizeof(*dp)) {
 				if (ffs_verify_dinode_ckhash(&sblock, dp) == 0)
 					continue;
 				pwarn("flush: INODE CHECK-HASH FAILED");
 				/* Temporary inode handle for printing and fixing. */
 				ip.i_bp = bp;
 				ip.i_dp = (union dinode *)dp;
 				ip.i_number = bp->b_index + (i / sizeof(*dp));
 				prtinode(&ip);
 				if (preen || reply("FIX") != 0) {
 					if (preen)
 						printf(" (FIXED)\n");
 					ffs_update_dinode_ckhash(&sblock, dp);
 					inodirty(&ip);
 				}
 			}
 		}
 		/* FALLTHROUGH */
 	default:
 		copyonwrite(&sblock, bp, std_checkblkavail);
 		blwrite(fd, bp->b_un.b_buf, bp->b_bno, bp->b_size);
 		break;
 	}
 }
 
 /*
  * When snapshots exist, make sure every block they care about has been
  * copied and then release the snapshot inodes.  This has to happen before
  * the cylinder groups are rebuilt so that any block allocations are
  * recorded properly.  The cylinder group maps were already copied into
  * the snapshots, so no further snapshot copies are needed afterwards.
  *
  * `checkblkavail' is handed to copyonwrite() for each dirty buffer on the
  * buffer queue.  Does nothing when there are no snapshots.
  */
 void
 snapflush(ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t, long))
 {
 	struct bufarea *buf;
 	int snap;
 
 	if (snapcnt <= 0)
 		return;
 	if (debug)
 		printf("Check for snapshot copies\n");
 	TAILQ_FOREACH_REVERSE(buf, &bufqueuehd, bufqueue, b_list) {
 		if ((buf->b_flags & B_DIRTY) == 0)
 			continue;
 		copyonwrite(&sblock, buf, checkblkavail);
 	}
 	snap = 0;
 	while (snap < snapcnt) {
 		irelse(&snaplist[snap]);
 		snap++;
 	}
 	snapcnt = 0;
 }
 
 /*
  * Journaled soft updates does not maintain cylinder group summary
  * information during cleanup, so this routine recalculates the summary
  * information and updates the superblock summary in preparation for
  * writing out the cylinder group.
  *
  * `bp' is the buffer holding the cylinder group.  The group's free block
  * and free fragment counts, fragment summary and (when enabled) cluster
  * summary are rebuilt from its free-block bitmap; nothing is written here.
  */
 static void
 cg_write(struct bufarea *bp)
 {
 	ufs1_daddr_t fragno, cgbno, maxbno;
 	u_int8_t *blksfree;
 	struct csum *csp;
 	struct cg *cgp;
 	int blk;
 	int i;
 
 	/*
 	 * Fix the frag and cluster summary.
 	 */
 	cgp = bp->b_un.b_cg;
 	cgp->cg_cs.cs_nbfree = 0;
 	cgp->cg_cs.cs_nffree = 0;
 	bzero(&cgp->cg_frsum, sizeof(cgp->cg_frsum));
 	maxbno = fragstoblks(&sblock, sblock.fs_fpg);
 	if (sblock.fs_contigsumsize > 0) {
 		for (i = 1; i <= sblock.fs_contigsumsize; i++)
 			cg_clustersum(cgp)[i] = 0;
 		bzero(cg_clustersfree(cgp), howmany(maxbno, CHAR_BIT));
 	}
 	/* Walk every full-sized block of the group and recount. */
 	blksfree = cg_blksfree(cgp);
 	for (cgbno = 0; cgbno < maxbno; cgbno++) {
 		/* Nothing is counted for blocks this helper accepts. */
 		if (ffs_isfreeblock(&sblock, blksfree, cgbno))
 			continue;
 		/* Counted as one free block and added to the cluster map. */
 		if (ffs_isblock(&sblock, blksfree, cgbno)) {
 			ffs_clusteracct(&sblock, cgp, cgbno, 1);
 			cgp->cg_cs.cs_nbfree++;
 			continue;
 		}
 		/* Otherwise account for the individual fragments set in the map. */
 		fragno = blkstofrags(&sblock, cgbno);
 		blk = blkmap(&sblock, blksfree, fragno);
 		ffs_fragacct(&sblock, blk, cgp->cg_frsum, 1);
 		for (i = 0; i < sblock.fs_frag; i++)
 			if (isset(blksfree, fragno + i))
 				cgp->cg_cs.cs_nffree++;
 	}
 	/*
 	 * Update the superblock cg summary from our now correct values
 	 * before writing the block.
 	 */
 	csp = &sblock.fs_cs(&sblock, cgp->cg_cgx);
 	/* Apply the difference between the new and the old per-group values. */
 	sblock.fs_cstotal.cs_ndir += cgp->cg_cs.cs_ndir - csp->cs_ndir;
 	sblock.fs_cstotal.cs_nbfree += cgp->cg_cs.cs_nbfree - csp->cs_nbfree;
 	sblock.fs_cstotal.cs_nifree += cgp->cg_cs.cs_nifree - csp->cs_nifree;
 	sblock.fs_cstotal.cs_nffree += cgp->cg_cs.cs_nffree - csp->cs_nffree;
 	sblock.fs_cs(&sblock, cgp->cg_cgx) = cgp->cg_cs;
 }
 
 /*
  * Report a failed I/O operation on block `blk'; `mesg' names the
  * operation (for example "READ BLK").
  *
  * In background-check mode the program exits immediately.  Otherwise the
  * failure is reported through pfatal() and the operator is asked whether
  * to continue; a negative answer exits.
  *
  * The block number is printed as intmax_t so that 64-bit block numbers
  * are not truncated on platforms where long is 32 bits wide.
  */
 void
 rwerror(const char *mesg, ufs2_daddr_t blk)
 {
 
 	if (bkgrdcheck)
 		exit(EEXIT);
 	if (preen == 0)
 		printf("\n");
 	pfatal("CANNOT %s: %jd", mesg, (intmax_t)blk);
 	if (reply("CONTINUE") == 0)
 		exit(EEXIT);
 }
 
 /*
  * Finish a check: flush and free every cached buffer, update the clean
  * state of the filesystem, release the tracking structures and close the
  * file descriptors.
  *
  * `markclean' is nonzero when the filesystem should be marked clean.  For
  * a background check the snapshot file is removed and the clean state is
  * changed through the vfs.ffs.setflags sysctl.  When the filesystem was
  * opened read-only (fswritefd < 0) only the read descriptor is closed.
  */
 void
 ckfini(int markclean)
 {
 	struct bufarea *bp, *nbp;
 	int ofsmodified, cnt, cg;
 
 	if (bkgrdflag) {
 		unlink(snapname);
 		/* Only issue the sysctl when the recorded state must change. */
 		if ((!(sblock.fs_flags & FS_UNCLEAN)) != markclean) {
 			cmd.value = FS_UNCLEAN;
 			cmd.size = markclean ? -1 : 1;
 			if (sysctlbyname("vfs.ffs.setflags", 0, 0,
 			    &cmd, sizeof cmd) == -1)
 				pwarn("CANNOT SET FILE SYSTEM DIRTY FLAG\n");
 			if (!preen) {
 				printf("\n***** FILE SYSTEM MARKED %s *****\n",
 				    markclean ? "CLEAN" : "DIRTY");
 				if (!markclean)
 					rerun = 1;
 			}
 		} else if (!preen && !markclean) {
 			printf("\n***** FILE SYSTEM STILL DIRTY *****\n");
 			rerun = 1;
 		}
 		bkgrdflag = 0;
 	}
 	if (debug && cachelookups > 0)
 		printf("cache with %d buffers missed %d of %d (%d%%)\n",
 		    numbufs, cachereads, cachelookups,
 		    (int)(cachereads * 100 / cachelookups));
 	/* Read-only run: nothing to flush. */
 	if (fswritefd < 0) {
 		(void)close(fsreadfd);
 		return;
 	}
 
 	/*
 	 * To remain idempotent with partial truncations the buffers
 	 * must be flushed in this order:
 	 *  1) cylinder groups (bitmaps)
 	 *  2) indirect, directory, external attribute, and data blocks
 	 *  3) inode blocks
 	 *  4) superblock
 	 * This ordering preserves access to the modified pointers
 	 * until they are freed.
 	 */
 	/* Step 1: cylinder groups */
 	if (debug)
 		printf("Flush Cylinder groups\n");
 	if (cgbufs != NULL) {
 		for (cnt = 0; cnt < sblock.fs_ncg; cnt++) {
 			if (cgbufs[cnt].b_un.b_cg == NULL)
 				continue;
 			flush(fswritefd, &cgbufs[cnt]);
 			free(cgbufs[cnt].b_un.b_cg);
 		}
 		free(cgbufs);
 		cgbufs = NULL;
 	}
 	flush(fswritefd, &cgblk);
 	free(cgblk.b_un.b_buf);
 	cgblk.b_un.b_buf = NULL;
 	/* From here on cnt counts the cache buffers released in steps 2 and 3. */
 	cnt = 0;
 	/* Step 2: indirect, directory, external attribute, and data blocks */
 	if (debug)
 		printf("Flush indirect, directory, external attribute, "
 		    "and data blocks\n");
 	if (pdirbp != NULL) {
 		brelse(pdirbp);
 		pdirbp = NULL;
 	}
 	TAILQ_FOREACH_REVERSE_SAFE(bp, &bufqueuehd, bufqueue, b_list, nbp) {
 		switch (bp->b_type) {
 		/* These should not be in the buffer cache list */
 		case BT_UNKNOWN:
 		case BT_SUPERBLK:
 		case BT_CYLGRP:
 		default:
 			prtbuf(bp,"ckfini: improper buffer type on cache list");
 			continue;
 		/* These are the ones to flush in this step */
 		case BT_LEVEL1:
 		case BT_LEVEL2:
 		case BT_LEVEL3:
 		case BT_EXTATTR:
 		case BT_DIRDATA:
 		case BT_DATA:
 			break;
 		/* These are the ones to flush in the next step */
 		case BT_INODES:
 			continue;
 		}
 		if (debug && bp->b_refcnt != 0)
 			prtbuf(bp, "ckfini: clearing in-use buffer");
 		TAILQ_REMOVE(&bufqueuehd, bp, b_list);
 		LIST_REMOVE(bp, b_hash);
 		cnt++;
 		flush(fswritefd, bp);
 		free(bp->b_un.b_buf);
 		free((char *)bp);
 	}
 	/* Step 3: inode blocks */
 	if (debug)
 		printf("Flush inode blocks\n");
 	if (icachebp != NULL) {
 		brelse(icachebp);
 		icachebp = NULL;
 	}
 	/* Everything still on the queue is released in this pass. */
 	TAILQ_FOREACH_REVERSE_SAFE(bp, &bufqueuehd, bufqueue, b_list, nbp) {
 		if (debug && bp->b_refcnt != 0)
 			prtbuf(bp, "ckfini: clearing in-use buffer");
 		TAILQ_REMOVE(&bufqueuehd, bp, b_list);
 		LIST_REMOVE(bp, b_hash);
 		cnt++;
 		flush(fswritefd, bp);
 		free(bp->b_un.b_buf);
 		free((char *)bp);
 	}
 	/* Every buffer counted by allocbuf() must have been released above. */
 	if (numbufs != cnt)
 		errx(EEXIT, "panic: lost %d buffers", numbufs - cnt);
 	/* Step 4: superblock */
 	if (debug)
 		printf("Flush the superblock\n");
 	flush(fswritefd, &sblk);
 	/*
 	 * The superblock buffer is not at the standard location: offer to
 	 * write it there as well.  Declining leaves the filesystem dirty.
 	 */
 	if (havesb && cursnapshot == 0 &&
 	    sblk.b_bno != sblock.fs_sblockloc / dev_bsize) {
 		if (preen || reply("UPDATE STANDARD SUPERBLOCK")) {
 			/* Change write destination to standard superblock */
 			sblock.fs_sblockactualloc = sblock.fs_sblockloc;
 			sblk.b_bno = sblock.fs_sblockloc / dev_bsize;
 			sbdirty();
 			flush(fswritefd, &sblk);
 		} else {
 			markclean = 0;
 		}
 	}
 	if (cursnapshot == 0 && sblock.fs_clean != markclean) {
 		if ((sblock.fs_clean = markclean) != 0) {
 			sblock.fs_flags &= ~(FS_UNCLEAN | FS_NEEDSFSCK);
 			sblock.fs_pendingblocks = 0;
 			sblock.fs_pendinginodes = 0;
 		}
 		sbdirty();
 		/* Writing the clean flag is not counted as a modification. */
 		ofsmodified = fsmodified;
 		flush(fswritefd, &sblk);
 		fsmodified = ofsmodified;
 		if (!preen) {
 			printf("\n***** FILE SYSTEM MARKED %s *****\n",
 			    markclean ? "CLEAN" : "DIRTY");
 			if (!markclean)
 				rerun = 1;
 		}
 	} else if (!preen) {
 		if (markclean) {
 			printf("\n***** FILE SYSTEM IS CLEAN *****\n");
 		} else {
 			printf("\n***** FILE SYSTEM STILL DIRTY *****\n");
 			rerun = 1;
 		}
 	}
 	/*
 	 * Free allocated tracking structures.
 	 */
 	if (blockmap != NULL)
 		free(blockmap);
 	blockmap = NULL;
 	if (inostathead != NULL) {
 		for (cg = 0; cg < sblock.fs_ncg; cg++)
 			if (inostathead[cg].il_stat != NULL)
 				free((char *)inostathead[cg].il_stat);
 		free(inostathead);
 	}
 	inostathead = NULL;
 	inocleanup();
 	finalIOstats();
 	(void)close(fsreadfd);
 	(void)close(fswritefd);
 }
 
 /*
  * Print the I/O statistics gathered since the previous call, labelled
  * with `what', then fold them into the running totals and start a new
  * measurement interval.  Does nothing unless debugging is enabled; an
  * interval without disk reads only reports "no I/O".
  */
 void
 IOstats(char *what)
 {
 	int type;
 
 	if (!debug)
 		return;
 	if (diskreads == 0) {
 		printf("%s: no I/O\n\n", what);
 		return;
 	}
 	/* First interval: measure from program start. */
 	if (startpass.tv_sec == 0)
 		startpass = startprog;
 	printf("%s: I/O statistics\n", what);
 	printIOstats();
 
 	/* Accumulate this interval and reset its counters. */
 	totaldiskreads += diskreads;
 	diskreads = 0;
 	type = 0;
 	while (type < BT_NUMBUFTYPES) {
 		timespecadd(&totalreadtime[type], &readtime[type],
 		    &totalreadtime[type]);
 		totalreadcnt[type] += readcnt[type];
 		readcnt[type] = 0;
 		readtime[type].tv_nsec = 0;
 		readtime[type].tv_sec = 0;
 		type++;
 	}
 	clock_gettime(CLOCK_REALTIME_PRECISE, &startpass);
 }
 
 /*
  * Print the I/O statistics for the whole run.  The per-interval counters
  * are replaced by the accumulated totals and the interval start is set
  * back to program start so that printIOstats() reports overall figures.
  * Does nothing unless debugging is enabled.
  */
 void
 finalIOstats(void)
 {
 	int type;
 
 	if (!debug)
 		return;
 	printf("Final I/O statistics\n");
 	totaldiskreads += diskreads;
 	diskreads = totaldiskreads;
 	startpass = startprog;
 	type = 0;
 	while (type < BT_NUMBUFTYPES) {
 		timespecadd(&totalreadtime[type], &readtime[type],
 		    &totalreadtime[type]);
 		totalreadcnt[type] += readcnt[type];
 		readcnt[type] = totalreadcnt[type];
 		readtime[type] = totalreadtime[type];
 		type++;
 	}
 	printIOstats();
 }
 
 /*
  * Print the elapsed time since startpass followed by one line per buffer
  * type that was read at least once: number of reads, its share of
  * diskreads, time spent reading, and its share of the total read time.
  * Percentages are printed with one decimal digit using integer arithmetic.
  */
 static void printIOstats(void)
 {
 	long long msec, totalmsec;
 	int i;
 
 	clock_gettime(CLOCK_REALTIME_PRECISE, &finishpass);
 	timespecsub(&finishpass, &startpass, &finishpass);
 	printf("Running time: %jd.%03ld sec\n",
 		(intmax_t)finishpass.tv_sec, finishpass.tv_nsec / 1000000);
 	printf("buffer reads by type:\n");
 	/* Total read time in milliseconds over all buffer types. */
 	for (totalmsec = 0, i = 0; i < BT_NUMBUFTYPES; i++)
 		totalmsec += readtime[i].tv_sec * 1000 +
 		    readtime[i].tv_nsec / 1000000;
 	/* Avoid dividing by zero below. */
 	if (totalmsec == 0)
 		totalmsec = 1;
 	for (i = 0; i < BT_NUMBUFTYPES; i++) {
 		if (readcnt[i] == 0)
 			continue;
 		msec =
 		    readtime[i].tv_sec * 1000 + readtime[i].tv_nsec / 1000000;
 		printf("%21s:%8ld %2ld.%ld%% %4jd.%03ld sec %2lld.%lld%%\n",
 		    buftype[i], readcnt[i], readcnt[i] * 100 / diskreads,
 		    (readcnt[i] * 1000 / diskreads) % 10,
 		    (intmax_t)readtime[i].tv_sec, readtime[i].tv_nsec / 1000000,
 		    msec * 100 / totalmsec, (msec * 1000 / totalmsec) % 10);
 	}
 	printf("\n");
 }
 
 /*
  * Read `size' bytes starting at device block `blk' from `fd' into `buf'.
  *
  * Returns 0 when the whole request is satisfied by a single pread().
  * Otherwise the failure is reported (the program aborts if `surrender'
  * is set, and rwerror() may exit as well), the buffer is zeroed and the
  * range is read again one sector (secsize bytes) at a time.  The block
  * numbers of the sectors that still cannot be read are printed and their
  * count is returned; `resolved' is cleared when that count is nonzero.
  *
  * Reads are throttled with slowio_start()/slowio_end() during a
  * background check.
  */
 int
 blread(int fd, char *buf, ufs2_daddr_t blk, long size)
 {
 	char *cp;
 	int i, errs;
 	off_t offset;
 
 	offset = blk;
 	offset *= dev_bsize;
 	if (bkgrdflag)
 		slowio_start();
 	totalreads++;
 	diskreads++;
 	if (pread(fd, buf, (int)size, offset) == size) {
 		if (bkgrdflag)
 			slowio_end();
 		return (0);
 	}
 
 	/*
 	 * This is handled specially here instead of in rwerror because
 	 * rwerror is used for all sorts of errors, not just true read/write
 	 * errors.  It should be refactored and fixed.
 	 */
 	if (surrender) {
 		/*
 		 * Print the block number as intmax_t, as the sector list
 		 * below does, so it is not truncated where long is 32 bits.
 		 */
 		pfatal("CANNOT READ_BLK: %jd", (intmax_t)blk);
 		errx(EEXIT, "ABORTING DUE TO READ ERRORS");
 	} else
 		rwerror("READ BLK", blk);
 
 	/* Retry sector by sector; unreadable sectors stay zero-filled. */
 	errs = 0;
 	memset(buf, 0, (size_t)size);
 	printf("THE FOLLOWING DISK SECTORS COULD NOT BE READ:");
 	for (cp = buf, i = 0; i < size; i += secsize, cp += secsize) {
 		if (pread(fd, cp, (int)secsize, offset + i) != secsize) {
 			if (secsize != dev_bsize && dev_bsize != 1)
 				printf(" %jd (%jd),",
 				    (intmax_t)(blk * dev_bsize + i) / secsize,
 				    (intmax_t)blk + i / dev_bsize);
 			else
 				printf(" %jd,", (intmax_t)blk + i / dev_bsize);
 			errs++;
 		}
 	}
 	printf("\n");
 	if (errs)
 		resolved = 0;
 	return (errs);
 }
 
 /*
  * Write `size' bytes from `buf' to device block `blk' on `fd'.
  *
  * A negative `fd' makes this a no-op.  A successful single pwrite() sets
  * fsmodified.  On failure `resolved' is cleared, the error is reported
  * through rwerror(), and the range is written again one dev_bsize piece
  * at a time, printing the block number of each piece that fails.
  */
 void
 blwrite(int fd, char *buf, ufs2_daddr_t blk, ssize_t size)
 {
 	off_t base;
 	int done;
 
 	if (fd < 0)
 		return;
 	base = (off_t)blk * dev_bsize;
 	if (pwrite(fd, buf, size, base) == size) {
 		fsmodified = 1;
 		return;
 	}
 	resolved = 0;
 	rwerror("WRITE BLK", blk);
 	printf("THE FOLLOWING SECTORS COULD NOT BE WRITTEN:");
 	done = 0;
 	while (done < size) {
 		if (pwrite(fd, buf + done, dev_bsize, base + done) != dev_bsize)
 			printf(" %jd,", (intmax_t)blk + done / dev_bsize);
 		done += dev_bsize;
 	}
 	printf("\n");
 }
 
 /*
  * Issue a DIOCGDELETE request for `size' bytes starting at device block
  * `blk'.  The request is best effort: its result is deliberately ignored,
  * and nothing is done when `fd' is negative.
  */
 void
 blerase(int fd, ufs2_daddr_t blk, long size)
 {
 	off_t range[2];
 
 	if (fd >= 0) {
 		/* range[0] is the byte offset, range[1] the length in bytes. */
 		range[0] = blk * dev_bsize;
 		range[1] = size;
 		/* we don't really care if we succeed or not */
 		(void)ioctl(fd, DIOCGDELETE, range);
 	}
 }
 
 /*
  * Overwrite `size' bytes starting at device block `blk' with zeroes.
  * The data is written in pieces of at most ZEROBUFSIZE bytes from a
  * zero-filled buffer that is allocated on first use and then kept.
  * Note ZEROBUFSIZE is by definition a multiple of dev_bsize.
  *
  * Seek and write failures are reported through rwerror(); nothing is
  * done when `fd' is negative.
  */
 void
 blzero(int fd, ufs2_daddr_t blk, long size)
 {
 	static char *zerobuf;
 	off_t chunk;
 
 	if (fd < 0)
 		return;
 	if (zerobuf == NULL &&
 	    (zerobuf = calloc(ZEROBUFSIZE, 1)) == NULL)
 		errx(EEXIT, "cannot allocate buffer pool");
 	if (lseek(fd, blk * dev_bsize, 0) < 0)
 		rwerror("SEEK BLK", blk);
 	for (; size > 0; size -= chunk) {
 		chunk = MIN(ZEROBUFSIZE, size);
 		if (write(fd, zerobuf, chunk) != chunk)
 			rwerror("WRITE BLK", blk);
 		/* Keep blk in step so a later error names the right block. */
 		blk += chunk / dev_bsize;
 	}
 }
 
 /*
  * Verify cylinder group's magic number and other parameters.  If the
  * test fails, offer an option to rebuild the whole cylinder group.
  *
  * `cg' is the cylinder group number, `cgbp' the buffer holding it, and
  * `request_rebuild' says whether the operator may be asked to rebuild.
  *
  * Returns 1 when every check passes.  Returns 0 when a check fails and
  * the group is not to be used: the failure was already reported for this
  * same group on the previous call, no rebuild was requested, or the group
  * has just been rebuilt.  Returns 1 with `rerun' set when the operator
  * declines the rebuild.
  *
  * CHK() compares two values and, when the comparison holds, prints both
  * sides and sets the local variable `error'; it relies on the locals `cg'
  * and `error' of the function that uses it.
  */
 #undef CHK
 #define CHK(lhs, op, rhs, fmt)						\
 	if (lhs op rhs) {						\
 		pwarn("UFS%d cylinder group %d failed: "		\
 		    "%s (" #fmt ") %s %s (" #fmt ")\n",			\
 		    sblock.fs_magic == FS_UFS1_MAGIC ? 1 : 2, cg,	\
 		    #lhs, (intmax_t)lhs, #op, #rhs, (intmax_t)rhs);	\
 		error = 1;						\
 	}
 int
 check_cgmagic(int cg, struct bufarea *cgbp, int request_rebuild)
 {
 	struct cg *cgp = cgbp->b_un.b_cg;
 	uint32_t cghash, calchash;
 	/* Last group that failed; used to avoid repeating the report. */
 	static int prevfailcg = -1;
 	long start;
 	int error;
 
 	/*
 	 * Extended cylinder group checks.
 	 */
 	/*
 	 * The check-hash is only recomputed when cylinder group hashes are
 	 * enabled and not flagged in ckhashadd; otherwise the stored value
 	 * is compared with itself and always matches.
 	 */
 	calchash = cgp->cg_ckhash;
 	if ((sblock.fs_metackhash & CK_CYLGRP) != 0 &&
 	    (ckhashadd & CK_CYLGRP) == 0) {
 		cghash = cgp->cg_ckhash;
 		cgp->cg_ckhash = 0;
 		calchash = calculate_crc32c(~0L, (void *)cgp, sblock.fs_cgsize);
 		cgp->cg_ckhash = cghash;
 	}
 	error = 0;
 	CHK(cgp->cg_ckhash, !=, calchash, "%jd");
 	CHK(cg_chkmagic(cgp), ==, 0, "%jd");
 	CHK(cgp->cg_cgx, !=, cg, "%jd");
 	CHK(cgp->cg_ndblk, >, sblock.fs_fpg, "%jd");
 	if (sblock.fs_magic == FS_UFS1_MAGIC) {
 		CHK(cgp->cg_old_niblk, !=, sblock.fs_ipg, "%jd");
 		CHK(cgp->cg_old_ncyl, >, sblock.fs_old_cpg, "%jd");
 	} else if (sblock.fs_magic == FS_UFS2_MAGIC) {
 		CHK(cgp->cg_niblk, !=, sblock.fs_ipg, "%jd");
 		CHK(cgp->cg_initediblk, >, sblock.fs_ipg, "%jd");
 	}
 	/* The group that reaches the end of the filesystem may be short. */
 	if (cgbase(&sblock, cg) + sblock.fs_fpg < sblock.fs_size) {
 		CHK(cgp->cg_ndblk, !=, sblock.fs_fpg, "%jd");
 	} else {
 		CHK(cgp->cg_ndblk, !=, sblock.fs_size - cgbase(&sblock, cg),
 		    "%jd");
 	}
 	/* Offset of cg_space[] from the first field of the structure. */
 	start = &cgp->cg_space[0] - (u_char *)(&cgp->cg_firstfield);
 	if (sblock.fs_magic == FS_UFS2_MAGIC) {
 		CHK(cgp->cg_iusedoff, !=, start, "%jd");
 	} else if (sblock.fs_magic == FS_UFS1_MAGIC) {
 		CHK(cgp->cg_niblk, !=, 0, "%jd");
 		CHK(cgp->cg_initediblk, !=, 0, "%jd");
 		CHK(cgp->cg_old_ncyl, !=, sblock.fs_old_cpg, "%jd");
 		CHK(cgp->cg_old_niblk, !=, sblock.fs_ipg, "%jd");
 		CHK(cgp->cg_old_btotoff, !=, start, "%jd");
 		CHK(cgp->cg_old_boff, !=, cgp->cg_old_btotoff +
 		    sblock.fs_old_cpg * sizeof(int32_t), "%jd");
 		CHK(cgp->cg_iusedoff, !=, cgp->cg_old_boff +
 		    sblock.fs_old_cpg * sizeof(u_int16_t), "%jd");
 	}
 	CHK(cgp->cg_freeoff, !=,
 	    cgp->cg_iusedoff + howmany(sblock.fs_ipg, CHAR_BIT), "%jd");
 	if (sblock.fs_contigsumsize == 0) {
 		CHK(cgp->cg_nextfreeoff, !=,
 		    cgp->cg_freeoff + howmany(sblock.fs_fpg, CHAR_BIT), "%jd");
 	} else {
 		CHK(cgp->cg_nclusterblks, !=, cgp->cg_ndblk / sblock.fs_frag,
 		    "%jd");
 		CHK(cgp->cg_clustersumoff, !=,
 		    roundup(cgp->cg_freeoff + howmany(sblock.fs_fpg, CHAR_BIT),
 		    sizeof(u_int32_t)) - sizeof(u_int32_t), "%jd");
 		CHK(cgp->cg_clusteroff, !=, cgp->cg_clustersumoff +
 		    (sblock.fs_contigsumsize + 1) * sizeof(u_int32_t), "%jd");
 		CHK(cgp->cg_nextfreeoff, !=, cgp->cg_clusteroff +
 		    howmany(fragstoblks(&sblock, sblock.fs_fpg), CHAR_BIT),
 		    "%jd");
 	}
 	if (error == 0)
 		return (1);
 	/* Already reported for this group on the previous call. */
 	if (prevfailcg == cg)
 		return (0);
 	prevfailcg = cg;
 	pfatal("CYLINDER GROUP %d: INTEGRITY CHECK FAILED", cg);
 	if (!request_rebuild) {
 		printf("\n");
 		return (0);
 	}
 	if (!reply("REBUILD CYLINDER GROUP")) {
 		printf("YOU WILL NEED TO RERUN FSCK.\n");
 		rerun = 1;
 		return (1);
 	}
 	/*
 	 * Zero out the cylinder group and then initialize critical fields.
 	 * Bit maps and summaries will be recalculated by later passes.
 	 */
 	memset(cgp, 0, (size_t)sblock.fs_cgsize);
 	cgp->cg_magic = CG_MAGIC;
 	cgp->cg_cgx = cg;
 	cgp->cg_niblk = sblock.fs_ipg;
 	cgp->cg_initediblk = MIN(sblock.fs_ipg, 2 * INOPB(&sblock));
 	if (cgbase(&sblock, cg) + sblock.fs_fpg < sblock.fs_size)
 		cgp->cg_ndblk = sblock.fs_fpg;
 	else
 		cgp->cg_ndblk = sblock.fs_size - cgbase(&sblock, cg);
 	/* The layout below mirrors the offsets verified by the checks above. */
 	start = &cgp->cg_space[0] - (u_char *)(&cgp->cg_firstfield);
 	if (sblock.fs_magic == FS_UFS2_MAGIC) {
 		cgp->cg_iusedoff = start;
 	} else if (sblock.fs_magic == FS_UFS1_MAGIC) {
 		cgp->cg_niblk = 0;
 		cgp->cg_initediblk = 0;
 		cgp->cg_old_ncyl = sblock.fs_old_cpg;
 		cgp->cg_old_niblk = sblock.fs_ipg;
 		cgp->cg_old_btotoff = start;
 		cgp->cg_old_boff = cgp->cg_old_btotoff +
 		    sblock.fs_old_cpg * sizeof(int32_t);
 		cgp->cg_iusedoff = cgp->cg_old_boff +
 		    sblock.fs_old_cpg * sizeof(u_int16_t);
 	}
 	cgp->cg_freeoff = cgp->cg_iusedoff + howmany(sblock.fs_ipg, CHAR_BIT);
 	cgp->cg_nextfreeoff = cgp->cg_freeoff + howmany(sblock.fs_fpg,CHAR_BIT);
 	if (sblock.fs_contigsumsize > 0) {
 		cgp->cg_nclusterblks = cgp->cg_ndblk / sblock.fs_frag;
 		cgp->cg_clustersumoff =
 		    roundup(cgp->cg_nextfreeoff, sizeof(u_int32_t));
 		cgp->cg_clustersumoff -= sizeof(u_int32_t);
 		cgp->cg_clusteroff = cgp->cg_clustersumoff +
 		    (sblock.fs_contigsumsize + 1) * sizeof(u_int32_t);
 		cgp->cg_nextfreeoff = cgp->cg_clusteroff +
 		    howmany(fragstoblks(&sblock, sblock.fs_fpg), CHAR_BIT);
 	}
 	cgp->cg_ckhash = calculate_crc32c(~0L, (void *)cgp, sblock.fs_cgsize);
 	cgdirty(cgbp);
 	return (0);
 }
 
 /*
  * Allocate a data block with the specified number of fragments.
  *
  * checkblkavail() is asked about each block-aligned address, first from
  * the data area of cylinder group `startcg' towards the end of the
  * filesystem and then from the data area of group 0 up to `startcg'.
  * A positive answer is the allocated block and is returned.  A negative
  * answer moves the scan to the negated value before stepping on, and
  * zero simply steps to the next block.
  *
  * Returns 0 when nothing could be allocated, when `frags' is not between
  * 1 and fs_frag, or when std_checkblkavail is passed during SUJ recovery.
  */
 ufs2_daddr_t
 allocblk(long startcg, long frags,
     ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t blkno, long frags))
 {
 	ufs2_daddr_t cand, got;
 
 	if (sujrecovery && checkblkavail == std_checkblkavail) {
 		pfatal("allocblk: std_checkblkavail used for SUJ recovery\n");
 		return (0);
 	}
 	if (frags <= 0 || frags > sblock.fs_frag)
 		return (0);
 
 	/* First pass: from the starting group to the end of the filesystem. */
 	cand = MAX(cgdata(&sblock, startcg), 0);
 	while (cand < maxfsblock - sblock.fs_frag) {
 		got = (*checkblkavail)(cand, frags);
 		if (got > 0)
 			return (got);
 		if (got < 0)
 			cand = -got;
 		cand += sblock.fs_frag;
 	}
 
 	/* Second pass: from the first group up to the starting group. */
 	cand = MAX(cgdata(&sblock, 0), 0);
 	while (cand < cgbase(&sblock, startcg) - sblock.fs_frag) {
 		got = (*checkblkavail)(cand, frags);
 		if (got > 0)
 			return (got);
 		if (got < 0)
 			cand = -got;
 		cand += sblock.fs_frag;
 	}
 	return (0);
 }
 
 /*
  * Standard availability check used by allocblk(): try to allocate `frags'
  * contiguous fragments inside the block that starts at `blkno'.
  *
  * Returns the address of the first allocated fragment on success, 0 when
  * the block has no suitable run of unused fragments (or `blkno' is beyond
  * the filesystem), and a negative value when the cylinder group fails its
  * integrity check.  In the latter case the negated value is the last
  * block-aligned address of that group, so that the caller's next step
  * lands in the following group.
  */
 ufs2_daddr_t
-std_checkblkavail(blkno, frags)
-	ufs2_daddr_t blkno;
-	long frags;
+std_checkblkavail(ufs2_daddr_t blkno, long frags)
 {
 	struct bufarea *cgbp;
 	struct cg *cgp;
 	ufs2_daddr_t j, k, baseblk;
 	long cg;
 
 	if ((u_int64_t)blkno > sblock.fs_size)
 		return (0);
 	/* Look for `frags' consecutive fragments not set in the block map. */
 	for (j = 0; j <= sblock.fs_frag - frags; j++) {
 		if (testbmap(blkno + j))
 			continue;
 		for (k = 1; k < frags; k++)
 			if (testbmap(blkno + j + k))
 				break;
 		if (k < frags) {
 			/* Fragment j + k is in use; resume the search after it. */
 			j += k;
 			continue;
 		}
 		cg = dtog(&sblock, blkno + j);
 		cgbp = cglookup(cg);
 		cgp = cgbp->b_un.b_cg;
 		if (!check_cgmagic(cg, cgbp, 0))
 			return (-((cg + 1) * sblock.fs_fpg - sblock.fs_frag));
 		/* Claim the run in the block map and in the group's free map. */
 		baseblk = dtogd(&sblock, blkno + j);
 		for (k = 0; k < frags; k++) {
 			setbmap(blkno + j + k);
 			clrbit(cg_blksfree(cgp), baseblk + k);
 		}
 		n_blks += frags;
 		if (frags == sblock.fs_frag)
 			cgp->cg_cs.cs_nbfree--;
 		else
 			cgp->cg_cs.cs_nffree -= frags;
 		cgdirty(cgbp);
 		return (blkno + j);
 	}
 	return (0);
 }
 
 /*
  * Slow down IO so as to leave some disk bandwidth for other processes.
  *
  * Called before an I/O operation.  Every eighth call (slowio_pollcnt
  * wraps to zero) records the current time in slowio_starttime so that
  * slowio_end() can measure how long that operation took.
  */
 void
 slowio_start(void)
 {
 
 	/* Delay one in every 8 operations */
 	slowio_pollcnt = (slowio_pollcnt + 1) & 7;
 	if (slowio_pollcnt == 0) {
 		gettimeofday(&slowio_starttime, NULL);
 	}
 }
 
 /*
  * Called after an I/O operation.  For the one operation in eight that
  * slowio_start() timed, fold the measured duration into the running
  * average slowio_delay_usec and sleep for eight times that average.
  *
  * The elapsed time is computed in a wide type and clamped to the range
  * 64..2500000 microseconds before it is narrowed to int, so a very long
  * stall cannot overflow the calculation and slip past the clamp.
  */
 void
 slowio_end(void)
 {
 	struct timeval tv;
 	long long elapsed_usec;
 	int delay_usec;
 
 	if (slowio_pollcnt != 0)
 		return;
 
 	/* Update the slowdown interval. */
 	gettimeofday(&tv, NULL);
 	elapsed_usec =
 	    (long long)(tv.tv_sec - slowio_starttime.tv_sec) * 1000000 +
 	    (tv.tv_usec - slowio_starttime.tv_usec);
 	if (elapsed_usec < 64)
 		elapsed_usec = 64;
 	if (elapsed_usec > 2500000)
 		elapsed_usec = 2500000;
 	delay_usec = (int)elapsed_usec;
 	/* Running average weighted 63:1 towards the previous value. */
 	slowio_delay_usec = (slowio_delay_usec * 63 + delay_usec) >> 6;
 	/* delay by 8 times the average IO delay */
 	if (slowio_delay_usec > 64)
 		usleep(slowio_delay_usec * 8);
 }
 
 /*
  * Find a pathname
  *
  * Build in `namebuf' the path of inode `ino', whose containing directory
  * is `curdir', by walking ".." entries up to the root.  The name is
  * assembled backwards from the end of the buffer and finally moved to
  * the front; namebuf[MAXPATHLEN - 1] is written, so the buffer is
  * assumed to hold at least MAXPATHLEN bytes.
  *
  * The result is "/" for the root itself and "?" when the routine is
  * already running or `curdir' is not a valid directory inode.  If the
  * walk stops before reaching the root the result starts with '?'.
  */
 void
 getpathname(char *namebuf, ino_t curdir, ino_t ino)
 {
 	int len;
 	char *cp;
 	struct inode ip;
 	struct inodesc idesc;
 	/* Set while a lookup is in progress; a nested call returns "?". */
 	static int busy = 0;
 
 	if (curdir == ino && ino == UFS_ROOTINO) {
 		(void)strcpy(namebuf, "/");
 		return;
 	}
 	if (busy || !INO_IS_DVALID(curdir)) {
 		(void)strcpy(namebuf, "?");
 		return;
 	}
 	busy = 1;
 	memset(&idesc, 0, sizeof(struct inodesc));
 	idesc.id_type = DATA;
 	idesc.id_fix = IGNORE;
 	/* cp marks the start of the partial path built at the buffer's end. */
 	cp = &namebuf[MAXPATHLEN - 1];
 	*cp = '\0';
 	/* The parent is already known, so skip the ".." lookup once. */
 	if (curdir != ino) {
 		idesc.id_parent = curdir;
 		goto namelookup;
 	}
 	while (ino != UFS_ROOTINO) {
 		/* Find the parent of `ino' through its ".." entry. */
 		idesc.id_number = ino;
 		idesc.id_func = findino;
 		idesc.id_name = strdup("..");
 		ginode(ino, &ip);
 		if ((ckinode(ip.i_dp, &idesc) & FOUND) == 0) {
 			irelse(&ip);
+			free(idesc.id_name);
 			break;
 		}
 		irelse(&ip);
+		free(idesc.id_name);
 	namelookup:
 		/* Look up the name of `ino' in its parent; it lands in namebuf. */
 		idesc.id_number = idesc.id_parent;
 		idesc.id_parent = ino;
 		idesc.id_func = findname;
 		idesc.id_name = namebuf;
 		ginode(idesc.id_number, &ip);
 		if ((ckinode(ip.i_dp, &idesc) & FOUND) == 0) {
 			irelse(&ip);
 			break;
 		}
 		irelse(&ip);
 		/* Prepend "/name" to the partial path. */
 		len = strlen(namebuf);
 		cp -= len;
 		memmove(cp, namebuf, (size_t)len);
 		*--cp = '/';
 		/* Stop when another full-length name might not fit. */
 		if (cp < &namebuf[UFS_MAXNAMLEN])
 			break;
 		ino = idesc.id_number;
 	}
 	busy = 0;
 	if (ino != UFS_ROOTINO)
 		*--cp = '?';
 	memmove(namebuf, cp, (size_t)(&namebuf[MAXPATHLEN] - cp));
 }
 
 /*
  * Signal handler: finish the check without marking the filesystem clean
  * and exit with status 12.
  */
 void
 catch(int sig __unused)
 {
 	const int status = 12;
 
 	ckfini(0);
 	exit(status);
 }
 
 /*
  * SIGQUIT handler used while preening.  A single quit requests a special
  * exit once the file system checks are complete, so that the reboot
  * sequence may be interrupted.  The handler is then reset to the default
  * action.
  */
 void
 catchquit(int sig __unused)
 {
 
 	fputs("returning to single-user after file system check\n", stdout);
 	returntosingle = 1;
 	(void)signal(SIGQUIT, SIG_DFL);
 }
 
 /*
  * Decide whether the problem described by `msg' should be repaired.
  *
  * The decision is kept in idesc->id_fix.  While it is still DONTKNOW the
  * problem is reported and, unless preening, the operator is asked; the
  * answer is stored as FIX or NOFIX for later calls.  Returns ALTERED
  * when the repair is to be made and 0 otherwise.  An unknown mode is
  * fatal.
  */
 int
 dofix(struct inodesc *idesc, const char *msg)
 {
 	int mode = idesc->id_fix;
 
 	/* A decision made earlier is simply reported back. */
 	if (mode == FIX)
 		return (ALTERED);
 	if (mode == NOFIX || mode == IGNORE)
 		return (0);
 	if (mode != DONTKNOW)
 		errx(EEXIT, "UNKNOWN INODESC FIX MODE %d", idesc->id_fix);
 
 	/* Undecided: report the problem and settle the question now. */
 	if (idesc->id_type == DATA)
 		direrror(idesc->id_number, msg);
 	else
 		pwarn("%s", msg);
 	if (preen) {
 		printf(" (SALVAGED)\n");
 	} else if (reply("SALVAGE") == 0) {
 		idesc->id_fix = NOFIX;
 		return (0);
 	}
 	idesc->id_fix = FIX;
 	return (ALTERED);
 }
 
 #include <stdarg.h>
 
 /*
  * Print a caller-supplied printf-style message followed by the details
  * of buffer `bp': address, type, block number, size, reference count,
  * dirty state and index.  When preening the line is prefixed with the
  * device name.
  */
 void
 prtbuf(struct bufarea *bp, const char *fmt, ...)
 {
 	va_list args;
 	const char *state;
 
 	if (preen)
 		(void)printf("%s: ", cdevname);
 	va_start(args, fmt);
 	(void)vprintf(fmt, args);
 	va_end(args);
 	state = (bp->b_flags & B_DIRTY) ? "dirty" : "clean";
 	printf(": bp %p, type %s, bno %jd, size %d, refcnt %d, flags %s, "
 	    "index %jd\n", bp, BT_BUFTYPE(bp->b_type), (intmax_t) bp->b_bno,
 	    bp->b_size, bp->b_refcnt, state, (intmax_t) bp->b_index);
 }
 
 /*
  * An unexpected inconsistency occurred.
  *
  * When not preening the printf-style message is printed (followed by a
  * note if soft updates were in use) and the function returns, unless a
  * background check is running: then the filesystem is flagged as needing
  * a foreground fsck and the program exits.
  *
  * When preening the message is printed with the device name as prefix,
  * the filesystem is flagged in the same way if a background check is
  * running, and the program always exits.
  */
 void
 pfatal(const char *fmt, ...)
 {
 	va_list ap;
 	va_start(ap, fmt);
 	if (!preen) {
 		(void)vfprintf(stdout, fmt, ap);
 		va_end(ap);
 		if (usedsoftdep)
 			(void)fprintf(stdout,
 			    "\nUNEXPECTED SOFT UPDATE INCONSISTENCY\n");
 		/*
 		 * Force foreground fsck to clean up inconsistency.
 		 */
 		if (bkgrdflag) {
 			cmd.value = FS_NEEDSFSCK;
 			cmd.size = 1;
 			if (sysctlbyname("vfs.ffs.setflags", 0, 0,
 			    &cmd, sizeof cmd) == -1)
 				pwarn("CANNOT SET FS_NEEDSFSCK FLAG\n");
 			fprintf(stdout, "CANNOT RUN IN BACKGROUND\n");
 			ckfini(0);
 			exit(EEXIT);
 		}
 		return;
 	}
 	if (cdevname == NULL)
 		cdevname = strdup("fsck");
 	(void)fprintf(stdout, "%s: ", cdevname);
 	(void)vfprintf(stdout, fmt, ap);
 	/* Every va_start() needs its va_end(), also on the path that exits. */
 	va_end(ap);
 	(void)fprintf(stdout,
 	    "\n%s: UNEXPECTED%sINCONSISTENCY; RUN fsck MANUALLY.\n",
 	    cdevname, usedsoftdep ? " SOFT UPDATE " : " ");
 	/*
 	 * Force foreground fsck to clean up inconsistency.
 	 */
 	if (bkgrdflag) {
 		cmd.value = FS_NEEDSFSCK;
 		cmd.size = 1;
 		if (sysctlbyname("vfs.ffs.setflags", 0, 0,
 		    &cmd, sizeof cmd) == -1)
 			pwarn("CANNOT SET FS_NEEDSFSCK FLAG\n");
 	}
 	ckfini(0);
 	exit(EEXIT);
 }
 
 /*
  * Print a printf-style message on standard output.  When preening the
  * message is preceded by the device name; otherwise it is printed as is.
  */
 void
 pwarn(const char *fmt, ...)
 {
 	va_list args;
 
 	if (preen)
 		(void)printf("%s: ", cdevname);
 	va_start(args, fmt);
 	(void)vprintf(fmt, args);
 	va_end(args);
 }
 
 /*
  * Stand-in for the kernel routine of the same name: report an internal
  * inconsistency through pfatal(), print the caller's printf-style
  * message and exit.  Note that pfatal() does not return when preening,
  * in which case the caller's message is not printed.
  */
 void
 panic(const char *fmt, ...)
 {
 	va_list args;
 
 	pfatal("INTERNAL INCONSISTENCY:");
 	va_start(args, fmt);
 	(void)vprintf(fmt, args);
 	va_end(args);
 	exit(EEXIT);
 }
diff --git a/sbin/fsck_ffs/inode.c b/sbin/fsck_ffs/inode.c
index 057d49a1ea18..947e5e0cbc08 100644
--- a/sbin/fsck_ffs/inode.c
+++ b/sbin/fsck_ffs/inode.c
@@ -1,1471 +1,1463 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 1980, 1986, 1993
  *	The Regents of the University of California.  All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #if 0
 #ifndef lint
 static const char sccsid[] = "@(#)inode.c	8.8 (Berkeley) 4/28/95";
 #endif /* not lint */
 #endif
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/stat.h>
 #include <sys/stdint.h>
 #include <sys/sysctl.h>
 
 #include <ufs/ufs/dinode.h>
 #include <ufs/ufs/dir.h>
 #include <ufs/ffs/fs.h>
 
 #include <err.h>
 #include <pwd.h>
 #include <string.h>
 #include <time.h>
 #include <libufs.h>
 
 #include "fsck.h"
 
 struct bufarea *icachebp;	/* inode cache buffer */
 
 static int iblock(struct inodesc *, off_t isize, int type);
 static ufs2_daddr_t indir_blkatoff(ufs2_daddr_t, ino_t, ufs_lbn_t, ufs_lbn_t,
     struct bufarea **);
 static int snapclean(struct inodesc *idesc);
 static void chkcopyonwrite(struct fs *, ufs2_daddr_t,
     ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t, long));
 
 /*
  * Walk every block pointer of the inode dp, calling idesc->id_func on each
  * allocated block (or dirscan() when idesc->id_type is DATA).
  *
  * The traversal state in idesc (id_lbn, id_level, id_numfrags, id_blkno,
  * ...) is reset here and updated as the walk proceeds.  Returns the
  * callback's result as soon as it has the STOP bit set, otherwise KEEPON.
  */
 int
 ckinode(union dinode *dp, struct inodesc *idesc)
 {
 	off_t remsize, sizepb;
 	int i, offset, ret;
 	struct inode ip;
 	union dinode dino;
 	ufs2_daddr_t ndb;
 	mode_t mode;
 	char pathbuf[MAXPATHLEN + 1];
 
 	if (idesc->id_fix != IGNORE)
 		idesc->id_fix = DONTKNOW;
 	idesc->id_dp = dp;
 	idesc->id_lbn = -1;
 	idesc->id_lballoc = -1;
 	idesc->id_level = 0;
 	idesc->id_entryno = 0;
 	idesc->id_filesize = DIP(dp, di_size);
 	mode = DIP(dp, di_mode) & IFMT;
 	/* Device nodes and short symlinks are not traversed. */
 	if (mode == IFBLK || mode == IFCHR || (mode == IFLNK &&
 	    DIP(dp, di_size) < (unsigned)sblock.fs_maxsymlinklen))
 		return (KEEPON);
 	/* The walk below reads block pointers from this local copy. */
 	if (sblock.fs_magic == FS_UFS1_MAGIC)
 		dino.dp1 = dp->dp1;
 	else
 		dino.dp2 = dp->dp2;
 	/* Number of fs_bsize blocks needed to hold di_size bytes. */
 	ndb = howmany(DIP(&dino, di_size), sblock.fs_bsize);
 	for (i = 0; i < UFS_NDADDR; i++) {
 		idesc->id_lbn++;
 		/*
 		 * The final block of the file may be a partial block; every
 		 * other block is a full fs_frag fragments.
 		 */
 		if (--ndb == 0 &&
 		    (offset = blkoff(&sblock, DIP(&dino, di_size))) != 0)
 			idesc->id_numfrags =
 				numfrags(&sblock, fragroundup(&sblock, offset));
 		else
 			idesc->id_numfrags = sblock.fs_frag;
 		if (DIP(&dino, di_db[i]) == 0) {
 			/* ndb >= 0 means this hole lies within di_size. */
 			if (idesc->id_type == DATA && ndb >= 0) {
 				/* An empty block in a directory XXX */
 				getpathname(pathbuf, idesc->id_number,
 						idesc->id_number);
 				pfatal("DIRECTORY %s: CONTAINS EMPTY BLOCKS",
 					pathbuf);
 				if (reply("ADJUST LENGTH") == 1) {
 					/* Truncate the directory at the hole. */
 					ginode(idesc->id_number, &ip);
 					DIP_SET(ip.i_dp, di_size,
 					    i * sblock.fs_bsize);
 					printf(
 					    "YOU MUST RERUN FSCK AFTERWARDS\n");
 					rerun = 1;
 					inodirty(&ip);
 					irelse(&ip);
 				}
 			}
 			continue;
 		}
 		idesc->id_blkno = DIP(&dino, di_db[i]);
 		if (idesc->id_type != DATA)
 			ret = (*idesc->id_func)(idesc);
 		else
 			ret = dirscan(idesc);
 		if (ret & STOP)
 			return (ret);
 	}
 	/* Indirect blocks: remsize is the size not covered by direct blocks. */
 	idesc->id_numfrags = sblock.fs_frag;
 	remsize = DIP(&dino, di_size) - sblock.fs_bsize * UFS_NDADDR;
 	sizepb = sblock.fs_bsize;
 	for (i = 0; i < UFS_NIADDR; i++) {
 		/* sizepb: bytes mapped by one indirect tree of level i + 1. */
 		sizepb *= NINDIR(&sblock);
 		idesc->id_level = i + 1;
 		if (DIP(&dino, di_ib[i])) {
 			idesc->id_blkno = DIP(&dino, di_ib[i]);
 			ret = iblock(idesc, remsize, BT_LEVEL1 + i);
 			if (ret & STOP)
 				return (ret);
 		} else if (remsize > 0) {
 			/* Missing indirect tree: skip the lbns it would map. */
 			idesc->id_lbn += sizepb / sblock.fs_bsize;
 			if (idesc->id_type == DATA) {
 				/* An empty block in a directory XXX */
 				getpathname(pathbuf, idesc->id_number,
 						idesc->id_number);
 				pfatal("DIRECTORY %s: CONTAINS EMPTY BLOCKS",
 					pathbuf);
 				if (reply("ADJUST LENGTH") == 1) {
 					ginode(idesc->id_number, &ip);
 					DIP_SET(ip.i_dp, di_size,
 					    DIP(ip.i_dp, di_size) - remsize);
 					remsize = 0;
 					printf(
 					    "YOU MUST RERUN FSCK AFTERWARDS\n");
 					rerun = 1;
 					inodirty(&ip);
 					irelse(&ip);
 					break;
 				}
 			}
 		}
 		remsize -= sizepb;
 	}
 	return (KEEPON);
 }
 
 /*
  * Process the indirect block idesc->id_blkno and everything below it.
  *
  * isize is the number of bytes of the file still to be mapped by this
  * indirect tree; type is the buffer type passed to getdatablk().  For
  * non-DATA walks the callback is first applied to the indirect block
  * itself.  Returns SKIP if the block cannot be read, the callback's result
  * if it has STOP set, STOP after a directory length adjustment, and KEEPON
  * otherwise.
  */
 static int
 iblock(struct inodesc *idesc, off_t isize, int type)
 {
 	struct inode ip;
 	struct bufarea *bp;
 	int i, n, (*func)(struct inodesc *), nif;
 	off_t sizepb;
 	char buf[BUFSIZ];
 	char pathbuf[MAXPATHLEN + 1];
 
 	if (idesc->id_type != DATA) {
 		func = idesc->id_func;
 		if (((n = (*func)(idesc)) & KEEPON) == 0)
 			return (n);
 	} else
 		func = dirscan;
 	bp = getdatablk(idesc->id_blkno, sblock.fs_bsize, type);
 	if (bp->b_errs != 0) {
 		brelse(bp);
 		return (SKIP);
 	}
 	idesc->id_bp = bp;
 	idesc->id_level--;
 	/* sizepb: bytes mapped by each pointer held in this block. */
 	for (sizepb = sblock.fs_bsize, i = 0; i < idesc->id_level; i++)
 		sizepb *= NINDIR(&sblock);
 	/* nif: number of pointers that should be in use given isize. */
 	if (howmany(isize, sizepb) > NINDIR(&sblock))
 		nif = NINDIR(&sblock);
 	else
 		nif = howmany(isize, sizepb);
 	if (idesc->id_func == pass1check && nif < NINDIR(&sblock)) {
 		/* Pointers past the end of the file must be zero. */
 		for (i = nif; i < NINDIR(&sblock); i++) {
 			if (IBLK(bp, i) == 0)
 				continue;
 			(void)snprintf(buf, sizeof(buf),
 			    "PARTIALLY TRUNCATED INODE I=%lu",
 			    (u_long)idesc->id_number);
 			if (preen) {
 				pfatal("%s", buf);
 			} else if (dofix(idesc, buf)) {
 				IBLK_SET(bp, i, 0);
 				dirty(bp);
 			}
 		}
 		flush(fswritefd, bp);
 	}
 	for (i = 0; i < nif; i++) {
 		if (IBLK(bp, i)) {
 			idesc->id_blkno = IBLK(bp, i);
 			bp->b_index = i;
 			if (idesc->id_level == 0) {
 				idesc->id_lbn++;
 				n = (*func)(idesc);
 			} else {
 				n = iblock(idesc, isize, type - 1);
 				/* Undo the id_level-- done by the callee. */
 				idesc->id_level++;
 			}
 			if (n & STOP) {
 				brelse(bp);
 				return (n);
 			}
 		} else {
 			idesc->id_lbn += sizepb / sblock.fs_bsize;
 			if (idesc->id_type == DATA && isize > 0) {
 				/* An empty block in a directory XXX */
 				getpathname(pathbuf, idesc->id_number,
 						idesc->id_number);
 				pfatal("DIRECTORY %s: CONTAINS EMPTY BLOCKS",
 					pathbuf);
 				if (reply("ADJUST LENGTH") == 1) {
 					ginode(idesc->id_number, &ip);
 					DIP_SET(ip.i_dp, di_size,
 					    DIP(ip.i_dp, di_size) - isize);
 					isize = 0;
 					printf(
 					    "YOU MUST RERUN FSCK AFTERWARDS\n");
 					rerun = 1;
 					inodirty(&ip);
 					/*
 					 * Drop the reference taken by
 					 * ginode(), as ckinode() does.
 					 */
 					irelse(&ip);
 					brelse(bp);
 					return(STOP);
 				}
 			}
 		}
 		isize -= sizepb;
 	}
 	brelse(bp);
 	return (KEEPON);
 }
 
 /*
  * Finds the disk block address at the specified lbn within the inode
  * specified by dp.  This follows the whole tree and honors di_size and
  * di_extsize so it is a true test of reachability.  The lbn may be
  * negative if an extattr or indirect block is requested.
  */
 ufs2_daddr_t
 ino_blkatoff(union dinode *dp, ino_t ino, ufs_lbn_t lbn, int *frags,
     struct bufarea **bpp)
 {
 	ufs_lbn_t tmpval;
 	ufs_lbn_t cur;
 	ufs_lbn_t next;
 	int i;
 
 	/* Defaults for the "not found" returns below. */
 	*frags = 0;
 	if (bpp != NULL)
 		*bpp = NULL;
 	/*
 	 * Handle extattr blocks first.
 	 */
 	if (lbn < 0 && lbn >= -UFS_NXADDR) {
 		lbn = -1 - lbn;
 		if (lbn > lblkno(&sblock, dp->dp2.di_extsize - 1))
 			return (0);
 		*frags = numfrags(&sblock,
 		    sblksize(&sblock, dp->dp2.di_extsize, lbn));
 		return (dp->dp2.di_extb[lbn]);
 	}
 	/*
 	 * Now direct and indirect.  di_mode also carries the permission
 	 * bits, so the file type must be extracted with IFMT before it is
 	 * compared (as ckinode() does).
 	 */
 	if ((DIP(dp, di_mode) & IFMT) == IFLNK &&
 	    DIP(dp, di_size) < sblock.fs_maxsymlinklen)
 		return (0);
 	if (lbn >= 0 && lbn < UFS_NDADDR) {
 		*frags = numfrags(&sblock,
 		    sblksize(&sblock, DIP(dp, di_size), lbn));
 		return (DIP(dp, di_db[lbn]));
 	}
 	*frags = sblock.fs_frag;
 
 	/*
 	 * For each indirect level i, [cur, next) is the range of lbns the
 	 * tree maps and -cur - i is the lbn naming its root indirect block.
 	 */
 	for (i = 0, tmpval = NINDIR(&sblock), cur = UFS_NDADDR; i < UFS_NIADDR;
 	    i++, tmpval *= NINDIR(&sblock), cur = next) {
 		next = cur + tmpval;
 		if (lbn == -cur - i)
 			return (DIP(dp, di_ib[i]));
 		/*
 		 * Determine whether the lbn in question is within this tree.
 		 */
 		if (lbn < 0 && -lbn >= next)
 			continue;
 		if (lbn > 0 && lbn >= next)
 			continue;
 		if (DIP(dp, di_ib[i]) == 0)
 			return (0);
 		return (indir_blkatoff(DIP(dp, di_ib[i]), ino, -cur - i, lbn,
 		    bpp));
 	}
 	pfatal("lbn %jd not in ino %ju\n", (intmax_t)lbn, (uintmax_t)ino);
 	return (0);
 }
 
 /*
  * Fetch an indirect block to find the block at a given lbn.  The lbn
  * may be negative to fetch a specific indirect block pointer or positive
  * to fetch a specific block.
  */
 static ufs2_daddr_t
 indir_blkatoff(ufs2_daddr_t blk, ino_t ino, ufs_lbn_t cur, ufs_lbn_t lbn,
     struct bufarea **bpp)
 {
 	struct bufarea *bp;
 	ufs_lbn_t lbnadd;
 	ufs_lbn_t base;
 	int i, level;
 
 	level = lbn_level(cur);
 	if (level == -1)
 		pfatal("Invalid indir lbn %jd in ino %ju\n",
 		    (intmax_t)lbn, (uintmax_t)ino);
 	if (level == 0 && lbn < 0)
 		pfatal("Invalid lbn %jd in ino %ju\n",
 		    (intmax_t)lbn, (uintmax_t)ino);
 	/* lbnadd: number of lbns mapped by each pointer at this level. */
 	lbnadd = 1;
 	base = -(cur + level);
 	for (i = level; i > 0; i--)
 		lbnadd *= NINDIR(&sblock);
 	/* Index of the pointer in this block that leads towards lbn. */
 	if (lbn > 0)
 		i = (lbn - base) / lbnadd;
 	else
 		i = (-lbn - base) / lbnadd;
 	if (i < 0 || i >= NINDIR(&sblock)) {
 		pfatal("Invalid indirect index %d produced by lbn %jd "
 		    "in ino %ju\n", i, (intmax_t)lbn, (uintmax_t)ino);
 		return (0);
 	}
 	/* cur becomes the lbn that names the entry selected above. */
 	if (level == 0)
 		cur = base + (i * lbnadd);
 	else
 		cur = -(base + (i * lbnadd)) - (level - 1);
 	bp = getdatablk(blk, sblock.fs_bsize, BT_LEVEL1 + level);
 	if (bp->b_errs != 0) {
 		/* Release the buffer on error, as iblock() does. */
 		brelse(bp);
 		return (0);
 	}
 	blk = IBLK(bp, i);
 	bp->b_index = i;
 	if (cur == lbn || blk == 0) {
 		/* Hand the held buffer to the caller if it asked for it. */
 		if (bpp != NULL)
 			*bpp = bp;
 		else
 			brelse(bp);
 		return (blk);
 	}
 	brelse(bp);
 	if (level == 0)
 		pfatal("Invalid lbn %jd at level 0 for ino %ju\n",
 		    (intmax_t)lbn, (uintmax_t)ino);
 	return (indir_blkatoff(blk, ino, cur, lbn, bpp));
 }
 
 /*
  * Check that a block is a legal block number.
  * Return 0 if in range, 1 if out of range.
  */
 int
 chkrange(ufs2_daddr_t blk, int cnt)
 {
 	int cg;
 
 	/* The run must be non-empty and lie within the filesystem. */
 	if (cnt <= 0 || blk <= 0 || blk > maxfsblock ||
 	    cnt - 1 > maxfsblock - blk) {
 		if (debug)
 			printf("out of range: blk %ld, offset %i, size %d\n",
 			    (long)blk, (int)fragnum(&sblock, blk), cnt);
 		return (1);
 	}
 	/* The run must not extend past the end of its block. */
 	if (cnt > sblock.fs_frag ||
 	    fragnum(&sblock, blk) + cnt > sblock.fs_frag) {
 		if (debug)
 			printf("bad size: blk %ld, offset %i, size %d\n",
 			    (long)blk, (int)fragnum(&sblock, blk), cnt);
 		return (1);
 	}
 	cg = dtog(&sblock, blk);
 	if (blk < cgdmin(&sblock, cg)) {
 		/* Starts before the cylinder group's cgdmin address. */
 		if ((blk + cnt) <= cgsblock(&sblock, cg))
 			return (0);
 		if (debug) {
 			printf("blk %ld < cgdmin %ld;",
 			    (long)blk, (long)cgdmin(&sblock, cg));
 			printf(" blk + cnt %ld > cgsbase %ld\n",
 			    (long)(blk + cnt),
 			    (long)cgsblock(&sblock, cg));
 		}
 		return (1);
 	}
 	/* Starts at or after cgdmin: must end within this cylinder group. */
 	if ((blk + cnt) <= cgbase(&sblock, cg + 1))
 		return (0);
 	if (debug) {
 		printf("blk %ld >= cgdmin %ld;",
 		    (long)blk, (long)cgdmin(&sblock, cg));
 		printf(" blk + cnt %ld > sblock.fs_fpg %ld\n",
 		    (long)(blk + cnt), (long)sblock.fs_fpg);
 	}
 	return (1);
 }
 
 /*
  * General purpose interface for reading inodes.
  *
  * firstinum and lastinum track contents of getnextino() cache (below).
  */
 static ino_t firstinum, lastinum;
 static struct bufarea inobuf;
 
 /*
  * Fill in ip for inode inumber, taking a reference on the buffer that
  * holds it; the reference is dropped with irelse().
  *
  * Exits via errx() if inumber is out of range.  If the inode block cannot
  * be read, ip->i_bp is set to NULL and ip->i_dp points at zino.
  */
 void
 ginode(ino_t inumber, struct inode *ip)
 {
 	ufs2_daddr_t iblk;
 
 	if (inumber < UFS_ROOTINO || inumber > maxino)
 		errx(EEXIT, "bad inode number %ju to ginode",
 		    (uintmax_t)inumber);
 	ip->i_number = inumber;
 	if (inumber >= firstinum && inumber < lastinum) {
 		/* contents in getnextino() cache */
 		ip->i_bp = &inobuf;
 		inobuf.b_refcnt++;
 		inobuf.b_index = firstinum;
 	} else if (icachebp != NULL &&
 	    inumber >= icachebp->b_index &&
 	    inumber < icachebp->b_index + INOPB(&sblock)) {
 		/* take an additional reference for the returned inode */
 		icachebp->b_refcnt++;
 		ip->i_bp = icachebp;
 	} else {
 		/* Not cached: replace icachebp with the block holding it. */
 		iblk = ino_to_fsba(&sblock, inumber);
 		/* release our cache-hold reference on old icachebp */
 		if (icachebp != NULL)
 			brelse(icachebp);
 		icachebp = getdatablk(iblk, sblock.fs_bsize, BT_INODES);
 		if (icachebp->b_errs != 0) {
 			icachebp = NULL;
 			ip->i_bp = NULL;
 			ip->i_dp = &zino;
 			return;
 		}
 		/* take a cache-hold reference on new icachebp */
 		icachebp->b_refcnt++;
 		/* b_index records the first inode number in the buffer. */
 		icachebp->b_index = rounddown(inumber, INOPB(&sblock));
 		ip->i_bp = icachebp;
 	}
 	if (sblock.fs_magic == FS_UFS1_MAGIC) {
 		ip->i_dp = (union dinode *)
 		    &ip->i_bp->b_un.b_dinode1[inumber - ip->i_bp->b_index];
 		return;
 	}
 	ip->i_dp = (union dinode *)
 	    &ip->i_bp->b_un.b_dinode2[inumber - ip->i_bp->b_index];
 	/* Non-UFS1 only: verify the inode check-hash, offering to fix it. */
 	if (ffs_verify_dinode_ckhash(&sblock, (struct ufs2_dinode *)ip->i_dp)) {
 		pwarn("INODE CHECK-HASH FAILED");
 		prtinode(ip);
 		if (preen || reply("FIX") != 0) {
 			if (preen)
 				printf(" (FIXED)\n");
 			ffs_update_dinode_ckhash(&sblock,
 			    (struct ufs2_dinode *)ip->i_dp);
 			inodirty(ip);
 		}
 	}
 }
 
 /*
  * Release a held inode.
  */
 void
 irelse(struct inode *ip)
 {
 
 	/* Check for failed inode read */
 	if (ip->i_bp == NULL)
 		return;
 	if (ip->i_bp->b_refcnt <= 0)
 		pfatal("irelse: releasing unreferenced ino %ju\n",
 		    (uintmax_t) ip->i_number);
 	brelse(ip->i_bp);
 }
 
 /*
  * Special purpose version of ginode used to optimize first pass
  * over all the inodes in numerical order.
  */
 static ino_t nextinum, lastvalidinum;
 static long readcount, readpercg, fullcnt, inobufsize, partialcnt, partialsize;
 
 /*
  * Return a pointer to the on-disk inode inumber, which must be the inode
  * following the one returned by the previous call (the sequence is set up
  * by setinodebuf()).  Inodes are read into inobuf in large chunks.
  *
  * When rebuildcg is set, the first inode of each chunk is sanity checked
  * and NULL is returned if it does not look like a valid inode.
  */
 union dinode *
 getnextinode(ino_t inumber, int rebuildcg)
 {
 	int j;
 	long size;
 	mode_t mode;
 	ufs2_daddr_t ndb, blk;
 	union dinode *dp;
 	struct inode ip;
 	static caddr_t nextinop;
 
 	if (inumber != nextinum++ || inumber > lastvalidinum)
 		errx(EEXIT, "bad inode number %ju to nextinode",
 		    (uintmax_t)inumber);
 	if (inumber >= lastinum) {
 		/* Buffer exhausted: read the next chunk of inodes. */
 		readcount++;
 		firstinum = lastinum;
 		blk = ino_to_fsba(&sblock, lastinum);
 		/* Every readpercg-th read is the (possibly short) last one. */
 		if (readcount % readpercg == 0) {
 			size = partialsize;
 			lastinum += partialcnt;
 		} else {
 			size = inobufsize;
 			lastinum += fullcnt;
 		}
 		/*
 		 * Flush old contents in case they have been updated.
 		 * If getblk encounters an error, it will already have zeroed
 		 * out the buffer, so we do not need to do so here.
 		 */
 		if (inobuf.b_refcnt != 0)
 			pfatal("Non-zero getnextinode() ref count %d\n",
 			    inobuf.b_refcnt);
 		flush(fswritefd, &inobuf);
 		getblk(&inobuf, blk, size);
 		nextinop = inobuf.b_un.b_buf;
 	}
 	/* Hand out the current inode and step past it for the next call. */
 	dp = (union dinode *)nextinop;
 	if (sblock.fs_magic == FS_UFS1_MAGIC)
 		nextinop += sizeof(struct ufs1_dinode);
 	else
 		nextinop += sizeof(struct ufs2_dinode);
 	/* If check-hashes are being added, compute one for this inode. */
 	if ((ckhashadd & CK_INODE) != 0) {
 		ffs_update_dinode_ckhash(&sblock, (struct ufs2_dinode *)dp);
 		dirty(&inobuf);
 	}
 	if (ffs_verify_dinode_ckhash(&sblock, (struct ufs2_dinode *)dp) != 0) {
 		pwarn("INODE CHECK-HASH FAILED");
 		/* Build a temporary struct inode just for prtinode(). */
 		ip.i_bp = NULL;
 		ip.i_dp = dp;
 		ip.i_number = inumber;
 		prtinode(&ip);
 		if (preen || reply("FIX") != 0) {
 			if (preen)
 				printf(" (FIXED)\n");
 			ffs_update_dinode_ckhash(&sblock,
 			    (struct ufs2_dinode *)dp);
 			dirty(&inobuf);
 		}
 	}
 	/* Only the first inode of a freshly read chunk is sanity checked. */
 	if (rebuildcg && (char *)dp == inobuf.b_un.b_buf) {
 		/*
 		 * Try to determine if we have reached the end of the
 		 * allocated inodes.
 		 */
 		mode = DIP(dp, di_mode) & IFMT;
 		if (mode == 0) {
 			/* A typeless inode must have no blocks, mode or size. */
 			if (memcmp(dp->dp2.di_db, zino.dp2.di_db,
 				UFS_NDADDR * sizeof(ufs2_daddr_t)) ||
 			      memcmp(dp->dp2.di_ib, zino.dp2.di_ib,
 				UFS_NIADDR * sizeof(ufs2_daddr_t)) ||
 			      dp->dp2.di_mode || dp->dp2.di_size)
 				return (NULL);
 			return (dp);
 		}
 		if (!ftypeok(dp))
 			return (NULL);
 		ndb = howmany(DIP(dp, di_size), sblock.fs_bsize);
 		if (ndb < 0)
 			return (NULL);
 		if (mode == IFBLK || mode == IFCHR)
 			ndb++;
 		if (mode == IFLNK) {
 			/*
 			 * Fake ndb value so direct/indirect block checks below
 			 * will detect any garbage after symlink string.
 			 */
 			if (DIP(dp, di_size) < (off_t)sblock.fs_maxsymlinklen) {
 				ndb = howmany(DIP(dp, di_size),
 				    sizeof(ufs2_daddr_t));
 				if (ndb > UFS_NDADDR) {
 					j = ndb - UFS_NDADDR;
 					for (ndb = 1; j > 1; j--)
 						ndb *= NINDIR(&sblock);
 					ndb += UFS_NDADDR;
 				}
 			}
 		}
 		/* Direct pointers beyond the last needed block must be zero. */
 		for (j = ndb; ndb < UFS_NDADDR && j < UFS_NDADDR; j++)
 			if (DIP(dp, di_db[j]) != 0)
 				return (NULL);
 		/* j: number of indirect levels needed to map ndb blocks. */
 		for (j = 0, ndb -= UFS_NDADDR; ndb > 0; j++)
 			ndb /= NINDIR(&sblock);
 		/* Indirect pointers for unneeded levels must be zero. */
 		for (; j < UFS_NIADDR; j++)
 			if (DIP(dp, di_ib[j]) != 0)
 				return (NULL);
 	}
 	return (dp);
 }
 
 /*
  * Prepare getnextinode() to iterate over the first inosused inodes of
  * cylinder group cg, allocating the shared inode buffer on first use.
  */
 void
 setinodebuf(int cg, ino_t inosused)
 {
 	ino_t firstino;
 	size_t dinosize;
 
 	firstino = cg * sblock.fs_ipg;
 	lastvalidinum = firstino + inosused - 1;
 	nextinum = firstino;
 	lastinum = firstino;
 	readcount = 0;
 	/* Flush old contents in case they have been updated */
 	flush(fswritefd, &inobuf);
 	inobuf.b_bno = 0;
 	if (inobuf.b_un.b_buf == NULL) {
 		inobufsize = blkroundup(&sblock,
 		    MAX(INOBUFSIZE, sblock.fs_bsize));
 		initbarea(&inobuf, BT_INODES);
 		inobuf.b_un.b_buf = Malloc((unsigned)inobufsize);
 		if (inobuf.b_un.b_buf == NULL)
 			errx(EEXIT, "cannot allocate space for inode buffer");
 	}
 	/* Size of one on-disk inode for this filesystem format. */
 	dinosize = (sblock.fs_magic == FS_UFS1_MAGIC) ?
 	    sizeof(struct ufs1_dinode) : sizeof(struct ufs2_dinode);
 	fullcnt = inobufsize / dinosize;
 	readpercg = inosused / fullcnt;
 	partialcnt = inosused % fullcnt;
 	if (partialcnt != 0) {
 		/* The last read of the group is a short one. */
 		partialsize = fragroundup(&sblock, partialcnt * dinosize);
 		readpercg++;
 	} else {
 		/* inosused is a multiple of fullcnt: all reads are full. */
 		partialcnt = fullcnt;
 		partialsize = inobufsize;
 	}
 }
 
 /*
  * Inode-walk callback that frees the idesc->id_numfrags fragments starting
  * at idesc->id_blkno, updating the block map, the duplicate list and the
  * cylinder group free counts.
  *
  * Returns STOP for a snapshot inode, SKIP if a fragment is out of range,
  * and KEEPON otherwise (including when a snapshot claims the block).
  */
 int
 freeblock(struct inodesc *idesc)
 {
 	struct dups *dlp;
 	struct bufarea *cgbp;
 	struct cg *cgp;
 	ufs2_daddr_t blkno;
 	long size, nfrags;
 
 	blkno = idesc->id_blkno;
 	if (idesc->id_type == SNAP) {
 		pfatal("clearing a snapshot dinode\n");
 		return (STOP);
 	}
 	size = lfragtosize(&sblock, idesc->id_numfrags);
 	/* A non-zero return means a snapshot claimed the block. */
 	if (snapblkfree(&sblock, blkno, size, idesc->id_number,
 	    std_checkblkavail))
 		return (KEEPON);
 	for (nfrags = idesc->id_numfrags; nfrags > 0; blkno++, nfrags--) {
 		if (chkrange(blkno, 1)) {
 			return (SKIP);
 		} else if (testbmap(blkno)) {
 			for (dlp = duplist; dlp; dlp = dlp->next) {
 				if (dlp->dup != blkno)
 					continue;
 				/*
 				 * Remove this entry by overwriting it with
 				 * the head's value and freeing the head.
 				 */
 				dlp->dup = duplist->dup;
 				dlp = duplist;
 				duplist = duplist->next;
 				free((char *)dlp);
 				break;
 			}
 			/* dlp is NULL only if blkno was not on the dup list. */
 			if (dlp == NULL) {
 				clrbmap(blkno);
 				n_blks--;
 			}
 		}
 	}
 	/*
 	 * If all successfully returned, account for them.
 	 */
 	if (nfrags == 0) {
 		cgbp = cglookup(dtog(&sblock, idesc->id_blkno));
 		cgp = cgbp->b_un.b_cg;
 		if (idesc->id_numfrags == sblock.fs_frag)
 			cgp->cg_cs.cs_nbfree++;
 		else
 			cgp->cg_cs.cs_nffree += idesc->id_numfrags;
 		cgdirty(cgbp);
 	}
 	return (KEEPON);
 }
 
 /*
  * Prepare a snapshot file for being removed.
  */
 void
 snapremove(ino_t inum)
 {
 	struct inodesc idesc;
 	struct inode ip;
 	int i;
 
 	/* Use the cached copy if inum is on the active snapshot list. */
 	for (i = 0; i < snapcnt; i++)
 		if (snaplist[i].i_number == inum)
 			break;
 	if (i == snapcnt)
 		ginode(inum, &ip);
 	else
 		ip = snaplist[i];
 	if ((DIP(ip.i_dp, di_flags) & SF_SNAPSHOT) == 0) {
 		printf("snapremove: inode %jd is not a snapshot\n",
 		    (intmax_t)inum);
 		if (i == snapcnt)
 			irelse(&ip);
 		return;
 	}
 	if (debug)
 		printf("snapremove: remove %sactive snapshot %jd\n",
 		    i == snapcnt ? "in" : "", (intmax_t)inum);
 	/*
 	 * If on active snapshot list, remove it.
 	 */
 	if (i < snapcnt) {
 		/* Shift the later entries down over the removed slot. */
 		for (i++; i < FSMAXSNAP; i++) {
 			if (sblock.fs_snapinum[i] == 0)
 				break;
 			snaplist[i - 1] = snaplist[i];
 			sblock.fs_snapinum[i - 1] = sblock.fs_snapinum[i];
 		}
 		sblock.fs_snapinum[i - 1] = 0;
 		bzero(&snaplist[i - 1], sizeof(struct inode));
 		snapcnt--;
 	}
 	/*
 	 * ckinode() reads id_fix before setting it, so start from a zeroed
 	 * descriptor (as check_blkcnt() does) rather than stack garbage.
 	 */
 	memset(&idesc, 0, sizeof(struct inodesc));
 	idesc.id_type = SNAP;
 	idesc.id_func = snapclean;
 	idesc.id_number = inum;
 	(void)ckinode(ip.i_dp, &idesc);
 	DIP_SET(ip.i_dp, di_flags, DIP(ip.i_dp, di_flags) & ~SF_SNAPSHOT);
 	inodirty(&ip);
 	irelse(&ip);
 }
 
 /*
  * Inode-walk callback used by snapremove(): clear every block pointer
  * whose value is one of the snapshot markers BLK_NOCOPY or BLK_SNAP.
  * Always returns KEEPON.
  */
 static int
 snapclean(struct inodesc *idesc)
 {
 	ufs2_daddr_t blkno;
 	struct bufarea *bp;
 	union dinode *dp;
 
 	blkno = idesc->id_blkno;
 	if (blkno == 0)
 		return (KEEPON);
 
 	dp = idesc->id_dp;
 	if (blkno == BLK_NOCOPY || blkno == BLK_SNAP) {
 		if (idesc->id_lbn < UFS_NDADDR) {
 			/*
 			 * The pointer lives in the dinode itself, which
 			 * snapremove() marks dirty after the walk.  id_bp
 			 * is not set by ckinode() for direct blocks, so it
 			 * must not be touched here.
 			 */
 			DIP_SET(dp, di_db[idesc->id_lbn], 0);
 		} else {
 			/* The pointer lives in the indirect block id_bp. */
 			bp = idesc->id_bp;
 			IBLK_SET(bp, bp->b_index, 0);
 			dirty(bp);
 		}
 	}
 	return (KEEPON);
 }
 
 /*
  * Notification that a block is being freed. Return zero if the free
  * should be allowed to proceed. Return non-zero if the snapshot file
  * wants to claim the block. The block will be claimed if it is an
  * uncopied part of one of the snapshots. It will be freed if it is
  * either a BLK_NOCOPY or has already been copied in all of the snapshots.
  * If a fragment is being freed, then all snapshots that care about
  * it must make a copy since a snapshot file can only claim full sized
  * blocks. Note that if more than one snapshot file maps the block,
  * we can pick one at random to claim it. Since none of the snapshots
  * can change, we are assured that they will all see the same unmodified
  * image. When deleting a snapshot file (see ino_trunc above), we
  * must push any of these claimed blocks to one of the other snapshots
  * that maps it. These claimed blocks are easily identified as they will
  * have a block number equal to their logical block number within the
  * snapshot. A copied block can never have this property because they
  * must always have been allocated from a BLK_NOCOPY location.
  */
 int
-snapblkfree(fs, bno, size, inum, checkblkavail)
-	struct fs *fs;
-	ufs2_daddr_t bno;
-	long size;
-	ino_t inum;
-	ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t blkno, long frags);
+snapblkfree(struct fs *fs, ufs2_daddr_t bno, long size, ino_t inum,
+	ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t blkno, long frags))
 {
 	union dinode *dp;
 	struct inode ip;
 	struct bufarea *snapbp;
 	ufs_lbn_t lbn;
 	ufs2_daddr_t blkno, relblkno;
 	int i, frags, claimedblk, copydone;
 
 	/* If no snapshots, nothing to do */
 	if (snapcnt == 0)
 		return (0);
 	if (debug)
 		printf("snapblkfree: in ino %jd free blkno %jd, size %jd\n",
 		    (intmax_t)inum, (intmax_t)bno, (intmax_t)size);
 	/*
 	 * relblkno is the first fragment of the block containing bno; the
 	 * snapshot's logical block number for it is that block's index.
 	 */
 	relblkno = blknum(fs, bno);
 	lbn = fragstoblks(fs, relblkno);
 	/* Direct blocks are always pre-copied */
 	if (lbn < UFS_NDADDR)
 		return (0);
 	/* copydone: copybuf already holds the old block contents. */
 	copydone = 0;
 	claimedblk = 0;
 	for (i = 0; i < snapcnt; i++) {
 		/*
 		 * Lookup block being freed.
 		 */
 		ip = snaplist[i];
 		dp = ip.i_dp;
 		blkno = ino_blkatoff(dp, inum != 0 ? inum : ip.i_number,
 		    lbn, &frags, &snapbp);
 		/*
 		 * Check to see if block needs to be copied.
 		 */
 		if (blkno == 0) {
 			/*
 			 * A block that we map is being freed. If it has not
 			 * been claimed yet, we will claim or copy it (below).
 			 */
 			claimedblk = 1;
 		} else if (blkno == BLK_SNAP) {
 			/*
 			 * No previous snapshot claimed the block,
 			 * so it will be freed and become a BLK_NOCOPY
 			 * (don't care) for us.
 			 */
 			if (claimedblk)
 				pfatal("snapblkfree: inconsistent block type");
 			IBLK_SET(snapbp, snapbp->b_index, BLK_NOCOPY);
 			dirty(snapbp);
 			brelse(snapbp);
 			continue;
 		} else /* BLK_NOCOPY or default */ {
 			/*
 			 * If the snapshot has already copied the block
 			 * (default), or does not care about the block,
 			 * it is not needed.
 			 */
 			brelse(snapbp);
 			continue;
 		}
 		/*
 		 * If this is a full size block, we will just grab it
 		 * and assign it to the snapshot inode. Otherwise we
 		 * will proceed to copy it. See explanation for this
 		 * routine as to why only a single snapshot needs to
 		 * claim this block.
 		 */
 		if (size == fs->fs_bsize) {
 			if (debug)
 				printf("Grabonremove snapshot %ju lbn %jd "
 				    "from inum %ju\n", (intmax_t)ip.i_number,
 				    (intmax_t)lbn, (uintmax_t)inum);
 			IBLK_SET(snapbp, snapbp->b_index, relblkno);
 			dirty(snapbp);
 			brelse(snapbp);
 			DIP_SET(dp, di_blocks,
 			    DIP(dp, di_blocks) + btodb(size));
 			inodirty(&ip);
 			/* Tell the caller the block has been claimed. */
 			return (1);
 		}
 
 		/* First time through, read the contents of the old block. */
 		if (copydone == 0) {
 			copydone = 1;
 			if (blread(fsreadfd, copybuf, fsbtodb(fs, relblkno),
 			    fs->fs_bsize) != 0) {
 				pfatal("Could not read snapshot %ju block "
 				    "%jd\n", (intmax_t)ip.i_number,
 				    (intmax_t)relblkno);
 				continue;
 			}
 		}
 		/*
 		 * This allocation will never require any additional
 		 * allocations for the snapshot inode.
 		 */
 		blkno = allocblk(dtog(fs, relblkno), fs->fs_frag,
 		    checkblkavail);
 		if (blkno == 0) {
 			pfatal("Could not allocate block for snapshot %ju\n",
 			    (intmax_t)ip.i_number);
 			continue;
 		}
 		if (debug)
 			printf("Copyonremove: snapino %jd lbn %jd for inum %ju "
 			    "size %ld new blkno %jd\n", (intmax_t)ip.i_number,
 			    (intmax_t)lbn, (uintmax_t)inum, size,
 			    (intmax_t)blkno);
 		/* Write the saved contents and point the snapshot at them. */
 		blwrite(fswritefd, copybuf, fsbtodb(fs, blkno), fs->fs_bsize);
 		IBLK_SET(snapbp, snapbp->b_index, blkno);
 		dirty(snapbp);
 		brelse(snapbp);
 		DIP_SET(dp, di_blocks,
 		    DIP(dp, di_blocks) + btodb(fs->fs_bsize));
 		inodirty(&ip);
 	}
 	/* No snapshot claimed the block; the caller may free it. */
 	return (0);
 }
 
 /*
  * Notification that a block is being written. Return if the block
  * is part of a snapshot as snapshots never track other snapshots.
  * The block will be copied in all of the snapshots that are tracking
  * it and have not yet copied it. Some buffers may hold more than one
  * block. Here we need to check each block in the buffer.
  */
 void
-copyonwrite(fs, bp, checkblkavail)
-	struct fs *fs;
-	struct bufarea *bp;
-	ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t blkno, long frags);
+copyonwrite(struct fs *fs, struct bufarea *bp,
+	ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t blkno, long frags))
 {
 	ufs2_daddr_t copyblkno;
 	long i, numblks;
 
 	/* If no snapshots, nothing to do. */
 	if (snapcnt == 0)
 		return;
 	/* Number of filesystem blocks covered by the buffer, rounded up. */
 	numblks = blkroundup(fs, bp->b_size) / fs->fs_bsize;
 	if (debug)
 		prtbuf(bp, "copyonwrite: checking %jd block%s in buffer",
 		    (intmax_t)numblks, numblks > 1 ? "s" : "");
 	/* First fragment of the block containing the buffer's disk address. */
 	copyblkno = blknum(fs, dbtofsb(fs, bp->b_bno));
 	/* Check each block in turn; blocks are fs_frag fragments apart. */
 	for (i = 0; i < numblks; i++) {
 		chkcopyonwrite(fs, copyblkno, checkblkavail);
 		copyblkno += fs->fs_frag;
 	}
 }
 
 /*
  * For the block starting at fragment copyblkno, give every snapshot whose
  * entry for that block is zero its own copy of the current contents.
  */
 static void
-chkcopyonwrite(fs, copyblkno, checkblkavail)
-	struct fs *fs;
-	ufs2_daddr_t copyblkno;
-	ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t blkno, long frags);
+chkcopyonwrite(struct fs *fs, ufs2_daddr_t copyblkno,
+	ufs2_daddr_t (*checkblkavail)(ufs2_daddr_t blkno, long frags))
 {
 	struct inode ip;
 	union dinode *dp;
 	struct bufarea *snapbp;
 	ufs2_daddr_t blkno;
 	int i, frags, copydone;
 	ufs_lbn_t lbn;
 
 	lbn = fragstoblks(fs, copyblkno);
 	/* Direct blocks are always pre-copied */
 	if (lbn < UFS_NDADDR)
 		return;
 	/* copydone: copybuf already holds the old block contents. */
 	copydone = 0;
 	for (i = 0; i < snapcnt; i++) {
 		/*
 		 * Lookup block being freed.
 		 */
 		ip = snaplist[i];
 		dp = ip.i_dp;
 		blkno = ino_blkatoff(dp, ip.i_number, lbn, &frags, &snapbp);
 		/*
 		 * Check to see if block needs to be copied.
 		 */
 		if (blkno != 0) {
 			/*
 			 * A block that we have already copied or don't track.
 			 */
 			brelse(snapbp);
 			continue;
 		}
 		/* First time through, read the contents of the old block. */
 		if (copydone == 0) {
 			copydone = 1;
 			if (blread(fsreadfd, copybuf, fsbtodb(fs, copyblkno),
 			    fs->fs_bsize) != 0) {
 				pfatal("Could not read snapshot %ju block "
 				    "%jd\n", (intmax_t)ip.i_number,
 				    (intmax_t)copyblkno);
 				continue;
 			}
 		}
 		/*
 		 * This allocation will never require any additional
 		 * allocations for the snapshot inode.
 		 */
 		if ((blkno = allocblk(dtog(fs, copyblkno), fs->fs_frag,
 		    checkblkavail)) == 0) {
 			pfatal("Could not allocate block for snapshot %ju\n",
 			    (intmax_t)ip.i_number);
 			continue;
 		}
 		if (debug)
 			prtbuf(snapbp, "Copyonwrite: snapino %jd lbn %jd using "
 			    "blkno %ju setting in buffer",
 			    (intmax_t)ip.i_number, (intmax_t)lbn,
 			    (intmax_t)blkno);
 		/* Write the saved contents and point the snapshot at them. */
 		blwrite(fswritefd, copybuf, fsbtodb(fs, blkno), fs->fs_bsize);
 		IBLK_SET(snapbp, snapbp->b_index, blkno);
 		dirty(snapbp);
 		brelse(snapbp);
 		DIP_SET(dp, di_blocks,
 		    DIP(dp, di_blocks) + btodb(fs->fs_bsize));
 		inodirty(&ip);
 	}
 	return;
 }
 
 /*
  * Traverse an inode and check that its block count is correct
  * fixing it if necessary.
  */
 void
 check_blkcnt(struct inode *ip)
 {
 	struct inodesc idesc;
 	union dinode *dp;
 	ufs2_daddr_t ndb;
 	int j, ret, offset;
 
 	dp = ip->i_dp;
 	/* Walk the inode with pass1check, which tallies into id_entryno. */
 	memset(&idesc, 0, sizeof(struct inodesc));
 	idesc.id_func = pass1check;
 	idesc.id_number = ip->i_number;
 	idesc.id_type = (DIP(dp, di_flags) & SF_SNAPSHOT) == 0 ? ADDR : SNAP;
 	(void)ckinode(dp, &idesc);
 	/* ckinode() does not visit the UFS2 external attribute blocks. */
 	if (sblock.fs_magic == FS_UFS2_MAGIC && dp->dp2.di_extsize > 0) {
 		ndb = howmany(dp->dp2.di_extsize, sblock.fs_bsize);
 		for (j = 0; j < UFS_NXADDR; j++) {
 			/* The last extattr block may be a partial block. */
 			if (--ndb == 0 &&
 			    (offset = blkoff(&sblock, dp->dp2.di_extsize)) != 0)
 				idesc.id_numfrags = numfrags(&sblock,
 				    fragroundup(&sblock, offset));
 			else
 				idesc.id_numfrags = sblock.fs_frag;
 			if (dp->dp2.di_extb[j] == 0)
 				continue;
 			idesc.id_blkno = dp->dp2.di_extb[j];
 			ret = (*idesc.id_func)(&idesc);
 			if (ret & STOP)
 				break;
 		}
 	}
 	/* Scale the tally to the units used by di_blocks. */
 	idesc.id_entryno *= btodb(sblock.fs_fsize);
 	if (DIP(dp, di_blocks) != idesc.id_entryno) {
 		/* The message is suppressed when preening a sujrecovery run. */
 		if (!(sujrecovery && preen)) {
 			pwarn("INCORRECT BLOCK COUNT I=%lu (%ju should be %ju)",
 			    (u_long)idesc.id_number,
 			    (uintmax_t)DIP(dp, di_blocks),
 			    (uintmax_t)idesc.id_entryno);
 			if (preen)
 				printf(" (CORRECTED)\n");
 			else if (reply("CORRECT") == 0)
 				return;
 		}
 		if (bkgrdflag == 0) {
 			DIP_SET(dp, di_blocks, idesc.id_entryno);
 			inodirty(ip);
 		} else {
 			/* Background run: pass the adjustment via sysctl. */
 			cmd.value = idesc.id_number;
 			cmd.size = idesc.id_entryno - DIP(dp, di_blocks);
 			if (debug)
 				printf("adjblkcnt ino %ju amount %lld\n",
 				    (uintmax_t)cmd.value, (long long)cmd.size);
 			if (sysctl(adjblkcnt, MIBSIZE, 0, 0,
 			    &cmd, sizeof cmd) == -1)
 				rwerror("ADJUST INODE BLOCK COUNT", cmd.value);
 		}
 	}
 }
 
 /*
  * Write back and release the getnextinode() buffer, then re-read the
  * buffers of all snapshot inodes from disk.
  */
 void
 freeinodebuf(void)
 {
 	struct bufarea *snapbuf;
 	int idx;
 
 	/* Push out any pending modifications before dropping the buffer. */
 	flush(fswritefd, &inobuf);
 	/* free() accepts NULL, so no guard is needed. */
 	free((char *)inobuf.b_un.b_buf);
 	inobuf.b_un.b_buf = NULL;
 	/* Empty the [firstinum, lastinum) range that ginode() consults. */
 	lastinum = 0;
 	firstinum = 0;
 	/*
 	 * Reload the snapshot inodes in case any of them changed.
 	 */
 	for (idx = 0; idx < snapcnt; idx++) {
 		snapbuf = snaplist[idx].i_bp;
 		snapbuf->b_errs = blread(fsreadfd, snapbuf->b_un.b_buf,
 		    snapbuf->b_bno, snapbuf->b_size);
 	}
 }
 
 /*
  * Routines to maintain information about directory inodes.
  * This is built during the first pass and used during the
  * second and third passes.
  *
  * Enter inodes into the cache.
  */
 struct inoinfo *
 cacheino(union dinode *dp, ino_t inumber)
 {
 	struct inoinfo *entry;
 	int idx, nblks, ndirect;
 
 	if (getinoinfo(inumber) != NULL)
 		pfatal("cacheino: duplicate entry for ino %jd\n",
 		    (intmax_t)inumber);
 	/*
 	 * Number of block pointers to remember: one slot for an empty
 	 * file, every direct and indirect slot once the file is too big
 	 * for its direct blocks, otherwise just the direct blocks in use.
 	 */
 	nblks = 1;
 	if (howmany(DIP(dp, di_size), sblock.fs_bsize) > UFS_NDADDR)
 		nblks = UFS_NDADDR + UFS_NIADDR;
 	else if (DIP(dp, di_size) > 0)
 		nblks = howmany(DIP(dp, di_size), sblock.fs_bsize);
 	entry = (struct inoinfo *)
 		Malloc(sizeof(*entry) + (nblks - 1) * sizeof(ufs2_daddr_t));
 	if (entry == NULL)
 		errx(EEXIT, "cannot increase directory list");
 	SLIST_INSERT_HEAD(&inphash[inumber % dirhash], entry, i_hash);
 	entry->i_flags = 0;
 	entry->i_parent = inumber == UFS_ROOTINO ? UFS_ROOTINO : (ino_t)0;
 	entry->i_dotdot = (ino_t)0;
 	entry->i_number = inumber;
 	entry->i_isize = DIP(dp, di_size);
 	entry->i_numblks = nblks;
 	/* Copy the direct pointers, then the indirect ones if present. */
 	ndirect = MIN(nblks, UFS_NDADDR);
 	for (idx = 0; idx < ndirect; idx++)
 		entry->i_blks[idx] = DIP(dp, di_db[idx]);
 	if (nblks > UFS_NDADDR) {
 		for (idx = 0; idx < UFS_NIADDR; idx++)
 			entry->i_blks[UFS_NDADDR + idx] = DIP(dp, di_ib[idx]);
 	}
 	/* Grow the sorted list in steps of 100 entries when it is full. */
 	if (inplast == listmax) {
 		listmax += 100;
 		inpsort = (struct inoinfo **)reallocarray((char *)inpsort,
 		    listmax, sizeof(struct inoinfo *));
 		if (inpsort == NULL)
 			errx(EEXIT, "cannot increase directory list");
 	}
 	inpsort[inplast++] = entry;
 	return (entry);
 }
 
 /*
  * Find the cached inoinfo for inumber on its hash chain.
  * Returns the entry, or NULL when the inode is not cached.
  */
 struct inoinfo *
 getinoinfo(ino_t inumber)
 {
 	struct inoinfo *cur;
 
 	SLIST_FOREACH(cur, &inphash[inumber % dirhash], i_hash) {
 		if (cur->i_number == inumber)
 			return (cur);
 	}
 	return (NULL);
 }
 
 /*
  * Drop inumber from both the hash chain and the inpsort array and free
  * its inoinfo.  The vacated inpsort slot is filled with the last array
  * element.  Returns 0 on success; on failure reports which list lacked
  * the entry via pfatal() and returns 1.
  */
 int
 removecachedino(ino_t inumber)
 {
 	struct inoinfo *victim, **slot;
 	char *listtype;
 
 	victim = getinoinfo(inumber);
 	if (victim == NULL) {
 		listtype = "hash";
 	} else {
 		SLIST_REMOVE(&inphash[inumber % dirhash], victim, inoinfo,
 		    i_hash);
 		slot = &inpsort[inplast - 1];
 		while (slot >= inpsort) {
 			if (*slot == victim) {
 				*slot = inpsort[inplast - 1];
 				inplast--;
 				free(victim);
 				return (0);
 			}
 			slot--;
 		}
 		listtype = "sort";
 	}
 	pfatal("removecachedino: entry for ino %jd not found on %s list\n",
 	    (intmax_t)inumber, listtype);
 	return (1);
 }
 
 /*
  * Clean up all the inode cache structure.
  *
  * Frees every inoinfo referenced from inpsort, then the hash table and
  * the sort array themselves, and sets both table pointers to NULL.
  * Does nothing when the hash table was never allocated.
  */
 void
 inocleanup(void)
 {
 	struct inoinfo **inpp, **inpend;
 
 	if (inphash == NULL)
 		return;
 	/*
 	 * Walk forward up to the one-past-the-end slot.  Walking backward
 	 * from &inpsort[inplast - 1] would form a pointer before the start
 	 * of the array (always, once the loop terminates, and immediately
 	 * when inplast is 0), which is undefined behavior.
 	 */
 	inpend = &inpsort[inplast];
 	for (inpp = inpsort; inpp < inpend; inpp++)
 		free((char *)(*inpp));
 	free((char *)inphash);
 	inphash = NULL;
 	free((char *)inpsort);
 	inpsort = NULL;
 }
 
 /*
  * Mark the buffer holding ip's on-disk inode as dirty.  On UFS2 the
  * dinode check-hash is refreshed first.
  */
 void
 inodirty(struct inode *ip)
 {
 
 	if (sblock.fs_magic == FS_UFS2_MAGIC) {
 		struct ufs2_dinode *dip2 = (struct ufs2_dinode *)ip->i_dp;
 
 		ffs_update_dinode_ckhash(&sblock, dip2);
 	}
 	dirty(ip->i_bp);
 }
 
 /*
  * Offer to clear the inode named by idesc->id_number.
  *
  * When flag is 1 a warning line ("<type> DIR|FILE" plus the inode
  * details) is printed first.  The inode is cleared when preening or
  * when the operator answers yes to "CLEAR".  In foreground mode the
  * blocks are walked with ckinode() and the inode is zeroed; in
  * background mode the adjustment is handed to the kernel through the
  * adjrefcnt sysctl.
  */
 void
 clri(struct inodesc *idesc, const char *type, int flag)
 {
 	struct inode ip;
 	union dinode *dino;
 	const char *kind;
 
 	ginode(idesc->id_number, &ip);
 	dino = ip.i_dp;
 	if (flag == 1) {
 		kind = "FILE";
 		if ((DIP(dino, di_mode) & IFMT) == IFDIR)
 			kind = "DIR";
 		pwarn("%s %s", type, kind);
 		prtinode(&ip);
 		printf("\n");
 	}
 	/* Nothing to do unless preening or the operator agrees. */
 	if (!preen && reply("CLEAR") != 1) {
 		irelse(&ip);
 		return;
 	}
 	if (preen)
 		printf(" (CLEARED)\n");
 	n_files--;
 	if (bkgrdflag != 0) {
 		/* Background check: ask the kernel to drop the links. */
 		cmd.value = idesc->id_number;
 		cmd.size = -DIP(dino, di_nlink);
 		if (debug)
 			printf("adjrefcnt ino %ld amt %lld\n",
 			    (long)cmd.value, (long long)cmd.size);
 		if (sysctl(adjrefcnt, MIBSIZE, 0, 0,
 		    &cmd, sizeof cmd) == -1)
 			rwerror("ADJUST INODE", cmd.value);
 	} else {
 		if (idesc->id_type == SNAP) {
 			snapremove(idesc->id_number);
 			idesc->id_type = ADDR;
 		}
 		(void)ckinode(dino, idesc);
 		inoinfo(idesc->id_number)->ino_state = USTATE;
 		clearinode(dino);
 		inodirty(&ip);
 	}
 	irelse(&ip);
 }
 
 /*
  * Directory-scan callback: locate the entry (past the first two) whose
  * inode number equals idesc->id_parent and copy its name, including
  * the terminating NUL, into idesc->id_name.
  */
 int
 findname(struct inodesc *idesc)
 {
 	struct direct *entry = idesc->id_dirp;
 
 	if (entry->d_ino == idesc->id_parent && idesc->id_entryno >= 2) {
 		memmove(idesc->id_name, entry->d_name,
 		    (size_t)entry->d_namlen + 1);
 		return (STOP|FOUND);
 	}
 	idesc->id_entryno++;
 	return (KEEPON);
 }
 
 /*
  * Directory-scan callback: look for an in-use entry named
  * idesc->id_name whose inode number lies in [UFS_ROOTINO, maxino].
  * On a hit the inode number is stored in idesc->id_parent.
  */
 int
 findino(struct inodesc *idesc)
 {
 	struct direct *entry = idesc->id_dirp;
 
 	/* Skip empty slots and inode numbers outside the valid range. */
 	if (entry->d_ino == 0 ||
 	    entry->d_ino < UFS_ROOTINO || entry->d_ino > maxino)
 		return (KEEPON);
 	if (strcmp(entry->d_name, idesc->id_name) != 0)
 		return (KEEPON);
 	idesc->id_parent = entry->d_ino;
 	return (STOP|FOUND);
 }
 
 /*
  * Directory-scan callback: zero the inode number of the first entry
  * (past the first two) that refers to idesc->id_parent.
  */
 int
 clearentry(struct inodesc *idesc)
 {
 	struct direct *entry = idesc->id_dirp;
 
 	if (entry->d_ino == idesc->id_parent && idesc->id_entryno >= 2) {
 		entry->d_ino = 0;
 		return (STOP|FOUND|ALTERED);
 	}
 	idesc->id_entryno++;
 	return (KEEPON);
 }
 
 /*
  * Print a one-inode summary: number, owner (name when resolvable,
  * otherwise the numeric uid), mode, size and modification time.
  * Only the inode number is printed when it is out of range.
  */
 void
 prtinode(struct inode *ip)
 {
 	union dinode *dino = ip->i_dp;
 	struct passwd *owner;
 	char *stamp;
 	time_t mtime;
 
 	printf(" I=%lu ", (u_long)ip->i_number);
 	if (ip->i_number < UFS_ROOTINO || ip->i_number > maxino)
 		return;
 	printf(" OWNER=");
 	owner = getpwuid((int)DIP(dino, di_uid));
 	if (owner == NULL)
 		printf("%u ", (unsigned)DIP(dino, di_uid));
 	else
 		printf("%s ", owner->pw_name);
 	printf("MODE=%o\n", DIP(dino, di_mode));
 	if (preen)
 		printf("%s: ", cdevname);
 	printf("SIZE=%ju ", (uintmax_t)DIP(dino, di_size));
 	mtime = DIP(dino, di_mtime);
 	stamp = ctime(&mtime);
 	/* Print the month/day/time and year fields of the ctime string. */
 	if (stamp != NULL)
 		printf("MTIME=%12.12s %4.4s ", stamp + 4, stamp + 20);
 }
 
 /*
  * Report a bad block reference and move the owning inode into the
  * matching "to be cleared" state: file states become FCLEAR and
  * directory states become DCLEAR.  Inodes already in a clear state
  * are left alone; any other state is a fatal internal error.
  */
 void
 blkerror(ino_t ino, const char *type, ufs2_daddr_t blk)
 {
 	int state;
 
 	pfatal("%jd %s I=%ju", (intmax_t)blk, type, (uintmax_t)ino);
 	printf("\n");
 	state = inoinfo(ino)->ino_state;
 	if (state == FSTATE || state == FZLINK) {
 		inoinfo(ino)->ino_state = FCLEAR;
 	} else if (state == DSTATE || state == DZLINK) {
 		inoinfo(ino)->ino_state = DCLEAR;
 	} else if (state != FCLEAR && state != DCLEAR) {
 		errx(EEXIT, "BAD STATE %d TO BLKERR", inoinfo(ino)->ino_state);
 		/* NOTREACHED */
 	}
 }
 
 /*
  * allocate an unused inode
  *
  * request: inode number wanted, or 0 to take the first unallocated
  *          inode at or after UFS_ROOTINO.
  * type:    mode for the new inode; its IFMT bits must be IFDIR, IFREG
  *          or IFLNK.
  *
  * Returns the allocated inode number, or 0 when the type is
  * unsupported, the requested inode is not free, no free inode exists,
  * the cylinder group fails its magic check (for a specific request),
  * or no data block could be allocated.
  */
 ino_t
 allocino(ino_t request, int type)
 {
 	ino_t ino;
 	struct inode ip;
 	union dinode *dp;
 	struct bufarea *cgbp;
 	struct cg *cgp;
 	int cg, anyino;
 
 	/*
 	 * Reject unsupported file types up front.  Checking only after
 	 * the inode bitmap and free count have been updated would leave
 	 * the in-core cylinder group claiming an inode that was never
 	 * handed out.
 	 */
 	switch (type & IFMT) {
 	case IFDIR:
 	case IFREG:
 	case IFLNK:
 		break;
 	default:
 		return (0);
 	}
 	anyino = 0;
 	if (request == 0) {
 		request = UFS_ROOTINO;
 		anyino = 1;
 	} else if (inoinfo(request)->ino_state != USTATE)
 		return (0);
 retry:
 	for (ino = request; ino < maxino; ino++)
 		if (inoinfo(ino)->ino_state == USTATE)
 			break;
 	if (ino >= maxino)
 		return (0);
 	cg = ino_to_cg(&sblock, ino);
 	cgbp = cglookup(cg);
 	cgp = cgbp->b_un.b_cg;
 	if (!check_cgmagic(cg, cgbp, 0)) {
 		if (anyino == 0)
 			return (0);
 		/* Unusable group: resume the search in the next one. */
 		request = (cg + 1) * sblock.fs_ipg;
 		goto retry;
 	}
 	setbit(cg_inosused(cgp), ino % sblock.fs_ipg);
 	cgp->cg_cs.cs_nifree--;
 	if ((type & IFMT) == IFDIR) {
 		inoinfo(ino)->ino_state = DSTATE;
 		cgp->cg_cs.cs_ndir++;
 	} else {
 		/* IFREG or IFLNK; anything else was rejected above. */
 		inoinfo(ino)->ino_state = FSTATE;
 	}
 	cgdirty(cgbp);
 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	DIP_SET(dp, di_db[0], allocblk(ino_to_cg(&sblock, ino), (long)1,
 	    std_checkblkavail));
 	if (DIP(dp, di_db[0]) == 0) {
 		inoinfo(ino)->ino_state = USTATE;
 		irelse(&ip);
 		return (0);
 	}
 	DIP_SET(dp, di_mode, type);
 	DIP_SET(dp, di_flags, 0);
 	DIP_SET(dp, di_atime, time(NULL));
 	DIP_SET(dp, di_ctime, DIP(dp, di_atime));
 	DIP_SET(dp, di_mtime, DIP(dp, di_ctime));
 	DIP_SET(dp, di_mtimensec, 0);
 	DIP_SET(dp, di_ctimensec, 0);
 	DIP_SET(dp, di_atimensec, 0);
 	/* The new inode starts out owning a single fragment. */
 	DIP_SET(dp, di_size, sblock.fs_fsize);
 	DIP_SET(dp, di_blocks, btodb(sblock.fs_fsize));
 	n_files++;
 	inodirty(&ip);
 	irelse(&ip);
 	inoinfo(ino)->ino_type = IFTODT(type);
 	return (ino);
 }
 
 /*
  * Deallocate an inode: walk its blocks with freeblock(), zero the
  * on-disk inode, mark it unallocated and drop the file count.
  */
 void
 freeino(ino_t ino)
 {
 	struct inode ip;
 	struct inodesc freedesc;
 
 	memset(&freedesc, 0, sizeof(freedesc));
 	freedesc.id_number = ino;
 	freedesc.id_func = freeblock;
 	freedesc.id_type = ADDR;
 	ginode(ino, &ip);
 	(void)ckinode(ip.i_dp, &freedesc);
 	clearinode(ip.i_dp);
 	inodirty(&ip);
 	irelse(&ip);
 	n_files--;
 	inoinfo(ino)->ino_state = USTATE;
 }
diff --git a/sbin/fsck_ffs/pass2.c b/sbin/fsck_ffs/pass2.c
index 4e17863ef04c..abe14549e6f4 100644
--- a/sbin/fsck_ffs/pass2.c
+++ b/sbin/fsck_ffs/pass2.c
@@ -1,733 +1,734 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 1980, 1986, 1993
  *	The Regents of the University of California.  All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  * 3. Neither the name of the University nor the names of its contributors
  *    may be used to endorse or promote products derived from this software
  *    without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #if 0
 #ifndef lint
 static const char sccsid[] = "@(#)pass2.c	8.9 (Berkeley) 4/28/95";
 #endif /* not lint */
 #endif
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/sysctl.h>
 
 #include <ufs/ufs/dinode.h>
 #include <ufs/ufs/dir.h>
 #include <ufs/ffs/fs.h>
 
 #include <err.h>
 #include <errno.h>
 #include <stdint.h>
 #include <string.h>
 
 #include "fsck.h"
 
 #define MINDIRSIZE	(sizeof (struct dirtemplate))
 
 static int fix_extraneous(struct inoinfo *, struct inodesc *);
 static int deleteentry(struct inodesc *);
 static int blksort(const void *, const void *);
 static int pass2check(struct inodesc *);
 
 /*
  * Pass 2: check directory structure.
  *
  * 1. Make sure the root inode is an allocated directory, offering to
  *    allocate, reallocate or fix it as needed.
  * 2. Sort the cached directory list by first block and run
  *    pass2check() over the entries of every directory.
  * 3. With all parents known, verify each directory's ".." entry and
  *    repair it (directly, or through kernel sysctls when running on a
  *    snapshot).
  * 4. Call propagate() to mark every directory reachable from the root.
  */
 void
 pass2(void)
 {
 	struct inode ip;
 	union dinode *dp;
 	struct inoinfo **inpp, *inp;
 	struct inoinfo **inpend;
 	struct inodesc curino;
 	union dinode dino;
 	int i;
 	char pathbuf[MAXPATHLEN + 1];
 
 	/* Step 1: bring the root inode into a usable directory state. */
 	switch (inoinfo(UFS_ROOTINO)->ino_state) {
 
 	case USTATE:
 		pfatal("ROOT INODE UNALLOCATED");
 		if (reply("ALLOCATE") == 0) {
 			ckfini(0);
 			exit(EEXIT);
 		}
 		if (allocdir(UFS_ROOTINO, UFS_ROOTINO, 0755) != UFS_ROOTINO)
 			errx(EEXIT, "CANNOT ALLOCATE ROOT INODE");
 		break;
 
 	case DCLEAR:
 		pfatal("DUPS/BAD IN ROOT INODE");
 		if (reply("REALLOCATE")) {
 			freedirino(UFS_ROOTINO, UFS_ROOTINO);
 			if (allocdir(UFS_ROOTINO, UFS_ROOTINO, 0755) !=
 			    UFS_ROOTINO)
 				errx(EEXIT, "CANNOT ALLOCATE ROOT INODE");
 			break;
 		}
 		if (reply("CONTINUE") == 0) {
 			ckfini(0);
 			exit(EEXIT);
 		}
 		break;
 
 	case FSTATE:
 	case FCLEAR:
 	case FZLINK:
 		pfatal("ROOT INODE NOT DIRECTORY");
 		if (reply("REALLOCATE")) {
 			freeino(UFS_ROOTINO);
 			if (allocdir(UFS_ROOTINO, UFS_ROOTINO, 0755) !=
 			    UFS_ROOTINO)
 				errx(EEXIT, "CANNOT ALLOCATE ROOT INODE");
 			break;
 		}
 		if (reply("FIX") == 0) {
 			ckfini(0);
 			exit(EEXIT);
 		}
 		/* Keep the inode but force its file type to directory. */
 		ginode(UFS_ROOTINO, &ip);
 		dp = ip.i_dp;
 		DIP_SET(dp, di_mode, DIP(dp, di_mode) & ~IFMT);
 		DIP_SET(dp, di_mode, DIP(dp, di_mode) | IFDIR);
 		inodirty(&ip);
 		irelse(&ip);
 		break;
 
 	case DSTATE:
 	case DZLINK:
 		break;
 
 	default:
 		errx(EEXIT, "BAD STATE %d FOR ROOT INODE",
 		    inoinfo(UFS_ROOTINO)->ino_state);
 	}
 	inoinfo(UFS_ROOTINO)->ino_state = DFOUND;
 	/* Record the whiteout inode as a file of type DT_WHT. */
 	inoinfo(UFS_WINO)->ino_state = FSTATE;
 	inoinfo(UFS_WINO)->ino_type = DT_WHT;
 	/*
 	 * Sort the directory list into disk block order.
 	 */
 	qsort((char *)inpsort, (size_t)inplast, sizeof *inpsort, blksort);
 	/*
 	 * Check the integrity of each directory.
 	 */
 	memset(&curino, 0, sizeof(struct inodesc));
 	curino.id_type = DATA;
 	curino.id_func = pass2check;
 	inpend = &inpsort[inplast];
 	for (inpp = inpsort; inpp < inpend; inpp++) {
 		/* Progress reporting requested through signal flags. */
 		if (got_siginfo) {
 			printf("%s: phase 2: dir %td of %d (%d%%)\n", cdevname,
 			    inpp - inpsort, (int)inplast,
 			    (int)((inpp - inpsort) * 100 / inplast));
 			got_siginfo = 0;
 		}
 		if (got_sigalarm) {
 			setproctitle("%s p2 %d%%", cdevname,
 			    (int)((inpp - inpsort) * 100 / inplast));
 			got_sigalarm = 0;
 		}
 		inp = *inpp;
 		/* Zero-length directories have no entries to examine. */
 		if (inp->i_isize == 0)
 			continue;
 		if (inp->i_isize < MINDIRSIZE) {
 			direrror(inp->i_number, "DIRECTORY TOO SHORT");
 			/*
 			 * The cached size is bumped unconditionally so the
 			 * scan below proceeds; the on-disk size changes only
 			 * if the operator agrees.
 			 */
 			inp->i_isize = roundup(MINDIRSIZE, DIRBLKSIZ);
 			if (reply("FIX") == 1) {
 				ginode(inp->i_number, &ip);
 				DIP_SET(ip.i_dp, di_size, inp->i_isize);
 				inodirty(&ip);
 				irelse(&ip);
 			}
 		} else if ((inp->i_isize & (DIRBLKSIZ - 1)) != 0) {
 			getpathname(pathbuf, inp->i_number, inp->i_number);
 			if (usedsoftdep)
 				pfatal("%s %s: LENGTH %jd NOT MULTIPLE OF %d",
 					"DIRECTORY", pathbuf,
 					(intmax_t)inp->i_isize, DIRBLKSIZ);
 			else
 				pwarn("%s %s: LENGTH %jd NOT MULTIPLE OF %d",
 					"DIRECTORY", pathbuf,
 					(intmax_t)inp->i_isize, DIRBLKSIZ);
 			if (preen)
 				printf(" (ADJUSTED)\n");
 			inp->i_isize = roundup(inp->i_isize, DIRBLKSIZ);
 			if (preen || reply("ADJUST") == 1) {
 				ginode(inp->i_number, &ip);
 				/*
 				 * i_isize was rounded up just above, so this
 				 * second roundup leaves the value unchanged.
 				 */
 				DIP_SET(ip.i_dp, di_size,
 				    roundup(inp->i_isize, DIRBLKSIZ));
 				inodirty(&ip);
 				irelse(&ip);
 			}
 		}
 		/*
 		 * Build a scratch dinode from the cached size and block
 		 * pointers and hand it to ckinode(), which invokes
 		 * pass2check() through curino.id_func.
 		 */
 		dp = &dino;
 		memset(dp, 0, sizeof(struct ufs2_dinode));
 		DIP_SET(dp, di_mode, IFDIR);
 		DIP_SET(dp, di_size, inp->i_isize);
 		for (i = 0; i < MIN(inp->i_numblks, UFS_NDADDR); i++)
 			DIP_SET(dp, di_db[i], inp->i_blks[i]);
 		if (inp->i_numblks > UFS_NDADDR)
 			for (i = 0; i < UFS_NIADDR; i++)
 				DIP_SET(dp, di_ib[i],
 				    inp->i_blks[UFS_NDADDR + i]);
 		curino.id_number = inp->i_number;
 		curino.id_parent = inp->i_parent;
 		(void)ckinode(dp, &curino);
 	}
 	/*
 	 * Now that the parents of all directories have been found,
 	 * make another pass to verify the value of `..'
 	 */
 	for (inpp = inpsort; inpp < inpend; inpp++) {
 		inp = *inpp;
 		if (inp->i_parent == 0 || inp->i_isize == 0)
 			continue;
 		if (inoinfo(inp->i_parent)->ino_state == DFOUND &&
 		    INO_IS_DUNFOUND(inp->i_number))
 			inoinfo(inp->i_number)->ino_state = DFOUND;
 		/*
 		 * Nothing to do when ".." is already right, or when
 		 * pass2check() stored (ino_t)-1 because the operator
 		 * declined the ".." repair.
 		 */
 		if (inp->i_dotdot == inp->i_parent ||
 		    inp->i_dotdot == (ino_t)-1)
 			continue;
 		if (inp->i_dotdot == 0) {
 			/* ".." fix was deferred until the parent was known. */
 			inp->i_dotdot = inp->i_parent;
 			if (debug)
 				fileerror(inp->i_parent, inp->i_number,
 				    "DEFERRED MISSING '..' FIX");
 			(void)makeentry(inp->i_number, inp->i_parent, "..");
 			inoinfo(inp->i_parent)->ino_linkcnt--;
 			continue;
 		}
 		/*
 		 * Here we have:
 		 *    inp->i_number is directory with bad ".." in it.
 		 *    inp->i_dotdot is current value of "..".
 		 *    inp->i_parent is directory to which ".." should point.
 		 */
 		getpathname(pathbuf, inp->i_parent, inp->i_number);
 		printf("BAD INODE NUMBER FOR '..' in DIR I=%ju (%s)\n",
 		    (uintmax_t)inp->i_number, pathbuf);
 		getpathname(pathbuf, inp->i_dotdot, inp->i_dotdot);
 		printf("CURRENTLY POINTS TO I=%ju (%s), ",
 		    (uintmax_t)inp->i_dotdot, pathbuf);
 		getpathname(pathbuf, inp->i_parent, inp->i_parent);
 		printf("SHOULD POINT TO I=%ju (%s)",
 		    (uintmax_t)inp->i_parent, pathbuf);
 		if (cursnapshot != 0) {
 			/*
 			 * We need to:
 			 *    setcwd(inp->i_number);
 			 *    setdotdot(inp->i_dotdot, inp->i_parent);
 			 */
 			cmd.value = inp->i_number;
 			if (sysctlbyname("vfs.ffs.setcwd", 0, 0,
 			    &cmd, sizeof cmd) == -1) {
 				/* kernel lacks support for these functions */
 				printf(" (IGNORED)\n");
 				continue;
 			}
 			cmd.value = inp->i_dotdot; /* verify same value */
 			cmd.size = inp->i_parent;  /* new parent */
 			if (sysctlbyname("vfs.ffs.setdotdot", 0, 0,
 			    &cmd, sizeof cmd) == -1) {
 				printf(" (FIX FAILED: %s)\n", strerror(errno));
 				continue;
 			}
 			printf(" (FIXED)\n");
 			inoinfo(inp->i_parent)->ino_linkcnt--;
 			inp->i_dotdot = inp->i_parent;
 			continue;
 		}
 		if (preen)
 			printf(" (FIXED)\n");
 		else if (reply("FIX") == 0)
 			continue;
 		/* Move the ".." reference from the old target to the parent. */
 		inoinfo(inp->i_dotdot)->ino_linkcnt++;
 		inoinfo(inp->i_parent)->ino_linkcnt--;
 		inp->i_dotdot = inp->i_parent;
 		(void)changeino(inp->i_number, "..", inp->i_parent);
 	}
 	/*
 	 * Mark all the directories that can be found from the root.
 	 */
 	propagate();
 }
 
 /*
  * Per-entry directory callback installed by pass2() as id_func.
  *
  * idesc->id_dirp is the entry being examined and idesc->id_entryno
  * counts the entries already accepted in this directory.  The routine
  * runs in three stages:
  *   - entry 0 must be "."   (checked before label chk1),
  *   - entry 1 must be ".."  (label chk1),
  *   - everything else is an ordinary name (label chk2).
  *
  * Every return value includes KEEPON; ALTERED is OR-ed in when the
  * entry was changed.
  */
 static int
 pass2check(struct inodesc *idesc)
 {
 	struct direct *dirp = idesc->id_dirp;
 	char dirname[MAXPATHLEN + 1];
 	struct inoinfo *inp;
 	int n, entrysize, ret = 0;
 	struct inode ip;
 	union dinode *dp;
 	const char *errmsg;
 	struct direct proto, *newdirp;
 
 	/*
 	 * check for "."
 	 */
 	if (idesc->id_entryno != 0)
 		goto chk1;
 	if (dirp->d_ino != 0 && strcmp(dirp->d_name, ".") == 0) {
 		if (dirp->d_ino != idesc->id_number) {
 			direrror(idesc->id_number, "BAD INODE NUMBER FOR '.'");
 			if (reply("FIX") == 1) {
 				dirp->d_ino = idesc->id_number;
 				ret |= ALTERED;
 			}
 		}
 		if (dirp->d_type != DT_DIR) {
 			direrror(idesc->id_number, "BAD TYPE VALUE FOR '.'");
 			if (reply("FIX") == 1) {
 				dirp->d_type = DT_DIR;
 				ret |= ALTERED;
 			}
 		}
 		goto chk1;
 	}
 	/* "." is missing: build a prototype entry to insert. */
 	proto.d_ino = idesc->id_number;
 	proto.d_type = DT_DIR;
 	proto.d_namlen = 1;
 	(void)strcpy(proto.d_name, ".");
 	entrysize = DIRSIZ(0, &proto);
 	direrror(idesc->id_number, "MISSING '.'");
 	errmsg = "ADD '.' ENTRY";
 	if (dirp->d_reclen < entrysize + DIRSIZ(0, dirp)) {
 		/* Not enough space to add '.', replace first entry with '.' */
 		if (dirp->d_ino != 0) {
 			pwarn("\nFIRST ENTRY IN DIRECTORY CONTAINS %s\n",
 			     dirp->d_name);
 			errmsg = "REPLACE WITH '.'";
 		}
 		if (reply(errmsg) == 0)
 			goto chk1;
 		proto.d_reclen = dirp->d_reclen;
 		memmove(dirp, &proto, (size_t)entrysize);
 		ret |= ALTERED;
 	} else {
 		/* Move over first entry and add '.' entry */
 		if (reply(errmsg) == 0)
 			goto chk1;
 		newdirp = (struct direct *)((char *)(dirp) + entrysize);
 		dirp->d_reclen -= entrysize;
 		memmove(newdirp, dirp, dirp->d_reclen);
 		proto.d_reclen = entrysize;
 		memmove(dirp, &proto, (size_t)entrysize);
 		idesc->id_entryno++;
 		inoinfo(idesc->id_number)->ino_linkcnt--;
 		/* Continue the checks on the entry that was shifted over. */
 		dirp = newdirp;
 		ret |= ALTERED;
 	}
 chk1:
 	/* Stage 2: the ".." entry. */
 	if (idesc->id_entryno > 1)
 		goto chk2;
 	inp = getinoinfo(idesc->id_number);
 	proto.d_ino = inp->i_parent;
 	proto.d_type = DT_DIR;
 	proto.d_namlen = 2;
 	(void)strcpy(proto.d_name, "..");
 	entrysize = DIRSIZ(0, &proto);
 	if (idesc->id_entryno == 0) {
 		/*
 		 * Still positioned on the first entry: split off the space
 		 * following it into a new, zeroed record and examine that
 		 * record as the ".." candidate.
 		 */
 		n = DIRSIZ(0, dirp);
 		if (dirp->d_reclen < n + entrysize)
 			goto chk2;
 		proto.d_reclen = dirp->d_reclen - n;
 		dirp->d_reclen = n;
 		idesc->id_entryno++;
 		inoinfo(dirp->d_ino)->ino_linkcnt--;
 		dirp = (struct direct *)((char *)(dirp) + n);
 		memset(dirp, 0, (size_t)proto.d_reclen);
 		dirp->d_reclen = proto.d_reclen;
 	}
 	if (dirp->d_ino != 0 && strcmp(dirp->d_name, "..") == 0) {
 		if (dirp->d_ino > maxino) {
 			direrror(idesc->id_number, "BAD INODE NUMBER FOR '..'");
 			/*
 			 * If we know parent set it now, otherwise let it
 			 * point to the root inode and it will get cleaned
 			 * up later if that is not correct.
 			 */
 			if (inp->i_parent != 0)
 				dirp->d_ino = inp->i_parent;
 			else
 				dirp->d_ino = UFS_ROOTINO;
 			if (reply("FIX") == 1)
 				ret |= ALTERED;
 		}
 		/* Remember what ".." says for pass2()'s later verification. */
 		inp->i_dotdot = dirp->d_ino;
 		if (dirp->d_type != DT_DIR) {
 			direrror(idesc->id_number, "BAD TYPE VALUE FOR '..'");
 			dirp->d_type = DT_DIR;
 			if (reply("FIX") == 1)
 				ret |= ALTERED;
 		}
 		goto chk2;
 	}
 	fileerror(inp->i_parent != 0 ? inp->i_parent : idesc->id_number,
 	    idesc->id_number, "MISSING '..'");
 	errmsg = "ADD '..' ENTRY";
 	if (dirp->d_reclen < entrysize + DIRSIZ(0, dirp)) {
 		/* No space to add '..', replace second entry with '..' */
 		if (dirp->d_ino != 0) {
 			pfatal("SECOND ENTRY IN DIRECTORY CONTAINS %s\n",
 			    dirp->d_name);
 			errmsg = "REPLACE WITH '..'";
 		}
 		if (reply(errmsg) == 0) {
 			/* (ino_t)-1 tells pass2() the fix was declined. */
 			inp->i_dotdot = (ino_t)-1;
 			goto chk2;
 		}
 		if (proto.d_ino == 0) {
 			/* Defer processing until parent known */
 			idesc->id_entryno++;
 			if (debug)
 				printf("(FIX DEFERRED)\n");
 		}
 		inp->i_dotdot = proto.d_ino;
 		proto.d_reclen = dirp->d_reclen;
 		memmove(dirp, &proto, (size_t)entrysize);
 		ret |= ALTERED;
 	} else {
 		/* Move over second entry and add '..' entry */
 		if (reply(errmsg) == 0) {
 			/* (ino_t)-1 tells pass2() the fix was declined. */
 			inp->i_dotdot = (ino_t)-1;
 			goto chk2;
 		}
 		if (proto.d_ino == 0) {
 			/* Defer processing until parent known */
 			idesc->id_entryno++;
 			if (debug)
 				printf("(FIX DEFERRED)\n");
 		}
 		inp->i_dotdot = proto.d_ino;
 		if (dirp->d_ino == 0) {
 			/* Slot is unused: overwrite it in place. */
 			proto.d_reclen = dirp->d_reclen;
 			memmove(dirp, &proto, (size_t)entrysize);
 		} else {
 			newdirp = (struct direct *)((char *)(dirp) + entrysize);
 			dirp->d_reclen -= entrysize;
 			memmove(newdirp, dirp, dirp->d_reclen);
 			proto.d_reclen = entrysize;
 			memmove(dirp, &proto, (size_t)entrysize);
 			/*
 			 * dirp now holds the new ".." entry, so d_ino here
 			 * is the parent number copied from proto (0 when
 			 * the fix was deferred).
 			 */
 			if (dirp->d_ino != 0) {
 				idesc->id_entryno++;
 				inoinfo(dirp->d_ino)->ino_linkcnt--;
 			}
 			dirp = newdirp;
 		}
 		ret |= ALTERED;
 	}
 chk2:
 	/* Stage 3: ordinary entries; unused slots are skipped. */
 	if (dirp->d_ino == 0)
 		return (ret|KEEPON);
 	if (dirp->d_namlen <= 2 &&
 	    dirp->d_name[0] == '.' &&
 	    idesc->id_entryno >= 2) {
 		/* A second "." or ".." past the first two entries. */
 		if (dirp->d_namlen == 1) {
 			direrror(idesc->id_number, "EXTRA '.' ENTRY");
 			dirp->d_ino = 0;
 			if (reply("FIX") == 1)
 				ret |= ALTERED;
 			return (KEEPON | ret);
 		}
 		if (dirp->d_name[1] == '.') {
 			direrror(idesc->id_number, "EXTRA '..' ENTRY");
 			dirp->d_ino = 0;
 			if (reply("FIX") == 1)
 				ret |= ALTERED;
 			return (KEEPON | ret);
 		}
 	}
 	idesc->id_entryno++;
 	/* n becomes nonzero when the entry is to be removed. */
 	n = 0;
 	if (dirp->d_ino > maxino) {
 		fileerror(idesc->id_number, dirp->d_ino, "I OUT OF RANGE");
 		n = reply("REMOVE");
 	} else if (((dirp->d_ino == UFS_WINO && dirp->d_type != DT_WHT) ||
 		    (dirp->d_ino != UFS_WINO && dirp->d_type == DT_WHT))) {
 		fileerror(idesc->id_number, dirp->d_ino, "BAD WHITEOUT ENTRY");
 		dirp->d_ino = UFS_WINO;
 		dirp->d_type = DT_WHT;
 		if (reply("FIX") == 1)
 			ret |= ALTERED;
 	} else {
 again:
 		/* Dispatch on the state recorded for the target inode. */
 		switch (inoinfo(dirp->d_ino)->ino_state) {
 		case USTATE:
 			if (idesc->id_entryno <= 2)
 				break;
 			fileerror(idesc->id_number, dirp->d_ino, "UNALLOCATED");
 			n = reply("REMOVE");
 			break;
 
 		case DCLEAR:
 		case FCLEAR:
 			if (idesc->id_entryno <= 2)
 				break;
 			if (inoinfo(dirp->d_ino)->ino_state == FCLEAR)
 				errmsg = "DUP/BAD";
 			else if (!preen && !usedsoftdep)
 				errmsg = "ZERO LENGTH DIRECTORY";
 			else if (cursnapshot == 0) {
 				n = 1;
 				break;
 			} else {
 				getpathname(dirname, idesc->id_number,
 				    dirp->d_ino);
 				pwarn("ZERO LENGTH DIRECTORY %s I=%ju",
 				    dirname, (uintmax_t)dirp->d_ino);
 				/*
 				 * We need to:
 				 *    setcwd(idesc->id_parent);
 				 *    rmdir(dirp->d_name);
 				 */
 				cmd.value = idesc->id_number;
 				if (sysctlbyname("vfs.ffs.setcwd", 0, 0,
 				    &cmd, sizeof cmd) == -1) {
 					/* kernel lacks support */
 					printf(" (IGNORED)\n");
 					n = 1;
 					break;
 				}
 				if (rmdir(dirp->d_name) == -1) {
 					printf(" (REMOVAL FAILED: %s)\n",
 					    strerror(errno));
 					n = 1;
 					break;
 				}
 				/* ".." reference to parent is removed */
 				inoinfo(idesc->id_number)->ino_linkcnt--;
 				printf(" (REMOVED)\n");
 				break;
 			}
 			fileerror(idesc->id_number, dirp->d_ino, errmsg);
 			if ((n = reply("REMOVE")) == 1)
 				break;
 			/*
 			 * Operator kept the entry: reset the inode's state
 			 * and link count from its on-disk mode and nlink,
 			 * then re-run the switch with the new state.
 			 */
 			ginode(dirp->d_ino, &ip);
 			dp = ip.i_dp;
 			inoinfo(dirp->d_ino)->ino_state =
 			   (DIP(dp, di_mode) & IFMT) == IFDIR ? DSTATE : FSTATE;
 			inoinfo(dirp->d_ino)->ino_linkcnt = DIP(dp, di_nlink);
 			irelse(&ip);
 			goto again;
 
 		case DSTATE:
 		case DZLINK:
 			if (inoinfo(idesc->id_number)->ino_state == DFOUND)
 				inoinfo(dirp->d_ino)->ino_state = DFOUND;
 			/* FALLTHROUGH */
 
 		case DFOUND:
 			inp = getinoinfo(dirp->d_ino);
 			if (idesc->id_entryno > 2) {
 				/*
 				 * First name seen for this directory becomes
 				 * its parent; any further name is an extra
 				 * hard link handled by fix_extraneous().
 				 */
 				if (inp->i_parent == 0)
 					inp->i_parent = idesc->id_number;
 				else if ((n = fix_extraneous(inp, idesc)) == 1)
 					break;
 			}
 			/* FALLTHROUGH */
 
 		case FSTATE:
 		case FZLINK:
 			if (dirp->d_type != inoinfo(dirp->d_ino)->ino_type) {
 				fileerror(idesc->id_number, dirp->d_ino,
 				    "BAD TYPE VALUE");
 				dirp->d_type = inoinfo(dirp->d_ino)->ino_type;
 				if (reply("FIX") == 1)
 					ret |= ALTERED;
 			}
 			/* One directory reference accounted for. */
 			inoinfo(dirp->d_ino)->ino_linkcnt--;
 			break;
 
 		default:
 			errx(EEXIT, "BAD STATE %d FOR INODE I=%ju",
 			    inoinfo(dirp->d_ino)->ino_state,
 			    (uintmax_t)dirp->d_ino);
 		}
 	}
 	if (n == 0)
 		return (ret|KEEPON);
 	/* Removal requested: clear the entry's inode number. */
 	dirp->d_ino = 0;
 	return (ret|KEEPON|ALTERED);
 }
 
 static int
 fix_extraneous(struct inoinfo *inp, struct inodesc *idesc)
 {
 	char *cp;
 	struct inode ip;
 	struct inodesc dotdesc;
 	char oldname[MAXPATHLEN + 1];
 	char newname[MAXPATHLEN + 1];
 
 	/*
 	 * If we have not yet found "..", look it up now so we know
 	 * which inode the directory itself believes is its parent.
 	 */
 	if (inp->i_dotdot == 0) {
 		memset(&dotdesc, 0, sizeof(struct inodesc));
 		dotdesc.id_type = DATA;
 		dotdesc.id_number = idesc->id_dirp->d_ino;
 		dotdesc.id_func = findino;
 		dotdesc.id_name = strdup("..");
 		ginode(dotdesc.id_number, &ip);
 		if ((ckinode(ip.i_dp, &dotdesc) & FOUND))
 			inp->i_dotdot = dotdesc.id_parent;
 		irelse(&ip);
+		free(dotdesc.id_name);
 	}
 	/*
 	 * We have the previously found old name (inp->i_parent) and the
 	 * just found new name (idesc->id_number). We have five cases:
 	 * 1)  ".." is missing - can remove either name, choose to delete
 	 *     new one and let fsck create ".." pointing to old name.
 	 * 2) Both new and old are in same directory, choose to delete
 	 *    the new name and let fsck fix ".." if it is wrong.
 	 * 3) ".." does not point to the new name, so delete it and let
 	 *    fsck fix ".." to point to the old one if it is wrong.
 	 * 4) ".." points to the old name only, so delete the new one.
 	 * 5) ".." points to the new name only, so delete the old one.
 	 *
 	 * For cases 1-4 we eliminate the new name;
 	 * for case 5 we eliminate the old name.
 	 */
 	if (inp->i_dotdot == 0 ||		    /* Case 1 */
 	    idesc->id_number == inp->i_parent ||    /* Case 2 */
 	    inp->i_dotdot != idesc->id_number ||    /* Case 3 */
 	    inp->i_dotdot == inp->i_parent) {	    /* Case 4 */
 		getpathname(newname, idesc->id_number, idesc->id_number);
 		if (strcmp(newname, "/") != 0)
 			strcat (newname, "/");
 		strcat(newname, idesc->id_dirp->d_name);
 		getpathname(oldname, inp->i_number, inp->i_number);
 		pwarn("%s IS AN EXTRANEOUS HARD LINK TO DIRECTORY %s",
 		    newname, oldname);
 		if (cursnapshot != 0) {
 			/*
 			 * We need to
 			 *    setcwd(idesc->id_number);
 			 *    unlink(idesc->id_dirp->d_name);
 			 */
 			cmd.value = idesc->id_number;
 			if (sysctlbyname("vfs.ffs.setcwd", 0, 0,
 			    &cmd, sizeof cmd) == -1) {
 				printf(" (IGNORED)\n");
 				return (0);
 			}
 			cmd.value = (intptr_t)idesc->id_dirp->d_name;
 			cmd.size = inp->i_number; /* verify same name */
 			if (sysctlbyname("vfs.ffs.unlink", 0, 0,
 			    &cmd, sizeof cmd) == -1) {
 				printf(" (UNLINK FAILED: %s)\n",
 				    strerror(errno));
 				return (0);
 			}
 			printf(" (REMOVED)\n");
 			return (0);
 		}
 		if (preen) {
 			printf(" (REMOVED)\n");
 			return (1);
 		}
 		return (reply("REMOVE"));
 	}
 	/*
 	 * None of the first four cases above, so must be case (5).
 	 * Eliminate the old name and make the new the name the parent.
 	 */
 	getpathname(oldname, inp->i_parent, inp->i_number);
 	getpathname(newname, inp->i_number, inp->i_number);
 	pwarn("%s IS AN EXTRANEOUS HARD LINK TO DIRECTORY %s", oldname,
 	    newname);
 	if (cursnapshot != 0) {
 		/*
 		 * We need to
 		 *    setcwd(inp->i_parent);
 		 *    unlink(last component of oldname pathname);
 		 */
 		cmd.value = inp->i_parent;
 		if (sysctlbyname("vfs.ffs.setcwd", 0, 0,
 		    &cmd, sizeof cmd) == -1) {
 			printf(" (IGNORED)\n");
 			return (0);
 		}
 		if ((cp = strchr(oldname, '/')) == NULL) {
 			printf(" (IGNORED)\n");
 			return (0);
 		}
 		cmd.value = (intptr_t)(cp + 1);
 		cmd.size = inp->i_number; /* verify same name */
 		if (sysctlbyname("vfs.ffs.unlink", 0, 0,
 		    &cmd, sizeof cmd) == -1) {
 			printf(" (UNLINK FAILED: %s)\n",
 			    strerror(errno));
 			return (0);
 		}
 		printf(" (REMOVED)\n");
 		inp->i_parent = idesc->id_number;  /* reparent to correct dir */
 		return (0);
 	}
 	if (!preen && !reply("REMOVE"))
 		return (0);
 	memset(&dotdesc, 0, sizeof(struct inodesc));
 	dotdesc.id_type = DATA;
 	dotdesc.id_number = inp->i_parent; /* directory in which name appears */
 	dotdesc.id_parent = inp->i_number; /* inode number in entry to delete */
 	dotdesc.id_func = deleteentry;
 	ginode(dotdesc.id_number, &ip);
 	if ((ckinode(ip.i_dp, &dotdesc) & FOUND) && preen)
 		printf(" (REMOVED)\n");
 	irelse(&ip);
 	inp->i_parent = idesc->id_number;  /* reparent to correct directory */
 	inoinfo(inp->i_number)->ino_linkcnt++; /* name gone, return reference */
 	return (0);
 }
 
 /*
  * Directory-scan callback used by fix_extraneous(): skip the first two
  * entries, then zero the inode number of the first entry that refers
  * to idesc->id_parent.  The entry counter advances on every call.
  */
 static int
 deleteentry(struct inodesc *idesc)
 {
 	struct direct *entry = idesc->id_dirp;
 
 	idesc->id_entryno++;
 	if (idesc->id_entryno <= 2)
 		return (KEEPON);
 	if (entry->d_ino != idesc->id_parent)
 		return (KEEPON);
 	entry->d_ino = 0;
 	return (ALTERED|STOP|FOUND);
 }
 
 /*
  * Routine to sort disk blocks.
  */
 static int
 blksort(const void *arg1, const void *arg2)
 {
 
 	return ((*(struct inoinfo * const *)arg1)->i_blks[0] -
 		(*(struct inoinfo * const *)arg2)->i_blks[0]);
 }
diff --git a/sbin/fsck_ffs/suj.c b/sbin/fsck_ffs/suj.c
index e9f5bbd421b1..a1d624392fcf 100644
--- a/sbin/fsck_ffs/suj.c
+++ b/sbin/fsck_ffs/suj.c
@@ -1,2522 +1,2520 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright 2009, 2010 Jeffrey W. Roberson <jeff@FreeBSD.org>
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/disk.h>
 #include <sys/disklabel.h>
 #include <sys/mount.h>
 #include <sys/stat.h>
 
 #include <ufs/ufs/ufsmount.h>
 #include <ufs/ufs/dinode.h>
 #include <ufs/ufs/dir.h>
 #include <ufs/ffs/fs.h>
 
 #include <assert.h>
 #include <err.h>
 #include <setjmp.h>
 #include <stdarg.h>
 #include <stdio.h>
 #include <stdlib.h>
 #include <stdint.h>
 #include <libufs.h>
 #include <string.h>
 #include <strings.h>
 #include <sysexits.h>
 #include <time.h>
 
 #include "fsck.h"
 
 /*
  * Directory offset used for ".." entries: ino_setskip() probes a
  * directory at this offset for its parent, and ino_adjust() treats
  * reference records whose jr_diroff equals it as ".." links.
  */
 #define	DOTDOT_OFFSET	DIRECTSIZ(1)
 
 /*
  * Element of the `allsegs' tail queue.  Pairs a jsegrec with a byte
  * buffer; presumably the segment header and the raw data it was read
  * from (the code that fills these in is outside this part of the file).
  */
 struct suj_seg {
 	TAILQ_ENTRY(suj_seg) ss_next;
 	struct jsegrec	ss_rec;
 	uint8_t		*ss_blk;
 };
 
 /*
  * Queue element wrapping a pointer to one journal record.  Users cast
  * sr_rec to the record type they expect: jrefrec for the per-inode
  * lists and jblkrec for the per-block lists.
  */
 struct suj_rec {
 	TAILQ_ENTRY(suj_rec) sr_next;
 	union jrec	*sr_rec;
 };
 TAILQ_HEAD(srechd, suj_rec);
 
 /*
  * Per-inode journal state, hashed by inode number inside its cylinder
  * group's suj_cg (see ino_lookup()).
  *
  * si_recs       reference records; walked as jrefrec by ino_remref()
  *               and ino_adjust().
  * si_ino        inode number this entry describes.
  * si_skipparent set by ino_setskip(); makes ino_free_children() leave
  *               the ".." entry alone.
  * si_hasrecs    when zero ino_remref() just drops the on-disk link
  *               count with ino_decr().
  * si_linkadj    when set ino_remref() adjusts si_nlink and calls
  *               ino_adjust() instead.
  * si_mode       mode used by ino_adjust() (masked with IFMT).
  * si_nlinkadj   bumped by ino_remref() when no matching reference
  *               record exists yet.
  * si_nlink      link count that ino_adjust() applies to the inode.
  * si_dotlinks   portion of si_nlink that comes from dot links.
  *
  * The remaining fields are not used in the part of the file this
  * comment was written against.
  */
 struct suj_ino {
 	LIST_ENTRY(suj_ino)	si_next;
 	struct srechd		si_recs;
 	struct srechd		si_newrecs;
 	struct srechd		si_movs;
 	struct jtrncrec		*si_trunc;
 	ino_t			si_ino;
 	char			si_skipparent;
 	char			si_hasrecs;
 	char			si_blkadj;
 	char			si_linkadj;
 	int			si_mode;
 	nlink_t			si_nlinkadj;
 	nlink_t			si_nlink;
 	nlink_t			si_dotlinks;
 };
 LIST_HEAD(inohd, suj_ino);
 
 /*
  * Per-block journal state, hashed inside its cylinder group's suj_cg
  * (see blk_lookup()).  sb_blk is the block number used as the key and
  * sb_recs holds the journal records for it, read as jblkrec.
  */
 struct suj_blk {
 	LIST_ENTRY(suj_blk)	sb_next;
 	struct srechd		sb_recs;
 	ufs2_daddr_t		sb_blk;
 };
 LIST_HEAD(blkhd, suj_blk);
 
 /*
  * Per-cylinder-group state, created on demand by cg_lookup().
  *
  * sc_blkhash / sc_inohash  hash buckets of suj_blk / suj_ino entries.
  * sc_lastino / sc_lastblk  checked first by ino_lookup() / blk_lookup()
  *                          as a one-entry cache.
  * sc_cgbp / sc_cgp         buffer holding the cg and the cg inside it;
  *                          both are set by cg_lookup().
  * sc_cgx                   cylinder group number.
  */
 struct suj_cg {
 	LIST_ENTRY(suj_cg)	sc_next;
 	struct blkhd		sc_blkhash[HASHSIZE];
 	struct inohd		sc_inohash[HASHSIZE];
 	struct ino_blk		*sc_lastiblk;
 	struct suj_ino		*sc_lastino;
 	struct suj_blk		*sc_lastblk;
 	struct bufarea		*sc_cgbp;
 	struct cg		*sc_cgp;
 	int			sc_cgx;
 };
 
 /* Hash of suj_cg entries, bucketed by HASH(cgx); see cg_lookup(). */
 static LIST_HEAD(cghd, suj_cg) cghash[HASHSIZE];
 /* Most recent hash hit in cg_lookup(), tried before the hash. */
 static struct suj_cg *lastcg;
 
 static TAILQ_HEAD(seghd, suj_seg) allsegs;
 static uint64_t oldseq;
 static struct fs *fs = NULL;
 static ino_t sujino;
 
 /*
  * Summary statistics.
  */
 static uint64_t freefrags;
 static uint64_t freeblocks;
 static uint64_t freeinos;
 static uint64_t freedir;
 static uint64_t jbytes;
 static uint64_t jrecs;
 
 /* Target of the longjmp() issued by err_suj(). */
 static jmp_buf	jmpbuf;
 
 /*
  * Callback type for ino_visit() and indir_visit().  It is invoked with
  * the inode number, the lbn, the block address and the frag count.
  */
 typedef void (*ino_visitor)(ino_t, ufs_lbn_t, ufs2_daddr_t, int);
 static void err_suj(const char *, ...) __dead2;
 static void ino_trunc(ino_t, off_t);
 static void ino_decr(ino_t);
 static void ino_adjust(struct suj_ino *);
 static void ino_build(struct suj_ino *);
 static int blk_isfree(ufs2_daddr_t);
 static void initsuj(void);
 
 /*
  * Allocate n bytes with Malloc(); exit through err(3) with EX_OSERR if
  * the allocation fails, so callers never see NULL.
  */
 static void *
 errmalloc(size_t n)
 {
 	void *mem;

 	if ((mem = Malloc(n)) == NULL)
 		err(EX_OSERR, "malloc(%zu)", n);
 	return (mem);
 }
 
 /*
  * Called when the journal check hits a fatal error.  Prints the
  * formatted message on stdout (prefixed with the device name when
  * preening) and then longjmp()s to jmpbuf; it never returns.  The code
  * at the setjmp() site is then expected to offer a fallback to a
  * normal fsck.
  */
 static void
 err_suj(const char * restrict fmt, ...)
 {
 	va_list args;

 	if (preen)
 		(void)printf("%s: ", cdevname);
 
 	va_start(args, fmt);
 	(void)vprintf(fmt, args);
 	va_end(args);
 
 	longjmp(jmpbuf, -1);
 }
 
 /*
  * Lookup a cg by number in the hash so we can keep track of which cgs
  * need stats rebuilt.
  */
 static struct suj_cg *
 cg_lookup(int cgx)
 {
 	struct cghd *hd;
 	struct suj_cg *sc;
 	struct bufarea *cgbp;
 
 	if (cgx < 0 || cgx >= fs->fs_ncg)
 		err_suj("Bad cg number %d\n", cgx);
 	if (lastcg && lastcg->sc_cgx == cgx)
 		return (lastcg);
 	cgbp = cglookup(cgx);
 	if (!check_cgmagic(cgx, cgbp, 0))
 		err_suj("UNABLE TO REBUILD CYLINDER GROUP %d", cgx);
 	hd = &cghash[HASH(cgx)];
 	LIST_FOREACH(sc, hd, sc_next)
 		if (sc->sc_cgx == cgx) {
 			sc->sc_cgbp = cgbp;
 			sc->sc_cgp = sc->sc_cgbp->b_un.b_cg;
 			lastcg = sc;
 			return (sc);
 		}
 	sc = errmalloc(sizeof(*sc));
 	bzero(sc, sizeof(*sc));
 	sc->sc_cgbp = cgbp;
 	sc->sc_cgp = sc->sc_cgbp->b_un.b_cg;
 	sc->sc_cgx = cgx;
 	LIST_INSERT_HEAD(hd, sc, sc_next);
 	return (sc);
 }
 
 /*
  * Find the suj_ino for inode 'ino' in its cylinder group's hash.  When
  * no entry exists, NULL is returned if 'creat' is zero; otherwise a new
  * zeroed entry with empty record queues is inserted and returned.
  */
 static struct suj_ino *
 ino_lookup(ino_t ino, int creat)
 {
 	struct suj_cg *sc;
 	struct inohd *bucket;
 	struct suj_ino *cur;

 	sc = cg_lookup(ino_to_cg(fs, ino));
 	if (sc->sc_lastino != NULL && sc->sc_lastino->si_ino == ino)
 		return (sc->sc_lastino);
 	bucket = &sc->sc_inohash[HASH(ino)];
 	LIST_FOREACH(cur, bucket, si_next) {
 		if (cur->si_ino == ino)
 			return (cur);
 	}
 	if (!creat)
 		return (NULL);
 	cur = errmalloc(sizeof(*cur));
 	memset(cur, 0, sizeof(*cur));
 	cur->si_ino = ino;
 	TAILQ_INIT(&cur->si_recs);
 	TAILQ_INIT(&cur->si_newrecs);
 	TAILQ_INIT(&cur->si_movs);
 	LIST_INSERT_HEAD(bucket, cur, si_next);
 
 	return (cur);
 }
 
 /*
  * Find the suj_blk for block 'blk' in its cylinder group's hash.  When
  * no entry exists, NULL is returned if 'creat' is zero; otherwise a new
  * zeroed entry with an empty record queue is inserted and returned.
  */
 static struct suj_blk *
 blk_lookup(ufs2_daddr_t blk, int creat)
 {
 	struct suj_cg *sc;
 	struct blkhd *bucket;
 	struct suj_blk *cur;

 	sc = cg_lookup(dtog(fs, blk));
 	if (sc->sc_lastblk != NULL && sc->sc_lastblk->sb_blk == blk)
 		return (sc->sc_lastblk);
 	bucket = &sc->sc_blkhash[HASH(fragstoblks(fs, blk))];
 	LIST_FOREACH(cur, bucket, sb_next) {
 		if (cur->sb_blk == blk)
 			return (cur);
 	}
 	if (!creat)
 		return (NULL);
 	cur = errmalloc(sizeof(*cur));
 	memset(cur, 0, sizeof(*cur));
 	cur->sb_blk = blk;
 	TAILQ_INIT(&cur->sb_recs);
 	LIST_INSERT_HEAD(bucket, cur, sb_next);
 
 	return (cur);
 }
 
 /*
  * Returns 1 if the frag range [start, start + frags) intersects the
  * range described by 'brec', which begins at jb_blkno + jb_oldfrags and
  * is jb_frags long, and 0 otherwise.
  */
 static int
 blk_overlaps(struct jblkrec *brec, ufs2_daddr_t start, int frags)
 {
 	ufs2_daddr_t rec_first;
 	ufs2_daddr_t rec_past;
 	ufs2_daddr_t past;

 	rec_first = brec->jb_blkno + brec->jb_oldfrags;
 	rec_past = rec_first + brec->jb_frags;
 	past = start + frags;
 	return (start < rec_past && past > rec_first);
 }
 
 /*
  * Returns 1 if 'brec' belongs to the same inode and lbn, begins at
  * 'start' (jb_blkno + jb_oldfrags) and covers at least 'frags' frags;
  * 0 otherwise.
  */
 static int
 blk_equals(struct jblkrec *brec, ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t start,
     int frags)
 {
 
 	return (brec->jb_ino == ino && brec->jb_lbn == lbn &&
 	    brec->jb_blkno + brec->jb_oldfrags == start &&
 	    brec->jb_frags >= frags);
 }
 
 /*
  * Set in *mask one bit per frag covered by 'brec': bits jb_oldfrags up
  * to, but not including, jb_oldfrags + jb_frags.
  */
 static void
 blk_setmask(struct jblkrec *brec, int *mask)
 {
 	int bit;

 	bit = brec->jb_oldfrags;
 	while (bit < brec->jb_oldfrags + brec->jb_frags) {
 		*mask |= 1 << bit;
 		bit++;
 	}
 }
 
 /*
  * Determine whether a given block has been reallocated to a new location.
  * Returns a mask of overlapping bits if any frags have been reused or
  * zero if the block has not been re-used and the contents can be trusted.
  *
  * This is used to ensure that an orphaned pointer due to truncate is safe
  * to be freed.  The mask value can be used to free partial blocks.
  *
  * 'blk' is the first frag of interest and 'frags' the number of frags;
  * 'ino' and 'lbn' identify the owner whose own journal records do not
  * count as a reallocation.  The mask is shifted down by blk's offset
  * from the start of its containing block, so bit 0 refers to 'blk'.
  */
 static int
 blk_freemask(ufs2_daddr_t blk, ino_t ino, ufs_lbn_t lbn, int frags)
 {
 	struct suj_blk *sblk;
 	struct suj_rec *srec;
 	struct jblkrec *brec;
 	int mask;
 	int off;
 
 	/*
 	 * To be certain we're not freeing a reallocated block we lookup
 	 * this block in the blk hash and see if there is an allocation
 	 * journal record that overlaps with any fragments in the block
 	 * we're concerned with.  If any fragments have been reallocated
 	 * the block has already been freed and re-used for another purpose.
 	 */
 	mask = 0;
 	sblk = blk_lookup(blknum(fs, blk), 0);
 	/* No journal records at all for the containing block. */
 	if (sblk == NULL)
 		return (0);
 	off = blk - sblk->sb_blk;
 	TAILQ_FOREACH(srec, &sblk->sb_recs, sr_next) {
 		brec = (struct jblkrec *)srec->sr_rec;
 		/*
 		 * If the block overlaps but does not match
 		 * exactly this record refers to the current
 		 * location.
 		 */
 		if (blk_overlaps(brec, blk, frags) == 0)
 			continue;
 		/*
 		 * A record for this very ino/lbn/start discards the bits
 		 * gathered so far; any other overlapping record adds the
 		 * frags it covers.
 		 */
 		if (blk_equals(brec, ino, lbn, blk, frags) == 1)
 			mask = 0;
 		else
 			blk_setmask(brec, &mask);
 	}
 	if (debug)
 		printf("blk_freemask: blk %jd sblk %jd off %d mask 0x%X\n",
 		    blk, sblk->sb_blk, off, mask);
 	return (mask >> off);
 }
 
 /*
  * Decide whether an indirect block can be followed.  It cannot if any
  * part of it has been reallocated or if its last journal entry was an
  * allocation: a just allocated indirect may not hold valid pointers
  * yet, and its children have records of their own.  It also cannot be
  * followed once the cg bitmap shows it free, because a new allocation
  * may write to the block before the journal is written.
  *
  * Returns 1 if it's safe to follow the indirect and 0 otherwise.
  */
 static int
 blk_isindir(ufs2_daddr_t blk, ino_t ino, ufs_lbn_t lbn)
 {
 	struct suj_blk *sblk;
 	struct suj_rec *last;
 	struct jblkrec *brec;

 	sblk = blk_lookup(blk, 0);
 	/* Nothing journaled for this block: trust it. */
 	if (sblk == NULL || TAILQ_EMPTY(&sblk->sb_recs))
 		return (1);
 	/* Only the most recent record decides. */
 	last = TAILQ_LAST(&sblk->sb_recs, srechd);
 	brec = (struct jblkrec *)last->sr_rec;
 	if (!blk_equals(brec, ino, lbn, blk, fs->fs_frag))
 		return (0);
 	if (brec->jb_op != JOP_FREEBLK)
 		return (0);
 	return (!blk_isfree(blk));
 }
 
 /*
  * Check to see if the requested block is available.
  * We can just check in the cylinder-group maps as
  * they will only have usable blocks in them.
  *
  * Looks, inside the block that contains 'blkno', for a run of 'frags'
  * frags whose bits are all set in the cg free map, and claims the first
  * such run.
  *
  * Returns 0 if 'blkno' is beyond fs_size or no run was found, a
  * negative value if the cylinder group fails its magic check, and
  * otherwise the address of the first frag of the claimed run.
  */
 ufs2_daddr_t
-suj_checkblkavail(blkno, frags)
-	ufs2_daddr_t blkno;
-	long frags;
+suj_checkblkavail(ufs2_daddr_t blkno, long frags)
 {
 	struct bufarea *cgbp;
 	struct cg *cgp;
 	ufs2_daddr_t j, k, baseblk;
 	long cg;
 
 	if ((u_int64_t)blkno > sblock.fs_size)
 		return (0);
 	cg = dtog(&sblock, blkno);
 	cgbp = cglookup(cg);
 	cgp = cgbp->b_un.b_cg;
 	if (!check_cgmagic(cg, cgbp, 0))
 		return (-((cg + 1) * sblock.fs_fpg - sblock.fs_frag));
 	baseblk = dtogd(&sblock, blkno);
 	/* Try each starting frag that leaves room for 'frags' frags. */
 	for (j = 0; j <= sblock.fs_frag - frags; j++) {
 		if (!isset(cg_blksfree(cgp), baseblk + j))
 			continue;
 		for (k = 1; k < frags; k++)
 			if (!isset(cg_blksfree(cgp), baseblk + j + k))
 				break;
 		/* Run broken at frag j + k: resume the search past it. */
 		if (k < frags) {
 			j += k;
 			continue;
 		}
 		/* Claim the run and update the counters to match. */
 		for (k = 0; k < frags; k++)
 			clrbit(cg_blksfree(cgp), baseblk + j + k);
 		n_blks += frags;
 		if (frags == sblock.fs_frag)
 			cgp->cg_cs.cs_nbfree--;
 		else
 			cgp->cg_cs.cs_nffree -= frags;
 		cgdirty(cgbp);
 		return ((cg * sblock.fs_fpg) + baseblk + j);
 	}
 	return (0);
 }
 
 /*
  * Release inode 'ino' in its cylinder group's inode bitmap.
  *
  * Returns 0 without touching the cg when the bit was already clear, so
  * the caller knows it does not have to check the inode contents;
  * returns 1 after clearing the bit, updating the cg counters (and the
  * directory count when 'mode' is a directory) and dirtying the cg.
  */
 static int
 ino_free(ino_t ino, int mode)
 {
 	struct suj_cg *sc;
 	struct cg *cgp;
 	uint8_t *inomap;
 	int cgx;

 	cgx = ino_to_cg(fs, ino);
 	/* From here on 'ino' is the index within the cylinder group. */
 	ino %= fs->fs_ipg;
 	sc = cg_lookup(cgx);
 	cgp = sc->sc_cgp;
 	inomap = cg_inosused(cgp);
 	/*
 	 * The bitmap may never have reached the disk, so only clear a bit
 	 * that is set; otherwise the cg does not need to be written.
 	 */
 	if (isclr(inomap, ino))
 		return (0);
 	clrbit(inomap, ino);
 	freeinos++;
 	if (cgp->cg_irotor > ino)
 		cgp->cg_irotor = ino;
 	cgp->cg_cs.cs_nifree++;
 	if ((mode & IFMT) == IFDIR) {
 		cgp->cg_cs.cs_ndir--;
 		freedir++;
 	}
 	cgdirty(sc->sc_cgbp);
 
 	return (1);
 }
 
 /*
  * Free 'frags' frags starting at filesystem block 'bno' skipping any frags
  * set in the mask.
  *
  * 'ino' is handed to snapblkfree(); when that call returns non-zero
  * nothing is freed here.  Otherwise the frags are marked in the cg free
  * map, the freeblocks/freefrags statistics are updated and the cg is
  * dirtied.
  */
 static void
 blk_free(ino_t ino, ufs2_daddr_t bno, int mask, int frags)
 {
 	ufs1_daddr_t fragno, cgbno;
 	struct suj_cg *sc;
 	struct cg *cgp;
 	int i, cg;
 	uint8_t *blksfree;
 
 	if (debug)
 		printf("Freeing %d frags at blk %jd mask 0x%x\n",
 		    frags, bno, mask);
 	/*
 	 * Check to see if the block needs to be claimed by a snapshot.
 	 * If wanted, the snapshot references it. Otherwise we free it.
 	 */
 	if (snapblkfree(fs, bno, lfragtosize(fs, frags), ino,
 	    suj_checkblkavail))
 		return;
 	cg = dtog(fs, bno);
 	sc = cg_lookup(cg);
 	cgp = sc->sc_cgp;
 	cgbno = dtogd(fs, bno);
 	blksfree = cg_blksfree(cgp);
 
 	/*
 	 * If it's not allocated we only wrote the journal entry
 	 * and never the bitmaps.  Here we unconditionally clear and
 	 * resolve the cg summary later.
 	 */
 	if (frags == fs->fs_frag && mask == 0) {
 		/* Whole block: ffs_setblock() takes a block index. */
 		fragno = fragstoblks(fs, cgbno);
 		ffs_setblock(fs, blksfree, fragno);
 		freeblocks++;
 	} else {
 		/*
 		 * deallocate the fragment
 		 */
 		/* Count only frags that were not already marked free. */
 		for (i = 0; i < frags; i++)
 			if ((mask & (1 << i)) == 0 && isclr(blksfree, cgbno +i)) {
 				freefrags++;
 				setbit(blksfree, cgbno + i);
 			}
 	}
 	cgdirty(sc->sc_cgbp);
 }
 
 /*
  * Returns non-zero if the whole block starting at 'bno' is marked free
  * in its cylinder group's free map and 0 otherwise.
  *
  * ffs_isblock() is indexed by block, not by fragment, so the
  * cg-relative fragment offset is converted with fragstoblks() first.
  * This is the same indexing blk_free() uses when it calls
  * ffs_setblock() on this map.
  */
 static int
 blk_isfree(ufs2_daddr_t bno)
 {
 	struct suj_cg *sc;
 	ufs2_daddr_t cgbno;

 	sc = cg_lookup(dtog(fs, bno));
 	cgbno = dtogd(fs, bno);
 	return (ffs_isblock(fs, cg_blksfree(sc->sc_cgp),
 	    fragstoblks(fs, cgbno)));
 }
 
 /*
  * Check whether block 'blk' is what inode 'ino' has at logical block
  * 'lbn'.  Returns 1 if so and 0 if not; an inode with a zero link count
  * or a zero mode never matches.  lbn may be negative for indirects or
  * ext blocks.  'frags' is passed through to ino_blkatoff().
  */
 static int
 blk_isat(ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t blk, int *frags)
 {
 	struct inode ip;
 	union dinode *dp;
 	ufs2_daddr_t found;
 	int match;

 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	match = 0;
 	if (DIP(dp, di_nlink) != 0 && DIP(dp, di_mode) != 0) {
 		found = ino_blkatoff(dp, ino, lbn, frags, NULL);
 		match = (found == blk);
 	}
 	irelse(&ip);
 	return (match);
 }
 
 /*
  * Clear the directory entry at diroff that should point to child.  Minimal
  * checking is done and it is assumed that this path was verified with isat.
  *
  * 'parent' is the directory inode and 'diroff' the byte offset of the
  * entry within it.  An I/O error on the directory block ends the
  * journal check through err_suj(); an entry that does not refer to
  * 'child' terminates the program through errx().
  */
 static void
 ino_clrat(ino_t parent, off_t diroff, ino_t child)
 {
 	union dinode *dip;
 	struct direct *dp;
 	struct inode ip;
 	ufs2_daddr_t blk;
 	struct bufarea *bp;
 	ufs_lbn_t lbn;
 	int blksize;
 	int frags;
 	int doff;
 
 	if (debug)
 		printf("Clearing inode %ju from parent %ju at offset %jd\n",
 		    (uintmax_t)child, (uintmax_t)parent, diroff);
 
 	/* Split the offset into a logical block and an offset within it. */
 	lbn = lblkno(fs, diroff);
 	doff = blkoff(fs, diroff);
 	ginode(parent, &ip);
 	dip = ip.i_dp;
 	blk = ino_blkatoff(dip, parent, lbn, &frags, NULL);
 	blksize = sblksize(fs, DIP(dip, di_size), lbn);
 	irelse(&ip);
 	bp = getdatablk(blk, blksize, BT_DIRDATA);
 	if (bp->b_errs != 0)
 		err_suj("ino_clrat: UNRECOVERABLE I/O ERROR");
 	dp = (struct direct *)&bp->b_un.b_buf[doff];
 	if (dp->d_ino != child)
 		errx(1, "Inode %ju does not exist in %ju at %jd",
 		    (uintmax_t)child, (uintmax_t)parent, diroff);
 	/* A zero inode number marks the entry as unused. */
 	dp->d_ino = 0;
 	dirty(bp);
 	brelse(bp);
 	/*
 	 * The actual .. reference count will already have been removed
 	 * from the parent by the .. remref record.
 	 */
 }
 
 /*
  * Determines whether a pointer to an inode exists within a directory
  * at a specified offset.
  *
  * Returns 1 if the entry at byte offset 'diroff' of directory 'parent'
  * refers to 'child' and 0 otherwise.  On success *mode is set from the
  * entry's d_type and *isdot is set to 1 when the entry is a "." or ".."
  * link; on every other path *isdot is 0 and *mode holds the parent
  * inode's mode.  An I/O error or a corrupt directory block ends the
  * journal check through err_suj().
  */
 static int
 ino_isat(ino_t parent, off_t diroff, ino_t child, int *mode, int *isdot)
 {
 	struct inode ip;
 	union dinode *dip;
 	struct bufarea *bp;
 	struct direct *dp;
 	ufs2_daddr_t blk;
 	ufs_lbn_t lbn;
 	int blksize;
 	int frags;
 	int dpoff;
 	int doff;
 
 	*isdot = 0;
 	ginode(parent, &ip);
 	dip = ip.i_dp;
 	*mode = DIP(dip, di_mode);
 	if ((*mode & IFMT) != IFDIR) {
 		if (debug) {
 			/*
 			 * This can happen if the parent inode
 			 * was reallocated.
 			 */
 			if (*mode != 0)
 				printf("Directory %ju has bad mode %o\n",
 				    (uintmax_t)parent, *mode);
 			else
 				printf("Directory %ju has zero mode\n",
 				    (uintmax_t)parent);
 		}
 		irelse(&ip);
 		return (0);
 	}
 	lbn = lblkno(fs, diroff);
 	doff = blkoff(fs, diroff);
 	blksize = sblksize(fs, DIP(dip, di_size), lbn);
 	/* The entry must lie inside the directory and inside its block. */
 	if (diroff + DIRECTSIZ(1) > DIP(dip, di_size) || doff >= blksize) {
 		if (debug)
 			printf("ino %ju absent from %ju due to offset %jd"
 			    " exceeding size %jd\n",
 			    (uintmax_t)child, (uintmax_t)parent, diroff,
 			    DIP(dip, di_size));
 		irelse(&ip);
 		return (0);
 	}
 	blk = ino_blkatoff(dip, parent, lbn, &frags, NULL);
 	irelse(&ip);
 	if (blk <= 0) {
 		if (debug)
 			printf("Sparse directory %ju", (uintmax_t)parent);
 		return (0);
 	}
 	bp = getdatablk(blk, blksize, BT_DIRDATA);
 	if (bp->b_errs != 0)
 		err_suj("ino_isat: UNRECOVERABLE I/O ERROR");
 	/*
 	 * Walk through the records from the start of the block to be
 	 * certain we hit a valid record and not some junk in the middle
 	 * of a file name.  Stop when we reach or pass the expected offset.
 	 */
 	dpoff = rounddown(doff, DIRBLKSIZ);
 	do {
 		dp = (struct direct *)&bp->b_un.b_buf[dpoff];
 		if (dpoff == doff)
 			break;
 		/* A zero record length would never advance: give up. */
 		if (dp->d_reclen == 0)
 			break;
 		dpoff += dp->d_reclen;
 	} while (dpoff <= doff);
 	if (dpoff > fs->fs_bsize)
 		err_suj("Corrupt directory block in dir ino %ju\n",
 		    (uintmax_t)parent);
 	/* Not found. */
 	if (dpoff != doff) {
 		if (debug)
 			printf("ino %ju not found in %ju, lbn %jd, dpoff %d\n",
 			    (uintmax_t)child, (uintmax_t)parent, lbn, dpoff);
 		brelse(bp);
 		return (0);
 	}
 	/*
 	 * We found the item in question.  Record the mode and whether it's
 	 * a . or .. link for the caller.
 	 */
 	if (dp->d_ino == child) {
 		if (child == parent)
 			*isdot = 1;
 		else if (dp->d_namlen == 2 &&
 		    dp->d_name[0] == '.' && dp->d_name[1] == '.')
 			*isdot = 1;
 		*mode = DTTOIF(dp->d_type);
 		brelse(bp);
 		return (1);
 	}
 	if (debug)
 		printf("ino %ju doesn't match dirent ino %ju in parent %ju\n",
 		    (uintmax_t)child, (uintmax_t)dp->d_ino, (uintmax_t)parent);
 	brelse(bp);
 	return (0);
 }
 
 /*
  * Flags for ino_visit() and indir_visit().  VISIT_INDIR makes
  * indir_visit() hand the indirect block itself to the visitor as well;
  * VISIT_EXT makes ino_visit() include the UFS2 extended attribute
  * blocks; VISIT_ROOT is added by ino_visit() before it descends into
  * the inode's own indirect pointers.
  */
 #define	VISIT_INDIR	0x0001
 #define	VISIT_EXT	0x0002
 #define	VISIT_ROOT	0x0004	/* Operation came via root & valid pointers. */
 
 /*
  * Read an indirect level which may or may not be linked into an inode.
  *
  * 'blk' is the indirect block, found at (negative) logical block 'lbn'
  * of inode 'ino'.  Every non-zero pointer in it is either handed to
  * 'visitor' (lowest level) or descended into recursively.  *frags is
  * increased by fs_frag for each block handed to the visitor.  With
  * VISIT_INDIR the indirect block itself is visited last, even when its
  * contents were judged unsafe to follow.
  */
 static void
 indir_visit(ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t blk, uint64_t *frags,
     ino_visitor visitor, int flags)
 {
 	struct bufarea *bp;
 	ufs_lbn_t lbnadd;
 	ufs2_daddr_t nblk;
 	ufs_lbn_t nlbn;
 	int level;
 	int i;
 
 	/*
 	 * Don't visit indirect blocks with contents we can't trust.  This
 	 * should only happen when indir_visit() is called to complete a
 	 * truncate that never finished and not when a pointer is found via
 	 * an inode.
 	 */
 	if (blk == 0)
 		return;
 	level = lbn_level(lbn);
 	if (level == -1)
 		err_suj("Invalid level for lbn %jd\n", lbn);
 	if ((flags & VISIT_ROOT) == 0 && blk_isindir(blk, ino, lbn) == 0) {
 		if (debug)
 			printf("blk %jd ino %ju lbn %jd(%d) is not indir.\n",
 			    blk, (uintmax_t)ino, lbn, level);
 		goto out;
 	}
 	/* lbnadd = NINDIR^level: lbns spanned by one pointer at this level. */
 	lbnadd = 1;
 	for (i = level; i > 0; i--)
 		lbnadd *= NINDIR(fs);
 	bp = getdatablk(blk, fs->fs_bsize, BT_LEVEL1 + level);
 	if (bp->b_errs != 0)
 		err_suj("indir_visit: UNRECOVERABLE I/O ERROR");
 	for (i = 0; i < NINDIR(fs); i++) {
 		if ((nblk = IBLK(bp, i)) == 0)
 			continue;
 		if (level == 0) {
 			/* Data block: visit it directly. */
 			nlbn = -lbn + i * lbnadd;
 			(*frags) += fs->fs_frag;
 			visitor(ino, nlbn, nblk, fs->fs_frag);
 		} else {
 			/* Lower level indirect: recurse with its own lbn. */
 			nlbn = (lbn + 1) - (i * lbnadd);
 			indir_visit(ino, nlbn, nblk, frags, visitor, flags);
 		}
 	}
 	brelse(bp);
 out:
 	if (flags & VISIT_INDIR) {
 		(*frags) += fs->fs_frag;
 		visitor(ino, lbn, blk, fs->fs_frag);
 	}
 }
 
 /*
  * Visit each block in an inode as specified by 'flags' and call a
  * callback function.  The callback may inspect or free blocks.  The
  * count of frags found according to the size in the file is returned.
  * This is not valid for sparse files but may be used to determine
  * the correct di_blocks for a file.
  *
  * 'dp' is the on-disk inode for 'ino'.  Extended attribute blocks are
  * visited first (only with VISIT_EXT on UFS2) using lbns -1 - i, then
  * the direct blocks, then each indirect tree through indir_visit().
  */
 static uint64_t
 ino_visit(union dinode *dp, ino_t ino, ino_visitor visitor, int flags)
 {
 	ufs_lbn_t nextlbn;
 	ufs_lbn_t tmpval;
 	ufs_lbn_t lbn;
 	uint64_t size;
 	uint64_t fragcnt;
 	int mode;
 	int frags;
 	int i;
 
 	size = DIP(dp, di_size);
 	mode = DIP(dp, di_mode) & IFMT;
 	fragcnt = 0;
 	if ((flags & VISIT_EXT) &&
 	    fs->fs_magic == FS_UFS2_MAGIC && dp->dp2.di_extsize) {
 		for (i = 0; i < UFS_NXADDR; i++) {
 			if (dp->dp2.di_extb[i] == 0)
 				continue;
 			frags = sblksize(fs, dp->dp2.di_extsize, i);
 			frags = numfrags(fs, frags);
 			fragcnt += frags;
 			visitor(ino, -1 - i, dp->dp2.di_extb[i], frags);
 		}
 	}
 	/* Skip datablocks for short links and devices. */
 	if (mode == IFBLK || mode == IFCHR ||
 	    (mode == IFLNK && size < fs->fs_maxsymlinklen))
 		return (fragcnt);
 	for (i = 0; i < UFS_NDADDR; i++) {
 		if (DIP(dp, di_db[i]) == 0)
 			continue;
 		/* The frag count of each direct block follows the file size. */
 		frags = sblksize(fs, size, i);
 		frags = numfrags(fs, frags);
 		fragcnt += frags;
 		visitor(ino, i, DIP(dp, di_db[i]), frags);
 	}
 	/*
 	 * We know the following indirects are real as we're following
 	 * real pointers to them.
 	 */
 	flags |= VISIT_ROOT;
 	/*
 	 * 'lbn' is the first data lbn covered by indirect tree i and
 	 * 'tmpval' the number of lbns that tree spans; the tree root is
 	 * visited at lbn -lbn - i.
 	 */
 	for (i = 0, tmpval = NINDIR(fs), lbn = UFS_NDADDR; i < UFS_NIADDR; i++,
 	    lbn = nextlbn) {
 		nextlbn = lbn + tmpval;
 		tmpval *= NINDIR(fs);
 		if (DIP(dp, di_ib[i]) == 0)
 			continue;
 		indir_visit(ino, -lbn - i, DIP(dp, di_ib[i]), &fragcnt, visitor,
 		    flags);
 	}
 	return (fragcnt);
 }
 
 /*
  * Visitor that frees nothing.  It is used when the caller only wants
  * blocks counted; its single effect is to remember in visitlbn the lbn
  * of the most recently visited block whose lbn is positive.
  */
 ufs_lbn_t visitlbn;
 static void
 null_visit(ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t blk, int frags)
 {
 	if (lbn <= 0)
 		return;
 	visitlbn = lbn;
 }
 
 /*
  * Recalculate di_blocks when we discover that a block allocation or
  * free was not successfully completed.  The kernel does not roll this back
  * because it would be too expensive to compute which indirects were
  * reachable at the time the inode was written.
  *
  * Works on the inode named by sino->si_ino.  Inodes with a zero mode
  * are left alone.  If the highest positive lbn seen lies in the
  * indirect range the inode is truncated with ino_trunc() instead of
  * having its block count rewritten.
  */
 static void
 ino_adjblks(struct suj_ino *sino)
 {
 	struct inode ip;
 	union dinode *dp;
 	uint64_t blocks;
 	uint64_t frags;
 	off_t isize;
 	off_t size;
 	ino_t ino;
 
 	ino = sino->si_ino;
 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	/* No need to adjust zero'd inodes. */
 	if (DIP(dp, di_mode) == 0) {
 		irelse(&ip);
 		return;
 	}
 	/*
 	 * Visit all blocks and count them as well as recording the last
 	 * valid lbn in the file.  If the file size doesn't agree with the
 	 * last lbn we need to truncate to fix it.  Otherwise just adjust
 	 * the blocks count.
 	 */
 	visitlbn = 0;
 	frags = ino_visit(dp, ino, null_visit, VISIT_INDIR | VISIT_EXT);
 	blocks = fsbtodb(fs, frags);
 	/*
 	 * We assume the size and direct block list is kept coherent by
 	 * softdep.  For files that have extended into indirects we truncate
 	 * to the size in the inode or the maximum size permitted by
 	 * populated indirects.
 	 */
 	if (visitlbn >= UFS_NDADDR) {
 		isize = DIP(dp, di_size);
 		size = lblktosize(fs, visitlbn + 1);
 		if (isize > size)
 			isize = size;
 		/* Always truncate to free any unpopulated indirects. */
 		ino_trunc(ino, isize);
 		irelse(&ip);
 		return;
 	}
 	/* Nothing to write when the recomputed count already matches. */
 	if (blocks == DIP(dp, di_blocks)) {
 		irelse(&ip);
 		return;
 	}
 	if (debug)
 		printf("ino %ju adjusting block count from %jd to %jd\n",
 		    (uintmax_t)ino, DIP(dp, di_blocks), blocks);
 	DIP_SET(dp, di_blocks, blocks);
 	inodirty(&ip);
 	irelse(&ip);
 }
 
 /*
  * Visitor that frees the visited block, leaving out any frags that
  * blk_freemask() reports as reused.
  */
 static void
 blk_free_visit(ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t blk, int frags)
 {
 	int mask;

 	mask = blk_freemask(blk, ino, lbn, frags);
 	blk_free(ino, blk, mask, frags);
 }
 
 /*
  * Free a block, or a whole tree of blocks, that used to be rooted in
  * 'ino' at logical block 'lbn'.  The tree is walked, freeing every
  * child and then the indirect itself, only when 'lbn' is in the
  * indirect range, 'follow' is set and no frag of the block has been
  * reused; in every other case just the block is freed, honouring the
  * reuse mask.
  */
 static void
 blk_free_lbn(ufs2_daddr_t blk, ino_t ino, ufs_lbn_t lbn, int frags, int follow)
 {
 	uint64_t resid;
 	int mask;

 	mask = blk_freemask(blk, ino, lbn, frags);
 	if (mask != 0 || !follow || lbn > -UFS_NDADDR) {
 		blk_free(ino, blk, mask, frags);
 		return;
 	}
 	resid = 0;
 	indir_visit(ino, lbn, blk, &resid, blk_free_visit, VISIT_INDIR);
 }
 
 /*
  * Set si_skipparent on 'sino' when the entry at DOTDOT_OFFSET in the
  * directory sino->si_ino refers to 'parent'.
  */
 static void
 ino_setskip(struct suj_ino *sino, ino_t parent)
 {
 	int mode, isdot;

 	if (ino_isat(sino->si_ino, DOTDOT_OFFSET, parent, &mode, &isdot) == 0)
 		return;
 	sino->si_skipparent = 1;
 }
 
 /*
  * Account for the loss of the directory entry at offset 'diroff' of
  * directory 'parent' that referred to 'child'.  'isdotdot' is non-zero
  * when the entry being removed is a ".." entry.
  *
  * Depending on what the journal knows about 'child' the on-disk link
  * count is dropped directly, the in-core count is dropped and applied
  * with ino_adjust(), or the loss is remembered in si_nlinkadj.
  */
 static void
 ino_remref(ino_t parent, ino_t child, uint64_t diroff, int isdotdot)
 {
 	struct suj_ino *sino;
 	struct suj_rec *srec;
 	struct jrefrec *rrec;
 
 	/*
 	 * Lookup this inode to see if we have a record for it.
 	 */
 	sino = ino_lookup(child, 0);
 	/*
 	 * Tell any child directories we've already removed their
 	 * parent link cnt.  Don't try to adjust our link down again.
 	 */
 	if (sino != NULL && isdotdot == 0)
 		ino_setskip(sino, parent);
 	/*
 	 * No valid record for this inode.  Just drop the on-disk
 	 * link by one.
 	 */
 	if (sino == NULL || sino->si_hasrecs == 0) {
 		ino_decr(child);
 		return;
 	}
 	/*
 	 * Use ino_adjust() if ino_check() has already processed this
 	 * child.  If we lose the last non-dot reference to a
 	 * directory it will be discarded.
 	 */
 	if (sino->si_linkadj) {
 		/*
 		 * The inode number is printed as uintmax_t, like the
 		 * other messages in this file, so the argument always
 		 * matches its conversion whatever the width of ino_t.
 		 */
 		if (sino->si_nlink == 0)
 			err_suj("ino_remref: ino %ju mode 0%o about to go "
 			    "negative\n", (uintmax_t)sino->si_ino,
 			    sino->si_mode);
 		sino->si_nlink--;
 		if (isdotdot)
 			sino->si_dotlinks--;
 		ino_adjust(sino);
 		return;
 	}
 	/*
 	 * If we haven't yet processed this inode we need to make
 	 * sure we will successfully discover the lost path.  If not
 	 * use nlinkadj to remember.
 	 */
 	TAILQ_FOREACH(srec, &sino->si_recs, sr_next) {
 		rrec = (struct jrefrec *)srec->sr_rec;
 		if (rrec->jr_parent == parent &&
 		    rrec->jr_diroff == diroff)
 			return;
 	}
 	sino->si_nlinkadj++;
 }
 
 /*
  * Free the children of a directory when the directory is discarded.
  *
  * Visitor called for each data block of directory 'ino': 'lbn' is the
  * block's logical block number, 'blk' its address and 'frags' its
  * length in frags.  Every entry other than empty ones, whiteouts and
  * "." has its reference dropped through ino_remref(); ".." is skipped
  * as well when the directory's si_skipparent is set.
  */
 static void
 ino_free_children(ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t blk, int frags)
 {
 	struct suj_ino *sino;
 	struct bufarea *bp;
 	struct direct *dp;
 	off_t diroff;
 	int skipparent;
 	int isdotdot;
 	int dpoff;
 	int size;
 
 	sino = ino_lookup(ino, 0);
 	if (sino)
 		skipparent = sino->si_skipparent;
 	else
 		skipparent = 0;
 	size = lfragtosize(fs, frags);
 	bp = getdatablk(blk, size, BT_DIRDATA);
 	if (bp->b_errs != 0)
 		err_suj("ino_free_children: UNRECOVERABLE I/O ERROR");
 	dp = (struct direct *)&bp->b_un.b_buf[0];
 	/* The walk ends at the block end or at a zero record length. */
 	for (dpoff = 0; dpoff < size && dp->d_reclen; dpoff += dp->d_reclen) {
 		dp = (struct direct *)&bp->b_un.b_buf[dpoff];
 		if (dp->d_ino == 0 || dp->d_ino == UFS_WINO)
 			continue;
 		if (dp->d_namlen == 1 && dp->d_name[0] == '.')
 			continue;
 		isdotdot = dp->d_namlen == 2 && dp->d_name[0] == '.' &&
 		    dp->d_name[1] == '.';
 		if (isdotdot && skipparent == 1)
 			continue;
 		if (debug)
 			printf("Directory %ju removing ino %ju name %s\n",
 			    (uintmax_t)ino, (uintmax_t)dp->d_ino, dp->d_name);
 		/* Offset of the entry within the whole directory. */
 		diroff = lblktosize(fs, lbn) + dpoff;
 		ino_remref(ino, dp->d_ino, diroff, isdotdot);
 	}
 	brelse(bp);
 }
 
 /*
  * Reclaim inode 'ino', whose in-core copy is 'ip': drop the references
  * held by a directory's entries, free every block, zero the on-disk
  * inode while keeping its generation number, and give the inode back
  * to the cg.  'mode' is passed on to ino_free().  Asking to reclaim the
  * root inode ends the journal check through err_suj().
  */
 static void
 ino_reclaim(struct inode *ip, ino_t ino, int mode)
 {
 	union dinode *dp;
 	size_t dinosize;
 	uint32_t gen;

 	dp = ip->i_dp;
 	if (ino == UFS_ROOTINO)
 		err_suj("Attempting to free UFS_ROOTINO\n");
 	if (debug)
 		printf("Truncating and freeing ino %ju, nlink %d, mode %o\n",
 		    (uintmax_t)ino, DIP(dp, di_nlink), DIP(dp, di_mode));
 
 	/* A directory first releases the links its entries hold. */
 	if ((DIP(dp, di_mode) & IFMT) == IFDIR)
 		ino_visit(dp, ino, ino_free_children, 0);
 	DIP_SET(dp, di_nlink, 0);
 	if ((DIP(dp, di_flags) & SF_SNAPSHOT) != 0)
 		snapremove(ino);
 	ino_visit(dp, ino, blk_free_visit, VISIT_EXT | VISIT_INDIR);
 	/* Clear the dinode, carrying the generation number across. */
 	gen = DIP(dp, di_gen);
 	dinosize = (fs->fs_magic == FS_UFS1_MAGIC) ?
 	    sizeof(struct ufs1_dinode) : sizeof(struct ufs2_dinode);
 	memset(dp, 0, dinosize);
 	DIP_SET(dp, di_gen, gen);
 	inodirty(ip);
 	ino_free(ino, mode);
 }
 
 /*
  * Adjust an inode's link count down by one when a directory goes away.
  *
  * The on-disk count of 'ino' is decremented.  If that leaves the inode
  * with fewer links than it needs to live (2 for a directory, 1 for
  * anything else) it is reclaimed instead.  An inode that already has no
  * links, or has a zero mode, ends the journal check through err_suj().
  */
 static void
 ino_decr(ino_t ino)
 {
 	struct inode ip;
 	union dinode *dp;
 	int reqlink;
 	int nlink;
 	int mode;
 
 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	nlink = DIP(dp, di_nlink);
 	mode = DIP(dp, di_mode);
 	/*
 	 * Inode numbers are printed as uintmax_t, like the other messages
 	 * in this file, so the argument always matches its conversion
 	 * whatever the width of ino_t.
 	 */
 	if (nlink < 1)
 		err_suj("Inode %ju link count %d invalid\n", (uintmax_t)ino,
 		    nlink);
 	if (mode == 0)
 		err_suj("Inode %ju has a link of %d with 0 mode\n",
 		    (uintmax_t)ino, nlink);
 	nlink--;
 	if ((mode & IFMT) == IFDIR)
 		reqlink = 2;
 	else
 		reqlink = 1;
 	if (nlink < reqlink) {
 		if (debug)
 			printf("ino %ju not enough links to live %d < %d\n",
 			    (uintmax_t)ino, nlink, reqlink);
 		ino_reclaim(&ip, ino, mode);
 		irelse(&ip);
 		return;
 	}
 	DIP_SET(dp, di_nlink, nlink);
 	inodirty(&ip);
 	irelse(&ip);
 }
 
 /*
  * Adjust the inode link count to 'nlink'.  If the count reaches zero
  * free it.
  *
  * 'nlink' is sino->si_nlink, the count worked out from the journal for
  * inode sino->si_ino.  Directories that have lost all of their real
  * names are forced to zero links first.  The on-disk inode is then
  * released in the bitmap (zero mode), reclaimed (too few links),
  * left alone (count already right) or rewritten with the new count.
  */
 static void
 ino_adjust(struct suj_ino *sino)
 {
 	struct jrefrec *rrec;
 	struct suj_rec *srec;
 	struct suj_ino *stmp;
 	union dinode *dp;
 	struct inode ip;
 	nlink_t nlink;
 	nlink_t reqlink;
 	int recmode;
 	int isdot;
 	int mode;
 	ino_t ino;
 
 	nlink = sino->si_nlink;
 	ino = sino->si_ino;
 	mode = sino->si_mode & IFMT;
 	/*
 	 * If it's a directory with no dot links, it was truncated before
 	 * the name was cleared.  We need to clear the dirent that
 	 * points at it.
 	 */
 	if (mode == IFDIR && nlink == 1 && sino->si_dotlinks == 0) {
 		sino->si_nlink = nlink = 0;
 		/* Clear the first recorded name that is still on disk. */
 		TAILQ_FOREACH(srec, &sino->si_recs, sr_next) {
 			rrec = (struct jrefrec *)srec->sr_rec;
 			if (ino_isat(rrec->jr_parent, rrec->jr_diroff, ino,
 			    &recmode, &isdot) == 0)
 				continue;
 			ino_clrat(rrec->jr_parent, rrec->jr_diroff, ino);
 			break;
 		}
 		if (srec == NULL)
 			errx(1, "Directory %ju name not found", (uintmax_t)ino);
 	}
 	/*
 	 * If it's a directory with no real names pointing to it go ahead
 	 * and truncate it.  This will free any children.
 	 */
 	if (mode == IFDIR && nlink - sino->si_dotlinks == 0) {
 		sino->si_nlink = nlink = 0;
 		/*
 		 * Mark any .. links so they know not to free this inode
 		 * when they are removed.
 		 */
 		TAILQ_FOREACH(srec, &sino->si_recs, sr_next) {
 			rrec = (struct jrefrec *)srec->sr_rec;
 			if (rrec->jr_diroff == DOTDOT_OFFSET) {
 				stmp = ino_lookup(rrec->jr_parent, 0);
 				if (stmp)
 					ino_setskip(stmp, ino);
 			}
 		}
 	}
 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	/* From here on 'mode' is the file type stored in the inode. */
 	mode = DIP(dp, di_mode) & IFMT;
 	if (nlink > UFS_LINK_MAX)
 		err_suj("ino %ju nlink manipulation error, new %ju, old %d\n",
 		    (uintmax_t)ino, (uintmax_t)nlink, DIP(dp, di_nlink));
 	if (debug)
 	       printf("Adjusting ino %ju, nlink %ju, old link %d lastmode %o\n",
 		    (uintmax_t)ino, (uintmax_t)nlink, DIP(dp, di_nlink),
 		    sino->si_mode);
 	if (mode == 0) {
 		if (debug)
 			printf("ino %ju, zero inode freeing bitmap\n",
 			    (uintmax_t)ino);
 		ino_free(ino, sino->si_mode);
 		irelse(&ip);
 		return;
 	}
 	/* XXX Should be an assert? */
 	if (mode != sino->si_mode && debug)
 		printf("ino %ju, mode %o != %o\n",
 		    (uintmax_t)ino, mode, sino->si_mode);
 	if ((mode & IFMT) == IFDIR)
 		reqlink = 2;
 	else
 		reqlink = 1;
 	/* If the inode doesn't have enough links to live, free it. */
 	if (nlink < reqlink) {
 		if (debug)
 			printf("ino %ju not enough links to live %ju < %ju\n",
 			    (uintmax_t)ino, (uintmax_t)nlink,
 			    (uintmax_t)reqlink);
 		ino_reclaim(&ip, ino, mode);
 		irelse(&ip);
 		return;
 	}
 	/* If required write the updated link count. */
 	if (DIP(dp, di_nlink) == nlink) {
 		if (debug)
 			printf("ino %ju, link matches, skipping.\n",
 			    (uintmax_t)ino);
 		irelse(&ip);
 		return;
 	}
 	DIP_SET(dp, di_nlink, nlink);
 	inodirty(&ip);
 	irelse(&ip);
 }
 
 /*
  * Truncate some or all blocks in an indirect, freeing any that are required
  * and zeroing the indirect.
  *
  * 'blk' is the indirect block found at (negative) lbn 'lbn' of inode
  * 'ino'.  Pointers that cover only lbns below 'lastlbn' are kept; the
  * others are freed with blk_free() and zeroed in the indirect, which is
  * dirtied only if something changed.  'dp' is only handed on to the
  * recursive calls.
  */
 static void
 indir_trunc(ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t blk, ufs_lbn_t lastlbn,
 	union dinode *dp)
 {
 	struct bufarea *bp;
 	ufs_lbn_t lbnadd;
 	ufs2_daddr_t nblk;
 	ufs_lbn_t next;
 	ufs_lbn_t nlbn;
 	int isdirty;
 	int level;
 	int i;
 
 	if (blk == 0)
 		return;
 	isdirty = 0;
 	level = lbn_level(lbn);
 	if (level == -1)
 		err_suj("Invalid level for lbn %jd\n", lbn);
 	/* lbnadd = NINDIR^level: lbns spanned by one pointer at this level. */
 	lbnadd = 1;
 	for (i = level; i > 0; i--)
 		lbnadd *= NINDIR(fs);
 	bp = getdatablk(blk, fs->fs_bsize, BT_LEVEL1 + level);
 	if (bp->b_errs != 0)
 		err_suj("indir_trunc: UNRECOVERABLE I/O ERROR");
 	for (i = 0; i < NINDIR(fs); i++) {
 		if ((nblk = IBLK(bp, i)) == 0)
 			continue;
 		if (level != 0) {
 			nlbn = (lbn + 1) - (i * lbnadd);
 			/*
 			 * Calculate the lbn of the next indirect to
 			 * determine if any of this indirect must be
 			 * reclaimed.
 			 */
 			next = -(lbn + level) + ((i+1) * lbnadd);
 			if (next <= lastlbn)
 				continue;
 			indir_trunc(ino, nlbn, nblk, lastlbn, dp);
 			/* If all of this indirect was reclaimed, free it. */
 			nlbn = next - lbnadd;
 			if (nlbn < lastlbn)
 				continue;
 		} else {
 			/* Data pointer: keep it if it is below the cut. */
 			nlbn = -lbn + i * lbnadd;
 			if (nlbn < lastlbn)
 				continue;
 		}
 		isdirty = 1;
 		blk_free(ino, nblk, 0, fs->fs_frag);
 		IBLK_SET(bp, i, 0);
 	}
 	if (isdirty)
 		dirty(bp);
 	brelse(bp);
 }
 
 /*
  * Truncate an inode to the minimum of the given size or the last populated
  * block after any over size have been discarded.  The kernel would allocate
  * the last block in the file but fsck does not and neither do we.  This
  * code never extends files, only shrinks them.
  *
  * ino is the inode number and size the requested new length in bytes.
  * Nothing is done when the size is unchanged, when the request would grow
  * the file, or for inodes with mode 0, devices and short symlinks.  A
  * snapshot file may only be truncated to zero; anything else is reported
  * through err_suj().
  */
 static void
 ino_trunc(ino_t ino, off_t size)
 {
 	struct inode ip;
 	union dinode *dp;
 	struct bufarea *bp;
 	ufs2_daddr_t bn;
 	uint64_t totalfrags;
 	ufs_lbn_t nextlbn;
 	ufs_lbn_t lastlbn;
 	ufs_lbn_t tmpval;
 	ufs_lbn_t lbn;
 	ufs_lbn_t i;
 	int blksize, frags;
 	off_t cursize;
 	off_t off;
 	int mode;
 
 	ginode(ino, &ip);
 	dp = ip.i_dp;
 	mode = DIP(dp, di_mode) & IFMT;
 	cursize = DIP(dp, di_size);
 	/* If no size change, nothing to do */
 	if (size == cursize) {
 		irelse(&ip);
 		return;
 	}
 	if (debug)
 		printf("Truncating ino %ju, mode %o to size %jd from size %jd\n",
 		    (uintmax_t)ino, mode, size, cursize);
 
 	/* Skip datablocks for short links and devices. */
 	if (mode == 0 || mode == IFBLK || mode == IFCHR ||
 	    (mode == IFLNK && cursize < fs->fs_maxsymlinklen)) {
 		irelse(&ip);
 		return;
 	}
 	/* Don't extend. */
 	if (size > cursize) {
 		irelse(&ip);
 		return;
 	}
 	if ((DIP(dp, di_flags) & SF_SNAPSHOT) != 0) {
 		if (size > 0)
 			err_suj("Partial truncation of ino %ju snapshot file\n",
 			    (uintmax_t)ino);
 		snapremove(ino);
 	}
 	/* First logical block that lies wholly beyond the new size. */
 	lastlbn = lblkno(fs, blkroundup(fs, size));
 	/* Release the direct blocks at or past lastlbn. */
 	for (i = lastlbn; i < UFS_NDADDR; i++) {
 		if ((bn = DIP(dp, di_db[i])) == 0)
 			continue;
 		blksize = sblksize(fs, cursize, i);
 		blk_free(ino, bn, 0, numfrags(fs, blksize));
 		DIP_SET(dp, di_db[i], 0);
 	}
 	/*
 	 * Follow indirect blocks, freeing anything required.
 	 */
 	for (i = 0, tmpval = NINDIR(fs), lbn = UFS_NDADDR; i < UFS_NIADDR; i++,
 	    lbn = nextlbn) {
 		nextlbn = lbn + tmpval;
 		tmpval *= NINDIR(fs);
 		/* If we're not freeing any in this indirect range skip it. */
 		if (lastlbn >= nextlbn)
 			continue;
 		if ((bn = DIP(dp, di_ib[i])) == 0)
 			continue;
 		indir_trunc(ino, -lbn - i, bn, lastlbn, dp);
 		/* If we freed everything in this indirect free the indir. */
 		if (lastlbn > lbn)
 			continue;
 		blk_free(ino, bn, 0, fs->fs_frag);
 		DIP_SET(dp, di_ib[i], 0);
 	}
 	/*
 	 * Now that we've freed any whole blocks that exceed the desired
 	 * truncation size, figure out how many blocks remain and what the
 	 * last populated lbn is.  We will set the size to this last lbn
 	 * rather than worrying about allocating the final lbn as the kernel
 	 * would've done.  This is consistent with normal fsck behavior.
 	 */
 	visitlbn = 0;
 	totalfrags = ino_visit(dp, ino, null_visit, VISIT_INDIR | VISIT_EXT);
 	if (size > lblktosize(fs, visitlbn + 1))
 		size = lblktosize(fs, visitlbn + 1);
 	/*
 	 * If we're truncating direct blocks we have to adjust frags
 	 * accordingly.
 	 */
 	if (visitlbn < UFS_NDADDR && totalfrags) {
 		long oldspace, newspace;
 
 		bn = DIP(dp, di_db[visitlbn]);
 		if (bn == 0)
 			err_suj("Bad blk at ino %ju lbn %jd\n",
 			    (uintmax_t)ino, visitlbn);
 		oldspace = sblksize(fs, cursize, visitlbn);
 		newspace = sblksize(fs, size, visitlbn);
 		if (oldspace != newspace) {
 			/* Free only the fragments past the new tail. */
 			bn += numfrags(fs, newspace);
 			frags = numfrags(fs, oldspace - newspace);
 			blk_free(ino, bn, 0, frags);
 			totalfrags -= frags;
 		}
 	}
 	DIP_SET(dp, di_blocks, fsbtodb(fs, totalfrags));
 	DIP_SET(dp, di_size, size);
 	inodirty(&ip);
 	/*
 	 * If we've truncated into the middle of a block or frag we have
 	 * to zero it here.  Otherwise the file could extend into
 	 * uninitialized space later.
 	 *
 	 * The file type must be extracted with IFMT before comparing with
 	 * IFDIR; the raw di_mode also carries the permission bits and would
 	 * never compare equal for a real directory.
 	 */
 	off = blkoff(fs, size);
 	if (off && (DIP(dp, di_mode) & IFMT) != IFDIR) {
 		long clrsize;
 
 		bn = ino_blkatoff(dp, ino, visitlbn, &frags, NULL);
 		if (bn == 0)
 			err_suj("Block missing from ino %ju at lbn %jd\n",
 			    (uintmax_t)ino, visitlbn);
 		clrsize = frags * fs->fs_fsize;
 		bp = getdatablk(bn, clrsize, BT_DATA);
 		if (bp->b_errs != 0)
 			err_suj("ino_trunc: UNRECOVERABLE I/O ERROR");
 		/* Clear from the new end of file to the end of the block. */
 		clrsize -= off;
 		bzero(&bp->b_un.b_buf[off], clrsize);
 		dirty(bp);
 		brelse(bp);
 	}
 	irelse(&ip);
 }
 
 /*
  * Process records available for one inode and determine whether the
  * link count is correct or needs adjusting.
  *
  * The result is stored in sino (si_nlink, si_dotlinks, si_mode, with
  * si_linkadj set) and then applied by ino_adjust().  Inodes without
  * records (si_hasrecs == 0) are left alone.
  */
 static void
 ino_check(struct suj_ino *sino)
 {
 	struct suj_rec *srec;
 	struct jrefrec *rrec;
 	nlink_t dotlinks;
 	nlink_t newlinks;
 	nlink_t removes;
 	nlink_t nlink;
 	ino_t ino;
 	int isdot;
 	int isat;
 	int mode;
 
 	if (sino->si_hasrecs == 0)
 		return;
 	ino = sino->si_ino;
 	/* The starting link count comes from the first record on the list. */
 	rrec = (struct jrefrec *)TAILQ_FIRST(&sino->si_recs)->sr_rec;
 	nlink = rrec->jr_nlink;
 	newlinks = 0;
 	dotlinks = 0;
 	/* Removes already accounted for elsewhere seed the counter. */
 	removes = sino->si_nlinkadj;
 	TAILQ_FOREACH(srec, &sino->si_recs, sr_next) {
 		rrec = (struct jrefrec *)srec->sr_rec;
 		/*
 		 * isat is added to newlinks below, so it is treated as
 		 * "a directory entry for this inode exists at
 		 * (jr_parent, jr_diroff)"; mode and isdot are outputs.
 		 */
 		isat = ino_isat(rrec->jr_parent, rrec->jr_diroff,
 		    rrec->jr_ino, &mode, &isdot);
 		if (isat && (mode & IFMT) != (rrec->jr_mode & IFMT))
 			err_suj("Inode mode/directory type mismatch %o != %o\n",
 			    mode, rrec->jr_mode);
 		if (debug)
 			printf("jrefrec: op %d ino %ju, nlink %ju, parent %ju, "
 			    "diroff %jd, mode %o, isat %d, isdot %d\n",
 			    rrec->jr_op, (uintmax_t)rrec->jr_ino,
 			    (uintmax_t)rrec->jr_nlink,
 			    (uintmax_t)rrec->jr_parent,
 			    (uintmax_t)rrec->jr_diroff,
 			    rrec->jr_mode, isat, isdot);
 		/* From here on the journaled mode is authoritative. */
 		mode = rrec->jr_mode & IFMT;
 		if (rrec->jr_op == JOP_REMREF)
 			removes++;
 		newlinks += isat;
 		if (isdot)
 			dotlinks += isat;
 	}
 	/*
 	 * The number of links that remain are the starting link count
 	 * subtracted by the total number of removes with the total
 	 * links discovered back in.  An incomplete remove thus
 	 * makes no change to the link count but an add increases
 	 * by one.
 	 */
 	if (debug)
 		printf(
 		    "ino %ju nlink %ju newlinks %ju removes %ju dotlinks %ju\n",
 		    (uintmax_t)ino, (uintmax_t)nlink, (uintmax_t)newlinks,
 		    (uintmax_t)removes, (uintmax_t)dotlinks);
 	nlink += newlinks;
 	nlink -= removes;
 	/* Publish the results; si_mode is the mode of the last record. */
 	sino->si_linkadj = 1;
 	sino->si_nlink = nlink;
 	sino->si_dotlinks = dotlinks;
 	sino->si_mode = mode;
 	ino_adjust(sino);
 }
 
 /*
  * Process records available for one block and determine whether it is
  * still allocated and whether the owning inode needs to be updated or
  * a free completed.
  *
  * Every inode named by a record gets si_blkadj set so that its block
  * count is recomputed later.
  */
 static void
 blk_check(struct suj_blk *sblk)
 {
 	struct suj_rec *srec;
 	struct jblkrec *brec;
 	struct suj_ino *sino;
 	ufs2_daddr_t blk;
 	int mask;
 	int frags;
 	int isat;
 
 	/*
 	 * Each suj_blk actually contains records for any fragments in that
 	 * block.  As a result we must evaluate each record individually.
 	 */
 	sino = NULL;
 	TAILQ_FOREACH(srec, &sblk->sb_recs, sr_next) {
 		brec = (struct jblkrec *)srec->sr_rec;
 		frags = brec->jb_frags;
 		/* jb_oldfrags was rewritten by blk_build() to a frag offset. */
 		blk = brec->jb_blkno + brec->jb_oldfrags;
 		/* frags is in/out: on return it is compared with jb_frags. */
 		isat = blk_isat(brec->jb_ino, brec->jb_lbn, blk, &frags);
 		/* Cache the last inode looked up to avoid repeated lookups. */
 		if (sino == NULL || sino->si_ino != brec->jb_ino) {
 			sino = ino_lookup(brec->jb_ino, 1);
 			sino->si_blkadj = 1;
 		}
 		if (debug)
 			printf("op %d blk %jd ino %ju lbn %jd frags %d isat %d (%d)\n",
 			    brec->jb_op, blk, (uintmax_t)brec->jb_ino,
 			    brec->jb_lbn, brec->jb_frags, isat, frags);
 		/*
 		 * If we found the block at this address we still have to
 		 * determine if we need to free the tail end that was
 		 * added by adding contiguous fragments from the same block.
 		 */
 		if (isat == 1) {
 			if (frags == brec->jb_frags)
 				continue;
 			mask = blk_freemask(blk, brec->jb_ino, brec->jb_lbn,
 			    brec->jb_frags);
 			/* Drop the leading frags that are still in use. */
 			mask >>= frags;
 			blk += frags;
 			frags = brec->jb_frags - frags;
 			blk_free(brec->jb_ino, blk, mask, frags);
 			continue;
 		}
 		/*
 		 * The block wasn't found, attempt to free it.  It won't be
 		 * freed if it was actually reallocated.  If this was an
 		 * allocation we don't want to follow indirects as they
 		 * may not be written yet.  Any children of the indirect will
 		 * have their own records.  If it's a free we need to
 		 * recursively free children.
 		 */
 		blk_free_lbn(blk, brec->jb_ino, brec->jb_lbn, brec->jb_frags,
 		    brec->jb_op == JOP_FREEBLK);
 	}
 }
 
 /*
  * Walk the list of inode records for this cg and resolve moved and duplicate
  * inode references now that we have a complete picture.
  */
 static void
 cg_build(struct suj_cg *sc)
 {
 	struct suj_ino *sino;
 	int i;
 
 	for (i = 0; i < HASHSIZE; i++)
 		LIST_FOREACH(sino, &sc->sc_inohash[i], si_next)
 			ino_build(sino);
 }
 
 /*
  * Apply pending truncations for the inodes of this cylinder group.  This
  * has to happen before any inode is looked up in a directory.  An inode
  * that was truncated has its block adjustment flag cleared; any other
  * inode flagged for block adjustment is handed to ino_adjblks().
  */
 static void
 cg_trunc(struct suj_cg *sc)
 {
 	struct suj_ino *cur;
 	int bucket;
 
 	for (bucket = 0; bucket < HASHSIZE; bucket++) {
 		LIST_FOREACH(cur, &sc->sc_inohash[bucket], si_next) {
 			if (cur->si_trunc != NULL) {
 				ino_trunc(cur->si_ino, cur->si_trunc->jt_size);
 				cur->si_trunc = NULL;
 				cur->si_blkadj = 0;
 			}
 			if (!cur->si_blkadj)
 				continue;
 			ino_adjblks(cur);
 		}
 	}
 }
 
 /*
  * Recompute block counts for every inode of this cylinder group that has
  * been flagged with si_blkadj.
  */
 static void
 cg_adj_blk(struct suj_cg *sc)
 {
 	struct suj_ino *cur;
 	int bucket;
 
 	bucket = 0;
 	while (bucket < HASHSIZE) {
 		LIST_FOREACH(cur, &sc->sc_inohash[bucket], si_next) {
 			if (!cur->si_blkadj)
 				continue;
 			ino_adjblks(cur);
 		}
 		bucket++;
 	}
 }
 
 /*
  * Free any partially allocated blocks and then resolve inode block
  * counts.
  */
 static void
 cg_check_blk(struct suj_cg *sc)
 {
 	struct suj_blk *sblk;
 	int i;
 
 
 	for (i = 0; i < HASHSIZE; i++)
 		LIST_FOREACH(sblk, &sc->sc_blkhash[i], sb_next)
 			blk_check(sblk);
 }
 
 /*
  * Walk the list of inode records for this cg, recovering any
  * changes which were not complete at the time of crash.
  */
 static void
 cg_check_ino(struct suj_cg *sc)
 {
 	struct suj_ino *sino;
 	int i;
 
 	for (i = 0; i < HASHSIZE; i++)
 		LIST_FOREACH(sino, &sc->sc_inohash[i], si_next)
 			ino_check(sino);
 }
 
 static void
 cg_apply(void (*apply)(struct suj_cg *))
 {
 	struct suj_cg *scg;
 	int i;
 
 	for (i = 0; i < HASHSIZE; i++)
 		LIST_FOREACH(scg, &cghash[i], sc_next)
 			apply(scg);
 }
 
 /*
  * Walk the chain of unlinked but still referenced inodes that starts at
  * fs->fs_sujfree.  The chain is detached from the superblock, each
  * inode's di_freelink is cleared, and every inode whose link count is
  * zero is reclaimed.
  */
 static void
 ino_unlinked(void)
 {
 	struct inode ip;
 	union dinode *dp;
 	uint16_t mode;
 	ino_t following;
 	ino_t ino;
 
 	ino = fs->fs_sujfree;
 	fs->fs_sujfree = 0;
 	for (; ino != 0; ino = following) {
 		ginode(ino, &ip);
 		dp = ip.i_dp;
 		mode = DIP(dp, di_mode) & IFMT;
 		/* Remember the successor before severing the link. */
 		following = DIP(dp, di_freelink);
 		DIP_SET(dp, di_freelink, 0);
 		inodirty(&ip);
 		/*
 		 * XXX Should this be an errx?
 		 */
 		if (DIP(dp, di_nlink) != 0) {
 			if (debug)
 				printf("Skipping ino %ju mode %o with link %d\n",
 				    (uintmax_t)ino, mode, DIP(dp, di_nlink));
 		} else {
 			if (debug)
 				printf("Freeing unlinked ino %ju mode %o\n",
 				    (uintmax_t)ino, mode);
 			ino_reclaim(&ip, ino, mode);
 		}
 		irelse(&ip);
 	}
 }
 
 /*
  * Queue a journal reference record (add, remove or move) on the
  * si_newrecs list of the inode it names, creating the inode record if
  * necessary, and note that the inode now has records.
  */
 static void
 ino_append(union jrec *rec)
 {
 	struct jrefrec *ref;
 	struct jmvrec *mv;
 	struct suj_ino *sino;
 	struct suj_rec *entry;
 
 	ref = &rec->rec_jrefrec;
 	mv = &rec->rec_jmvrec;
 	if (debug) {
 		if (mv->jm_op == JOP_MVREF) {
 			printf("ino move: ino %ju, parent %ju, "
 			    "diroff %jd, oldoff %jd\n",
 			    (uintmax_t)mv->jm_ino, (uintmax_t)mv->jm_parent,
 			    (uintmax_t)mv->jm_newoff,
 			    (uintmax_t)mv->jm_oldoff);
 		} else if (ref->jr_op == JOP_ADDREF ||
 		    ref->jr_op == JOP_REMREF) {
 			printf("ino ref: op %d, ino %ju, nlink %ju, "
 			    "parent %ju, diroff %jd\n",
 			    ref->jr_op, (uintmax_t)ref->jr_ino,
 			    (uintmax_t)ref->jr_nlink,
 			    (uintmax_t)ref->jr_parent,
 			    (uintmax_t)ref->jr_diroff);
 		}
 	}
 	/* The record is viewed as a jrefrec to fetch the inode number. */
 	sino = ino_lookup(ref->jr_ino, 1);
 	sino->si_hasrecs = 1;
 	entry = errmalloc(sizeof(*entry));
 	entry->sr_rec = rec;
 	TAILQ_INSERT_TAIL(&sino->si_newrecs, entry, sr_next);
 }
 
 /*
  * Add a reference adjustment to the sino list and eliminate dups.  The
  * primary loop in ino_build_ref() checks for dups but new ones may be
  * created as a result of offset adjustments.
  *
  * srec is appended to sino->si_recs only when no existing record names the
  * same (parent, diroff).  Otherwise srec itself is not linked anywhere;
  * NOTE(review): it is not freed here either, so the caller's wrapper is
  * presumably leaked deliberately -- confirm.
  */
 static void
 ino_add_ref(struct suj_ino *sino, struct suj_rec *srec)
 {
 	struct jrefrec *refrec;
 	struct suj_rec *srn;
 	struct jrefrec *rrn;
 
 	refrec = (struct jrefrec *)srec->sr_rec;
 	/*
 	 * We walk backwards so that the oldest link count is preserved.  If
 	 * an add record conflicts with a remove keep the remove.  Redundant
 	 * removes are eliminated in ino_build_ref.  Otherwise we keep the
 	 * oldest record at a given location.
 	 */
 	for (srn = TAILQ_LAST(&sino->si_recs, srechd); srn;
 	    srn = TAILQ_PREV(srn, srechd, sr_next)) {
 		rrn = (struct jrefrec *)srn->sr_rec;
 		/* Only records for the same directory slot can collide. */
 		if (rrn->jr_parent != refrec->jr_parent ||
 		    rrn->jr_diroff != refrec->jr_diroff)
 			continue;
 		/*
 		 * Existing remove, or new add: keep the existing record and
 		 * only refresh its mode from the newer one.
 		 */
 		if (rrn->jr_op == JOP_REMREF || refrec->jr_op == JOP_ADDREF) {
 			rrn->jr_mode = refrec->jr_mode;
 			return;
 		}
 		/*
 		 * Adding a remove.
 		 *
 		 * Replace the record in place with the old nlink in case
 		 * we replace the head of the list.  Abandon srec as a dup.
 		 */
 		refrec->jr_nlink = rrn->jr_nlink;
 		srn->sr_rec = srec->sr_rec;
 		return;
 	}
 	/* No collision: this is the first record for the slot. */
 	TAILQ_INSERT_TAIL(&sino->si_recs, srec, sr_next);
 }
 
 /*
  * Clone a reference record as an add at a different directory offset and
  * feed the clone to ino_add_ref().  The original record is not modified.
  */
 static void
 ino_dup_ref(struct suj_ino *sino, struct jrefrec *refrec, off_t diroff)
 {
 	struct jrefrec *copy;
 	struct suj_rec *wrapper;
 
 	/* Duplicate the journal record, then retarget the copy. */
 	copy = errmalloc(sizeof(*copy));
 	*copy = *refrec;
 	copy->jr_diroff = diroff;
 	copy->jr_op = JOP_ADDREF;
 
 	wrapper = errmalloc(sizeof(*wrapper));
 	wrapper->sr_rec = (union jrec *)copy;
 	ino_add_ref(sino, wrapper);
 }
 
 /*
  * Add a reference to the list at all known locations.  We follow the offset
  * changes for a single instance and create duplicate add refs at each so
  * that we can tolerate any version of the directory block.  Eliminate
  * removes which collide with adds that are seen in the journal.  They should
  * not adjust the link count down.
  *
  * srec has already been unlinked from si_newrecs by the caller
  * (ino_build()); it ends up on si_recs via ino_add_ref() unless that
  * function treats it as a duplicate.
  */
 static void
 ino_build_ref(struct suj_ino *sino, struct suj_rec *srec)
 {
 	struct jrefrec *refrec;
 	struct jmvrec *mvrec;
 	struct suj_rec *srp;
 	struct suj_rec *srn;
 	struct jrefrec *rrn;
 	off_t diroff;
 
 	refrec = (struct jrefrec *)srec->sr_rec;
 	/*
 	 * Search for a mvrec that matches this offset.  Whether it's an add
 	 * or a remove we can delete the mvref after creating a dup record in
 	 * the old location.
 	 */
 	if (!TAILQ_EMPTY(&sino->si_movs)) {
 		diroff = refrec->jr_diroff;
 		/*
 		 * Walk newest to oldest; diroff is updated as each matching
 		 * move is undone so a chain of moves is followed backwards.
 		 */
 		for (srn = TAILQ_LAST(&sino->si_movs, srechd); srn; srn = srp) {
 			/* Fetch the predecessor first; srn may be freed. */
 			srp = TAILQ_PREV(srn, srechd, sr_next);
 			mvrec = (struct jmvrec *)srn->sr_rec;
 			if (mvrec->jm_parent != refrec->jr_parent ||
 			    mvrec->jm_newoff != diroff)
 				continue;
 			diroff = mvrec->jm_oldoff;
 			TAILQ_REMOVE(&sino->si_movs, srn, sr_next);
 			free(srn);
 			ino_dup_ref(sino, refrec, diroff);
 		}
 	}
 	/*
 	 * If a remove wasn't eliminated by an earlier add just append it to
 	 * the list.
 	 */
 	if (refrec->jr_op == JOP_REMREF) {
 		ino_add_ref(sino, srec);
 		return;
 	}
 	/*
 	 * Walk the list of records waiting to be added to the list.  We
 	 * must check for moves that apply to our current offset and remove
 	 * them from the list.  Remove any duplicates to eliminate removes
 	 * with corresponding adds.
 	 *
 	 * Records unlinked from si_newrecs in this loop are not freed here.
 	 */
 	TAILQ_FOREACH_SAFE(srn, &sino->si_newrecs, sr_next, srp) {
 		switch (srn->sr_rec->rec_jrefrec.jr_op) {
 		case JOP_ADDREF:
 			/*
 			 * This should actually be an error we should
 			 * have a remove for every add journaled.
 			 */
 			rrn = (struct jrefrec *)srn->sr_rec;
 			if (rrn->jr_parent != refrec->jr_parent ||
 			    rrn->jr_diroff != refrec->jr_diroff)
 				break;
 			TAILQ_REMOVE(&sino->si_newrecs, srn, sr_next);
 			break;
 		case JOP_REMREF:
 			/*
 			 * Once we remove the current iteration of the
 			 * record at this address we're done.
 			 */
 			rrn = (struct jrefrec *)srn->sr_rec;
 			if (rrn->jr_parent != refrec->jr_parent ||
 			    rrn->jr_diroff != refrec->jr_diroff)
 				break;
 			TAILQ_REMOVE(&sino->si_newrecs, srn, sr_next);
 			ino_add_ref(sino, srec);
 			return;
 		case JOP_MVREF:
 			/*
 			 * Update our diroff based on any moves that match
 			 * and remove the move.
 			 */
 			mvrec = (struct jmvrec *)srn->sr_rec;
 			if (mvrec->jm_parent != refrec->jr_parent ||
 			    mvrec->jm_oldoff != refrec->jr_diroff)
 				break;
 			/* Leave an add at the old slot, then follow the move. */
 			ino_dup_ref(sino, refrec, mvrec->jm_oldoff);
 			refrec->jr_diroff = mvrec->jm_newoff;
 			TAILQ_REMOVE(&sino->si_newrecs, srn, sr_next);
 			break;
 		default:
 			err_suj("ino_build_ref: Unknown op %d\n",
 			    srn->sr_rec->rec_jrefrec.jr_op);
 		}
 	}
 	ino_add_ref(sino, srec);
 }
 
 /*
  * Drain the inode's queue of new records in arrival order.  Add and
  * remove records are resolved through ino_build_ref(); move records are
  * parked on si_movs for later references to consume.  If nothing ended
  * up on si_recs the inode is marked as having no records.
  */
 static void
 ino_build(struct suj_ino *sino)
 {
 	struct suj_rec *cur;
 
 	for (;;) {
 		cur = TAILQ_FIRST(&sino->si_newrecs);
 		if (cur == NULL)
 			break;
 		TAILQ_REMOVE(&sino->si_newrecs, cur, sr_next);
 		if (cur->sr_rec->rec_jrefrec.jr_op == JOP_ADDREF ||
 		    cur->sr_rec->rec_jrefrec.jr_op == JOP_REMREF) {
 			ino_build_ref(sino, cur);
 		} else if (cur->sr_rec->rec_jrefrec.jr_op == JOP_MVREF) {
 			/*
 			 * Add this mvrec to the queue of pending mvs.
 			 */
 			TAILQ_INSERT_TAIL(&sino->si_movs, cur, sr_next);
 		} else {
 			err_suj("ino_build: Unknown op %d\n",
 			    cur->sr_rec->rec_jrefrec.jr_op);
 		}
 	}
 	if (TAILQ_EMPTY(&sino->si_recs))
 		sino->si_hasrecs = 0;
 }
 
 /*
  * Modify journal records so they refer to the base block number
  * and a start and end frag range.  This is to facilitate the discovery
  * of overlapping fragment allocations.
  *
  * The record is rewritten in place (jb_blkno, jb_oldfrags) and then linked
  * onto the suj_blk for its base block, unless it is a free that duplicates
  * a record already present.
  */
 static void
 blk_build(struct jblkrec *blkrec)
 {
 	struct suj_rec *srec;
 	struct suj_blk *sblk;
 	struct jblkrec *blkrn;
 	ufs2_daddr_t blk;
 	int frag;
 
 	if (debug)
 		printf("blk_build: op %d blkno %jd frags %d oldfrags %d "
 		    "ino %ju lbn %jd\n",
 		    blkrec->jb_op, (uintmax_t)blkrec->jb_blkno,
 		    blkrec->jb_frags, blkrec->jb_oldfrags,
 		    (uintmax_t)blkrec->jb_ino, (uintmax_t)blkrec->jb_lbn);
 
 	/* Split the address into its block base and fragment offset. */
 	blk = blknum(fs, blkrec->jb_blkno);
 	frag = fragnum(fs, blkrec->jb_blkno);
 	sblk = blk_lookup(blk, 1);
 	/*
 	 * Rewrite the record using oldfrags to indicate the offset into
 	 * the block.  Leave jb_frags as the actual allocated count.
 	 */
 	blkrec->jb_blkno -= frag;
 	blkrec->jb_oldfrags = frag;
 	/* The fragment run must not spill past the end of the block. */
 	if (blkrec->jb_oldfrags + blkrec->jb_frags > fs->fs_frag)
 		err_suj("Invalid fragment count %d oldfrags %d\n",
 		    blkrec->jb_frags, frag);
 	/*
 	 * Detect dups.  If we detect a dup we always discard the oldest
 	 * record as it is superseded by the new record.  This speeds up
 	 * later stages but also eliminates free records which are used
 	 * to indicate that the contents of indirects can be trusted.
 	 */
 	TAILQ_FOREACH(srec, &sblk->sb_recs, sr_next) {
 		blkrn = (struct jblkrec *)srec->sr_rec;
 		/* A dup matches on every field except the operation. */
 		if (blkrn->jb_ino != blkrec->jb_ino ||
 		    blkrn->jb_lbn != blkrec->jb_lbn ||
 		    blkrn->jb_blkno != blkrec->jb_blkno ||
 		    blkrn->jb_frags != blkrec->jb_frags ||
 		    blkrn->jb_oldfrags != blkrec->jb_oldfrags)
 			continue;
 		if (debug)
 			printf("Removed dup.\n");
 		/* Discard the free which is a dup with an alloc. */
 		if (blkrec->jb_op == JOP_FREEBLK)
 			return;
 		/* Leaving the loop right after the removal keeps it safe. */
 		TAILQ_REMOVE(&sblk->sb_recs, srec, sr_next);
 		free(srec);
 		break;
 	}
 	srec = errmalloc(sizeof(*srec));
 	srec->sr_rec = (union jrec *)blkrec;
 	TAILQ_INSERT_TAIL(&sblk->sb_recs, srec, sr_next);
 }
 
 /*
  * Record a truncation request for an inode.  A JOP_SYNC record cancels
  * any pending truncation; otherwise the request with the smallest size
  * seen so far is the one that is kept in si_trunc.
  */
 static void
 ino_build_trunc(struct jtrncrec *rec)
 {
 	struct suj_ino *sino;
 
 	if (debug)
 		printf("ino_build_trunc: op %d ino %ju, size %jd\n",
 		    rec->jt_op, (uintmax_t)rec->jt_ino,
 		    (uintmax_t)rec->jt_size);
 	sino = ino_lookup(rec->jt_ino, 1);
 	if (rec->jt_op == JOP_SYNC)
 		sino->si_trunc = NULL;
 	else if (sino->si_trunc == NULL)
 		sino->si_trunc = rec;
 	else if (rec->jt_size < sino->si_trunc->jt_size)
 		sino->si_trunc = rec;
 }
 
 /*
  * Build up tables of the operations we need to recover.
  *
  * Every record of every segment on allsegs is dispatched by its operation
  * code to the inode-reference, block or truncation table builder.  An
  * unknown operation is reported through err_suj().
  */
 static void
 suj_build(void)
 {
 	struct suj_seg *seg;
 	union jrec *rec;
 	int off;
 	int i;
 
 	TAILQ_FOREACH(seg, &allsegs, ss_next) {
 		if (debug)
 			printf("seg %jd has %d records, oldseq %jd.\n",
 			    seg->ss_rec.jsr_seq, seg->ss_rec.jsr_cnt,
 			    seg->ss_rec.jsr_oldest);
 		off = 0;
 		rec = (union jrec *)seg->ss_blk;
 		/*
 		 * i counts real records only and is advanced at the bottom
 		 * of the body; off and rec step over every JREC_SIZE slot,
 		 * including the skipped header slots.
 		 */
 		for (i = 0; i < seg->ss_rec.jsr_cnt; off += JREC_SIZE, rec++) {
 			/* skip the segrec. */
 			if ((off % real_dev_bsize) == 0)
 				continue;
 			switch (rec->rec_jrefrec.jr_op) {
 			case JOP_ADDREF:
 			case JOP_REMREF:
 			case JOP_MVREF:
 				ino_append(rec);
 				break;
 			case JOP_NEWBLK:
 			case JOP_FREEBLK:
 				blk_build((struct jblkrec *)rec);
 				break;
 			case JOP_TRUNC:
 			case JOP_SYNC:
 				ino_build_trunc((struct jtrncrec *)rec);
 				break;
 			default:
 				err_suj("Unknown journal operation %d (%d)\n",
 				    rec->rec_jrefrec.jr_op, off);
 			}
 			i++;
 		}
 	}
 }
 
 /*
  * Prune the journal segments to those we care about based on the
  * oldest sequence in the newest segment.  Order the segment list
  * based on sequence number.
  *
  * On return allsegs holds a run of segments with consecutive sequence
  * numbers starting at oldseq, and jrecs/jbytes have been increased by the
  * record and byte counts of the segments that were kept.
  */
 static void
 suj_prune(void)
 {
 	struct suj_seg *seg;
 	struct suj_seg *segn;
 	uint64_t newseq;
 	int discard;
 
 	if (debug)
 		printf("Pruning up to %jd\n", oldseq);
 	/* First free the expired segments. */
 	TAILQ_FOREACH_SAFE(seg, &allsegs, ss_next, segn) {
 		if (seg->ss_rec.jsr_seq >= oldseq)
 			continue;
 		TAILQ_REMOVE(&allsegs, seg, ss_next);
 		free(seg->ss_blk);
 		free(seg);
 	}
 	/* Next ensure that segments are ordered properly. */
 	seg = TAILQ_FIRST(&allsegs);
 	if (seg == NULL) {
 		if (debug)
 			printf("Empty journal\n");
 		return;
 	}
 	newseq = seg->ss_rec.jsr_seq;
 	/*
 	 * Rotate the list: while the tail segment has a lower sequence
 	 * number than the current head, move it to the front.
 	 */
 	for (;;) {
 		seg = TAILQ_LAST(&allsegs, seghd);
 		if (seg->ss_rec.jsr_seq >= newseq)
 			break;
 		TAILQ_REMOVE(&allsegs, seg, ss_next);
 		TAILQ_INSERT_HEAD(&allsegs, seg, ss_next);
 		newseq = seg->ss_rec.jsr_seq;
 
 	}
 	/* After rotation the head must be exactly the oldest sequence. */
 	if (newseq != oldseq) {
 		TAILQ_FOREACH(seg, &allsegs, ss_next) {
 			printf("%jd, ", seg->ss_rec.jsr_seq);
 		}
 		printf("\n");
 		err_suj("Journal file sequence mismatch %jd != %jd\n",
 		    newseq, oldseq);
 	}
 	/*
 	 * The kernel may asynchronously write segments which can create
 	 * gaps in the sequence space.  Throw away any segments after the
 	 * gap as the kernel guarantees only those that are contiguously
 	 * reachable are marked as completed.
 	 */
 	discard = 0;
 	TAILQ_FOREACH_SAFE(seg, &allsegs, ss_next, segn) {
 		/* newseq is the next expected number; bumped on each test. */
 		if (!discard && newseq++ == seg->ss_rec.jsr_seq) {
 			jrecs += seg->ss_rec.jsr_cnt;
 			jbytes += seg->ss_rec.jsr_blocks * real_dev_bsize;
 			continue;
 		}
 		/* Once a gap is seen every remaining segment is dropped. */
 		discard = 1;
 		if (debug)
 			printf("Journal order mismatch %jd != %jd pruning\n",
 			    newseq-1, seg->ss_rec.jsr_seq);
 		TAILQ_REMOVE(&allsegs, seg, ss_next);
 		free(seg->ss_blk);
 		free(seg);
 	}
 	if (debug)
 		printf("Processing journal segments from %jd to %jd\n",
 		    oldseq, newseq-1);
 }
 
 /*
  * Sanity check the journal inode before any records are read from it.
  * The checks run in order (link count, flags, mode, size, timestamp);
  * the first one that fails prints a message.  Returns 0 when every check
  * passes and -1 otherwise.
  */
 static int
 suj_verifyino(union dinode *dp)
 {
 	int status;
 
 	status = -1;
 	if (DIP(dp, di_nlink) != 1)
 		printf("Invalid link count %d for journal inode %ju\n",
 		    DIP(dp, di_nlink), (uintmax_t)sujino);
 	else if ((DIP(dp, di_flags) & (SF_IMMUTABLE | SF_NOUNLINK)) !=
 	    (SF_IMMUTABLE | SF_NOUNLINK))
 		printf("Invalid flags 0x%X for journal inode %ju\n",
 		    DIP(dp, di_flags), (uintmax_t)sujino);
 	else if (DIP(dp, di_mode) != (IFREG | IREAD))
 		printf("Invalid mode %o for journal inode %ju\n",
 		    DIP(dp, di_mode), (uintmax_t)sujino);
 	else if (DIP(dp, di_size) < SUJ_MIN)
 		printf("Invalid size %jd for journal inode %ju\n",
 		    DIP(dp, di_size), (uintmax_t)sujino);
 	else if (DIP(dp, di_modrev) != fs->fs_mtime)
 		printf("Journal timestamp does not match fs mount time\n");
 	else
 		status = 0;
 
 	return (status);
 }
 
 /*
  * Map of the disk extents that make up the journal file.  jblocks_add()
  * appends to jb_extent[] and jblocks_next()/jblocks_advance() consume it
  * through the jb_head/jb_off cursor.
  */
 struct jblocks {
 	struct jextent *jb_extent;	/* Extent array. */
 	int		jb_avail;	/* Available extents. */
 	int		jb_used;	/* Last used extent. */
 	int		jb_head;	/* Allocator head. */
 	int		jb_off;		/* Allocator extent offset. */
 };
 /* One contiguous run of journal blocks on disk. */
 struct jextent {
 	ufs2_daddr_t	je_daddr;	/* Disk block address. */
 	int		je_blocks;	/* Disk block count. */
 };
 
 /* Extent map of the journal being read; reset to NULL by initsuj(). */
 static struct jblocks *suj_jblocks;
 
 /*
  * Allocate an empty extent map with room for ten extents, all zeroed,
  * and the read cursor positioned at the start.
  */
 static struct jblocks *
 jblocks_create(void)
 {
 	struct jblocks *map;
 	int nbytes;
 
 	map = errmalloc(sizeof(*map));
 	map->jb_head = 0;
 	map->jb_off = 0;
 	map->jb_used = 0;
 	map->jb_avail = 10;
 
 	nbytes = sizeof(struct jextent) * map->jb_avail;
 	map->jb_extent = errmalloc(nbytes);
 	bzero(map->jb_extent, nbytes);
 
 	return (map);
 }
 
 /*
  * Return the disk address at the current read position of the extent map
  * and store in *actual how many bytes, at most "bytes", can be read
  * contiguously from there.  Returns 0 once every extent has been consumed;
  * *actual is not written in that case.
  */
 static ufs2_daddr_t
 jblocks_next(struct jblocks *jblocks, int bytes, int *actual)
 {
 	struct jextent *ext;
 	int wanted;
 	int avail;
 
 	wanted = btodb(bytes);
 	ext = &jblocks->jb_extent[jblocks->jb_head];
 	avail = ext->je_blocks - jblocks->jb_off;
 	if (avail == 0) {
 		/* Current extent is used up; step to the following one. */
 		jblocks->jb_off = 0;
 		jblocks->jb_head++;
 		if (jblocks->jb_head > jblocks->jb_used)
 			return (0);
 		ext = &jblocks->jb_extent[jblocks->jb_head];
 		avail = ext->je_blocks;
 	}
 	if (wanted < avail)
 		avail = wanted;
 	*actual = dbtob(avail);
 
 	return (ext->je_daddr + jblocks->jb_off);
 }
 
 /*
  * Move the read position within the current extent forward by the given
  * number of bytes, converted to disk blocks.
  */
 static void
 jblocks_advance(struct jblocks *jblocks, int bytes)
 {
 
 	jblocks->jb_off = jblocks->jb_off + btodb(bytes);
 }
 
 /*
  * Release an extent map: first its extent array, then the map itself.
  */
 static void
 jblocks_destroy(struct jblocks *jblocks)
 {
 	struct jextent *extents;
 
 	extents = jblocks->jb_extent;
 	free(extents);
 	free(jblocks);
 }
 
 /*
  * Record "blocks" disk blocks starting at daddr in the extent map.  The
  * run is merged into the last extent when it directly follows it;
  * otherwise a new extent is started, doubling the array when it is full.
  */
 static void
 jblocks_add(struct jblocks *jblocks, ufs2_daddr_t daddr, int blocks)
 {
 	struct jextent *last;
 	struct jextent *grown;
 	int nbytes;
 
 	last = &jblocks->jb_extent[jblocks->jb_used];
 	if (last->je_daddr == 0) {
 		/* Adding the first block. */
 		last->je_daddr = daddr;
 		last->je_blocks = blocks;
 		return;
 	}
 	if (daddr == last->je_daddr + last->je_blocks) {
 		/* Extending the last extent. */
 		last->je_blocks += blocks;
 		return;
 	}
 	/* Adding a new extent. */
 	jblocks->jb_used++;
 	if (jblocks->jb_used == jblocks->jb_avail) {
 		jblocks->jb_avail *= 2;
 		nbytes = sizeof(struct jextent) * jblocks->jb_avail;
 		grown = errmalloc(nbytes);
 		bzero(grown, nbytes);
 		bcopy(jblocks->jb_extent, grown,
 		    sizeof(struct jextent) * jblocks->jb_used);
 		free(jblocks->jb_extent);
 		jblocks->jb_extent = grown;
 	}
 	last = &jblocks->jb_extent[jblocks->jb_used];
 	last->je_daddr = daddr;
 	last->je_blocks = blocks;
 }
 
 /*
  * Add a file block from the journal to the extent map.  We can't read
  * each file block individually because the kernel treats it as a circular
  * buffer and segments may span multiple contiguous blocks.
  */
 static void
 suj_add_block(ino_t ino, ufs_lbn_t lbn, ufs2_daddr_t blk, int frags)
 {
 	ufs2_daddr_t daddr;
 	int nblocks;
 
 	/* ino and lbn are part of the visitor signature but unused here. */
 	daddr = fsbtodb(fs, blk);
 	nblocks = fsbtodb(fs, frags);
 	jblocks_add(suj_jblocks, daddr, nblocks);
 }
 
 /*
  * Scan the journal extents recorded in suj_jblocks and append every
  * complete segment found to allsegs.  oldseq is raised to the largest
  * jsr_oldest value seen.  A short or failed read is reported through
  * err_suj().
  */
 static void
 suj_read(void)
 {
 	uint8_t block[1 * 1024 * 1024];
 	struct suj_seg *seg;
 	struct jsegrec *recn;
 	struct jsegrec *rec;
 	ufs2_daddr_t blk;
 	int readsize;
 	int blocks;
 	int recsize;
 	int size;
 	int i;
 
 	/*
 	 * Read records until we exhaust the journal space.  If we find
 	 * an invalid record we start searching for a valid segment header
 	 * at the next block.  This is because we don't have a head/tail
 	 * pointer and must recover the information indirectly.  At the gap
 	 * between the head and tail we won't necessarily have a valid
 	 * segment.
 	 */
 restart:
 	for (;;) {
 		size = sizeof(block);
 		blk = jblocks_next(suj_jblocks, size, &readsize);
 		if (blk == 0)
 			return;
 		size = readsize;
 		/*
 		 * Read 1MB at a time and scan for records within this block.
 		 */
 		if (pread(fsreadfd, &block, size, dbtob(blk)) != size) {
 			err_suj("Error reading journal block %jd\n",
 			    (intmax_t)blk);
 		}
 		for (rec = (void *)block; size; size -= recsize,
 		    rec = (struct jsegrec *)((uintptr_t)rec + recsize)) {
 			/* Default step: one device block. */
 			recsize = real_dev_bsize;
 			/* Not a header written during the current mount. */
 			if (rec->jsr_time != fs->fs_mtime) {
 #ifdef notdef
 				if (debug)
 					printf("Rec time %jd != fs mtime %jd\n",
 					    rec->jsr_time, fs->fs_mtime);
 #endif
 				jblocks_advance(suj_jblocks, recsize);
 				continue;
 			}
 			if (rec->jsr_cnt == 0) {
 				if (debug)
 					printf("Found illegal count %d\n",
 					    rec->jsr_cnt);
 				jblocks_advance(suj_jblocks, recsize);
 				continue;
 			}
 			blocks = rec->jsr_blocks;
 			recsize = blocks * real_dev_bsize;
 			if (recsize > size) {
 				/*
 				 * We may just have run out of buffer, restart
 				 * the loop to re-read from this spot.
 				 */
 				if (size < fs->fs_bsize &&
 				    size != readsize &&
 				    recsize <= fs->fs_bsize)
 					goto restart;
 				if (debug)
 					printf("Found invalid segsize %d > %d\n",
 					    recsize, size);
 				recsize = real_dev_bsize;
 				jblocks_advance(suj_jblocks, recsize);
 				continue;
 			}
 			/*
 			 * Verify that all blocks in the segment are present.
 			 * The address is computed on uintptr_t, as in the
 			 * loop header, rather than by arithmetic on a
 			 * void pointer, which standard C does not define.
 			 */
 			for (i = 1; i < blocks; i++) {
 				recn = (struct jsegrec *)((uintptr_t)rec +
 				    i * real_dev_bsize);
 				if (recn->jsr_seq == rec->jsr_seq &&
 				    recn->jsr_time == rec->jsr_time)
 					continue;
 				if (debug)
 					printf("Incomplete record %jd (%d)\n",
 					    rec->jsr_seq, i);
 				/* Skip only the blocks that did match. */
 				recsize = i * real_dev_bsize;
 				jblocks_advance(suj_jblocks, recsize);
 				goto restart;
 			}
 			/* Keep a private copy of the whole segment. */
 			seg = errmalloc(sizeof(*seg));
 			seg->ss_blk = errmalloc(recsize);
 			seg->ss_rec = *rec;
 			bcopy((void *)rec, seg->ss_blk, recsize);
 			if (rec->jsr_oldest > oldseq)
 				oldseq = rec->jsr_oldest;
 			TAILQ_INSERT_TAIL(&allsegs, seg, ss_next);
 			jblocks_advance(suj_jblocks, recsize);
 		}
 	}
 }
 
 /*
  * Orchestrate the verification of a filesystem via the softupdates journal.
  *
  * filesys is only used in the progress message.  Returns 0 when journal
  * recovery completed (or the operator declined to write the changes) and
  * -1 when the journal cannot be used and the caller should fall back to a
  * full check.  A return through jmpbuf lands in the fallback branch
  * below, which releases the segments read so far and the journal extent
  * map.
  */
 int
 suj_check(const char *filesys)
 {
 	struct inodesc idesc;
 	struct csum *cgsum;
 	union dinode *jip;
 	struct inode ip;
 	uint64_t blocks;
 	int i, retval;
 	struct suj_seg *seg;
 	struct suj_seg *segn;
 
 	initsuj();
 	fs = &sblock;
 	if (real_dev_bsize == 0 && ioctl(fsreadfd, DIOCGSECTORSIZE,
 	    &real_dev_bsize) == -1)
 		real_dev_bsize = secsize;
 	if (debug)
 		printf("dev_bsize %u\n", real_dev_bsize);
 
 	/*
 	 * Set an exit point when SUJ check failed
 	 */
 	retval = setjmp(jmpbuf);
 	if (retval != 0) {
 		pwarn("UNEXPECTED SU+J INCONSISTENCY\n");
 		TAILQ_FOREACH_SAFE(seg, &allsegs, ss_next, segn) {
 			TAILQ_REMOVE(&allsegs, seg, ss_next);
 			free(seg->ss_blk);
 			free(seg);
 		}
 		/* The failure may have struck while the map was live. */
 		if (suj_jblocks != NULL) {
 			jblocks_destroy(suj_jblocks);
 			suj_jblocks = NULL;
 		}
 		if (reply("FALLBACK TO FULL FSCK") == 0) {
 			ckfini(0);
 			exit(EEXIT);
 		} else
 			return (-1);
 	}
 
 	/*
 	 * Search the root directory for the SUJ_FILE.
 	 */
 	idesc.id_type = DATA;
 	idesc.id_fix = IGNORE;
 	idesc.id_number = UFS_ROOTINO;
 	idesc.id_func = findino;
 	idesc.id_name = SUJ_FILE;
 	ginode(UFS_ROOTINO, &ip);
 	if ((ckinode(ip.i_dp, &idesc) & FOUND) == FOUND) {
 		sujino = idesc.id_parent;
 		irelse(&ip);
 	} else {
 		printf("Journal inode removed.  Use tunefs to re-create.\n");
 		sblock.fs_flags &= ~FS_SUJ;
 		sblock.fs_sujfree = 0;
 		irelse(&ip);
 		return (-1);
 	}
 	/*
 	 * Fetch the journal inode and verify it.
 	 */
 	ginode(sujino, &ip);
 	jip = ip.i_dp;
 	printf("** SU+J Recovering %s\n", filesys);
 	if (suj_verifyino(jip) != 0 || (!preen && !reply("USE JOURNAL"))) {
 		irelse(&ip);
 		return (-1);
 	}
 	/*
 	 * Build a list of journal blocks in jblocks before parsing the
 	 * available journal blocks in with suj_read().
 	 */
 	printf("** Reading %jd byte journal from inode %ju.\n",
 	    DIP(jip, di_size), (uintmax_t)sujino);
 	suj_jblocks = jblocks_create();
 	blocks = ino_visit(jip, sujino, suj_add_block, 0);
 	if (blocks != numfrags(fs, DIP(jip, di_size))) {
 		printf("Sparse journal inode %ju.\n", (uintmax_t)sujino);
 		/* Do not leak the extent map on this early exit. */
 		jblocks_destroy(suj_jblocks);
 		suj_jblocks = NULL;
 		irelse(&ip);
 		return (-1);
 	}
 	irelse(&ip);
 	suj_read();
 	jblocks_destroy(suj_jblocks);
 	suj_jblocks = NULL;
 	if (preen || reply("RECOVER")) {
 		printf("** Building recovery table.\n");
 		suj_prune();
 		suj_build();
 		cg_apply(cg_build);
 		printf("** Resolving unreferenced inode list.\n");
 		ino_unlinked();
 		printf("** Processing journal entries.\n");
 		cg_apply(cg_trunc);
 		cg_apply(cg_check_blk);
 		cg_apply(cg_adj_blk);
 		cg_apply(cg_check_ino);
 	}
 	if (preen == 0 && (jrecs > 0 || jbytes > 0) && reply("WRITE CHANGES") == 0)
 		return (0);
 	/*
 	 * Check block counts of snapshot inodes and
 	 * make copies of any needed snapshot blocks.
 	 */
 	for (i = 0; i < snapcnt; i++)
 		check_blkcnt(&snaplist[i]);
 	snapflush(suj_checkblkavail);
 	/*
 	 * Recompute the fs summary info from correct cs summaries.
 	 */
 	bzero(&fs->fs_cstotal, sizeof(struct csum_total));
 	for (i = 0; i < fs->fs_ncg; i++) {
 		cgsum = &fs->fs_cs(fs, i);
 		fs->fs_cstotal.cs_nffree += cgsum->cs_nffree;
 		fs->fs_cstotal.cs_nbfree += cgsum->cs_nbfree;
 		fs->fs_cstotal.cs_nifree += cgsum->cs_nifree;
 		fs->fs_cstotal.cs_ndir += cgsum->cs_ndir;
 	}
 	/* Mark the filesystem clean and stamp it with the current time. */
 	fs->fs_pendinginodes = 0;
 	fs->fs_pendingblocks = 0;
 	fs->fs_clean = 1;
 	fs->fs_time = time(NULL);
 	fs->fs_mtime = time(NULL);
 	sbdirty();
 	ckfini(1);
 	if (jrecs > 0 || jbytes > 0) {
 		printf("** %jd journal records in %jd bytes for %.2f%% utilization\n",
 		    jrecs, jbytes, ((float)jrecs / (float)(jbytes / JREC_SIZE)) * 100);
 		printf("** Freed %jd inodes (%jd dirs) %jd blocks, and %jd frags.\n",
 		    freeinos, freedir, freeblocks, freefrags);
 	}
 
 	return (0);
 }
 
 /*
  * Reset every piece of file-scope journal recovery state: the cylinder
  * group hash, the segment list, the cached pointers and the statistics
  * counters.
  */
 static void
 initsuj(void)
 {
 	int bucket;
 
 	/* Lookup structures. */
 	bucket = 0;
 	while (bucket < HASHSIZE) {
 		LIST_INIT(&cghash[bucket]);
 		bucket++;
 	}
 	TAILQ_INIT(&allsegs);
 	lastcg = NULL;
 	suj_jblocks = NULL;
 	fs = NULL;
 
 	/* Journal position and identity. */
 	oldseq = 0;
 	sujino = 0;
 
 	/* Statistics. */
 	jrecs = 0;
 	jbytes = 0;
 	freedir = 0;
 	freeinos = 0;
 	freeblocks = 0;
 	freefrags = 0;
 }
diff --git a/tools/diag/prtblknos/main.c b/tools/diag/prtblknos/main.c
index 25a717760922..1535755ea52e 100644
--- a/tools/diag/prtblknos/main.c
+++ b/tools/diag/prtblknos/main.c
@@ -1,109 +1,107 @@
 /*
  * Copyright (c) 1998, 2003, 2013, 2018 Marshall Kirk McKusick.
  * All Rights Reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY MARSHALL KIRK MCKUSICK ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL MARSHALL KIRK MCKUSICK BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * $FreeBSD$
  */
 
 #include <ufs/ffs/fs.h>
 
 #include <err.h>
 #include <stdlib.h>
 #include <stdio.h>
 #include <sys/stat.h>
 #include <libufs.h>
 
 /*
  * Local declaration of the inode union named in the prtblknos() prototype.
  * In this file it is only used as the target type of a pointer cast.
  * NOTE(review): prtblknos.c declares union dinode with embedded
  * ufs1_dinode/ufs2_dinode structures rather than pointers -- confirm
  * that the two declarations are meant to differ.
  */
 union dinode {
 	struct ufs1_dinode *dp1;
 	struct ufs2_dinode *dp2;
 };
 
 /* Block-number printer; defined in prtblknos.c. */
 void prtblknos(struct fs *fs, union dinode *dp);
 
 /* Disk handle filled in by ufs_disk_fillout() in main(). */
 struct uufsd disk;
 
 /*
  * Print the block numbers used by one or more inodes.
  *
  * Usage:
  *	prtblknos filename
  *	prtblknos filesystem inode ...
  *
  * In the single-argument form the file is looked up with lstat(2) and
  * statfs(2) and the argument vector is rewritten into the second form
  * using the mounted-from name and the file's inode number.
  *
  * An argument that is not a valid inode number, or an inode that cannot
  * be read, is reported on stderr and skipped; the remaining arguments
  * are still processed.  Exits 1 on usage or superblock errors, else 0.
  */
 int
-main(argc, argv)
-	int argc;
-	char *argv[];
+main(int argc, char *argv[])
 {
 	union dinodep dp;
 	struct fs *fs;
 	struct stat sb;
 	struct statfs sfb;
 	char *xargv[4];
 	char ibuf[64];
 	char *fsname, *filename;
 	ino_t inonum;
 	int error;
 
 	filename = NULL;
 	if (argc == 2) {
 		filename = argv[1];
 		if (lstat(filename, &sb) != 0)
 			err(1, "stat(%s)", filename);
 		if (statfs(filename, &sfb) != 0)
 			err(1, "statfs(%s)", filename);
 		/* Rewrite the arguments as "prtblknos filesystem inode". */
 		xargv[0] = argv[0];
 		xargv[1] = sfb.f_mntfromname;
 		snprintf(ibuf, sizeof(ibuf), "%jd", (intmax_t)sb.st_ino);
 		xargv[2] = ibuf;
 		xargv[3] = NULL;
 		argv = xargv;
 		argc = 3;
 	}
 	if (argc < 3) {
 		(void)fprintf(stderr, "%s\n%s\n",
 		    "usage: prtblknos filename",
 		    "       prtblknos filesystem inode ...");
 		exit(1);
 	}
 
 	fsname = *++argv;
 
 	/* get the superblock. */
 	if ((error = ufs_disk_fillout(&disk, fsname)) < 0)
 		err(1, "Cannot access file system superblock on %s", fsname);
 	fs = (struct fs *)&disk.d_sb;
 
 	/* remaining arguments are inode numbers. */
 	while (*++argv) {
 		/*
 		 * get the inode number.  An out-of-range number must not
 		 * be handed to getinode(), so skip it after complaining.
 		 */
 		if ((inonum = atoi(*argv)) <= 0 ||
 		     inonum >= (ino_t)fs->fs_ipg * fs->fs_ncg) {
 			warnx("%s is not a valid inode number", *argv);
 			continue;
 		}
 
 		/*
 		 * Read the inode before printing its header: on failure dp
 		 * holds nothing usable, and stdout is not left with an
 		 * unterminated "inode #N: " prefix.
 		 */
 		if ((error = getinode(&disk, &dp, inonum)) < 0) {
 			warn("Read of inode %jd on %s failed: %s",
 			    (intmax_t)inonum, fsname, disk.d_error);
 			continue;
 		}
 
 		if (filename == NULL)
 			(void)printf("inode #%jd: ", (intmax_t)inonum);
 		else
 			(void)printf("%s (inode #%jd): ", filename,
 			    (intmax_t)inonum);
 
 		prtblknos(fs, (union dinode *)dp.dp1);
 	}
 	exit(0);
 }
diff --git a/tools/diag/prtblknos/prtblknos.c b/tools/diag/prtblknos/prtblknos.c
index ae53471156a6..d6135f70eb46 100644
--- a/tools/diag/prtblknos/prtblknos.c
+++ b/tools/diag/prtblknos/prtblknos.c
@@ -1,322 +1,308 @@
 /*
  * Copyright (c) 1998, 2003, 2013, 2018 Marshall Kirk McKusick.
  * All Rights Reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY MARSHALL KIRK MCKUSICK ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL MARSHALL KIRK MCKUSICK BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  *
  * $FreeBSD$
  */
 
 #include <sys/param.h>
 #include <ufs/ffs/fs.h>
 
 #include <err.h>
 #include <stdio.h>
 #include <string.h>
 #include <libufs.h>
 
 /*
  * This file is built two ways.  With PRTBLKNOS defined it declares its
  * own union dinode and reads blocks through the external handle "disk".
  * Otherwise it is built for fsdb: declarations come from <fsck.h> and
  * indirect blocks are fetched with getdatablk() into bp.
  */
 #ifdef PRTBLKNOS
 union dinode {
 	struct ufs1_dinode dp1;
 	struct ufs2_dinode dp2;
 };
 extern struct uufsd disk;
 #else /* used by fsdb */
 #include <fsck.h>
 /* Buffer most recently returned by getdatablk() in indirprt(). */
 static struct bufarea *bp;
 #endif
 
 /* Entry point: describe an inode and list the blocks it references. */
 void prtblknos(struct fs *fs, union dinode *dp);
 
 /* File-local helpers, defined below. */
 static const char *distance(struct fs *, ufs2_daddr_t, ufs2_daddr_t);
 static void  printblk(struct fs *, ufs_lbn_t, ufs2_daddr_t, int, ufs_lbn_t);
 static void  indirprt(struct fs *, int, ufs_lbn_t, ufs_lbn_t, ufs2_daddr_t,
 		ufs_lbn_t);
 
 /*
  * Describe the inode *dp and list the disk blocks it references.
  *
  * fs->fs_magic selects whether the UFS1 (dp1) or UFS2 (dp2) member of
  * the union is read.  Inode types other than symbolic link, regular
  * file and directory, as well as zero-length inodes and symbolic links
  * shorter than fs_maxsymlinklen, produce a single descriptive line and
  * nothing else.  Otherwise every direct block and then every indirect
  * tree is passed to printblk()/indirprt(), followed by a final
  * printblk() call that flushes the last pending extent.
  */
 void
-prtblknos(fs, dp)
-	struct fs *fs;
-	union dinode *dp;
+prtblknos(struct fs *fs, union dinode *dp)
 {
 	int i, mode, frags;
 	ufs_lbn_t lbn, lastlbn, len, blksperindir;
 	ufs2_daddr_t blkno;
 	off_t size;
 
 	/*
 	 * frags is handed to the final flush below even when the direct
 	 * block loop never runs (e.g. a negative size in a damaged inode),
 	 * so give it a defined value.
 	 */
 	frags = 0;
 	if (fs->fs_magic == FS_UFS1_MAGIC) {
 		size = dp->dp1.di_size;
 		mode = dp->dp1.di_mode;
 	} else {
 		size = dp->dp2.di_size;
 		mode = dp->dp2.di_mode;
 	}
 	switch (mode & IFMT) {
 	default:
 		/* The leading 0 announces octal, so print the type in octal. */
 		printf("unknown inode type 0%o\n",
 		    (unsigned int)(mode & IFMT));
 		return;
 	case 0:
 		printf("unallocated inode\n");
 		return;
 	case IFIFO:
 		printf("fifo\n");
 		return;
 	case IFCHR:
 		printf("character device\n");
 		return;
 	case IFBLK:
 		printf("block device\n");
 		return;
 	case IFSOCK:
 		printf("socket\n");
 		return;
 	case IFWHT:
 		printf("whiteout\n");
 		return;
 	case IFLNK:
 		if (size == 0) {
 			printf("empty symbolic link\n");
 			return;
 		}
 		/* Short links are printed from di_shortlink; no block list. */
 		if (size < fs->fs_maxsymlinklen) {
 			printf("symbolic link referencing %s\n",
 			    (fs->fs_magic == FS_UFS1_MAGIC) ?
 			    dp->dp1.di_shortlink :
 			    dp->dp2.di_shortlink);
 			return;
 		}
 		printf("symbolic link\n");
 		break;
 	case IFREG:
 		if (size == 0) {
 			printf("empty file\n");
 			return;
 		}
 		printf("regular file, size %jd\n", (intmax_t)size);
 		break;
 	case IFDIR:
 		if (size == 0) {
 			printf("empty directory\n");
 			return;
 		}
 		printf("directory, size %jd\n", (intmax_t)size);
 		break;
 	}
 	/* Number of logical blocks needed to hold size bytes. */
 	lastlbn = howmany(size, fs->fs_bsize);
 	len = lastlbn < UFS_NDADDR ? lastlbn : UFS_NDADDR;
 	for (i = 0; i < len; i++) {
 		/*
 		 * Every block before the last is a full block; the last
 		 * one is sized by the remaining bytes rounded up to whole
 		 * fragments.
 		 */
 		if (i < lastlbn - 1)
 			frags = fs->fs_frag;
 		else
 			frags = howmany(size - (lastlbn - 1) * fs->fs_bsize,
 					  fs->fs_fsize);
 		if (fs->fs_magic == FS_UFS1_MAGIC)
 			blkno = dp->dp1.di_db[i];
 		else
 			blkno = dp->dp2.di_db[i];
 		printblk(fs, i, blkno, frags, lastlbn);
 	}
 
 	/*
 	 * Walk the indirect trees.  blksperindir is the number of data
 	 * blocks covered by one entry at the current level; it grows by a
 	 * factor of NINDIR(fs) per level.
 	 */
 	blksperindir = 1;
 	len = lastlbn - UFS_NDADDR;
 	lbn = UFS_NDADDR;
 	for (i = 0; len > 0 && i < UFS_NIADDR; i++) {
 		if (fs->fs_magic == FS_UFS1_MAGIC)
 			blkno = dp->dp1.di_ib[i];
 		else
 			blkno = dp->dp2.di_ib[i];
 		indirprt(fs, i, blksperindir, lbn, blkno, lastlbn);
 		blksperindir *= NINDIR(fs);
 		lbn += blksperindir;
 		len -= blksperindir;
 	}
 
 	/* dummy print to flush out last extent */
 	printblk(fs, lastlbn, 0, frags, 0);
 }
 
 /*
  * Print the indirect block blkno and everything reachable through it.
  *
  * level is forwarded to printblk() negated, where it selects the name
  * of the indirect level; blksperindir is the number of data blocks
  * covered by each entry of this indirect block; lbn is the logical
  * block number of its first entry; lastlbn is passed through to
  * printblk() and bounds how many entries are examined.
  * A zero blkno, or an indirect block that cannot be read, is reported
  * as one hole spanning the whole range the block would have covered.
  */
 static void
-indirprt(fs, level, blksperindir, lbn, blkno, lastlbn)
-	struct fs *fs;
-	int level;
-	ufs_lbn_t blksperindir;
-	ufs_lbn_t lbn;
-	ufs2_daddr_t blkno;
-	ufs_lbn_t lastlbn;
+indirprt(struct fs *fs, int level, ufs_lbn_t blksperindir, ufs_lbn_t lbn,
+	ufs2_daddr_t blkno, ufs_lbn_t lastlbn)
 {
 	char indir[MAXBSIZE];
 	ufs_lbn_t idx, nentries, wanted;
 	ufs2_daddr_t child;
 	int readfailed;
 
 	/* An unallocated indirect block: the whole range is a hole. */
 	if (blkno == 0) {
 		printblk(fs, lbn, blkno,
 		    blksperindir * NINDIR(fs) * fs->fs_frag, lastlbn);
 		return;
 	}
 
 	/* Announce the indirect block itself. */
 	printblk(fs, lbn, blkno, fs->fs_frag, -level);
 
 	/* Fetch its contents into indir[]. */
 #ifdef PRTBLKNOS
 	readfailed =
 	    (bread(&disk, fsbtodb(fs, blkno), indir, fs->fs_bsize) == -1);
 #else /* used by fsdb */
 	bp = getdatablk(blkno, fs->fs_bsize, BT_LEVEL1 + level);
 	readfailed = (bp->b_errs != 0);
 	if (!readfailed)
 		memcpy(indir, bp->b_un.b_buf, fs->fs_bsize);
 #endif
 	if (readfailed) {
 		warn("Read of indirect block %jd failed", (intmax_t)blkno);
 		/* List the unreadable part as a hole */
 		printblk(fs, lbn, 0,
 		    blksperindir * NINDIR(fs) * fs->fs_frag, lastlbn);
 		return;
 	}
 
 	/* Examine only as many entries as are needed to reach lastlbn. */
 	wanted = howmany(lastlbn - lbn, blksperindir);
 	nentries = wanted < NINDIR(fs) ? wanted : NINDIR(fs);
 
 	for (idx = 0; idx < nentries; idx++) {
 		if (fs->fs_magic == FS_UFS1_MAGIC)
 			child = ((ufs1_daddr_t *)indir)[idx];
 		else
 			child = ((ufs2_daddr_t *)indir)[idx];
 		if (blksperindir == 1) {
 			/* Entries are data blocks. */
 			printblk(fs, lbn + idx, child, fs->fs_frag, lastlbn);
 		} else {
 			/* Entries are indirect blocks one level down. */
 			indirprt(fs, level - 1, blksperindir / NINDIR(fs),
 			    lbn + blksperindir * idx, child, lastlbn);
 		}
 	}
 }
 
 /*
  * Format the text appended to an extent line that says how far firstblk
  * lies from lastblk.
  *
  * Returns "" when lastblk is 0.  When both blocks are in the same
  * cylinder group the gap between them is given; otherwise the cylinder
  * group and group-relative block of each is given.  The result lives in
  * a static buffer that the next call overwrites.
  */
 static const char *
-distance(fs, lastblk, firstblk)
-	struct fs *fs;
-	ufs2_daddr_t lastblk;
-	ufs2_daddr_t firstblk;
+distance(struct fs *fs, ufs2_daddr_t lastblk, ufs2_daddr_t firstblk)
 {
 	static char buf[100];
 	int cgfirst, cglast;
 
 	if (lastblk == 0)
 		return ("");
 
 	cgfirst = dtog(fs, firstblk);
 	cglast = dtog(fs, lastblk);
 	if (cgfirst != cglast)
 		snprintf(buf, sizeof(buf), " cg %d blk %jd to cg %d blk %jd",
 		    cglast, (intmax_t)dtogd(fs, lastblk), cgfirst,
 		    (intmax_t)dtogd(fs, firstblk));
 	else
 		snprintf(buf, sizeof(buf), " distance %jd",
 		    (intmax_t)(firstblk - lastblk - 1));
 	return (buf);
 }
 	
 
 /* Names of the indirect levels; printblk() indexes this with -lastlbn. */
 static const char *indirname[UFS_NIADDR] = { "First", "Second", "Third" };
 
 /*
  * Accumulate consecutive blocks into extents and print each extent once
  * it is complete.
  *
  * State is kept in static variables between calls: seq is the number of
  * blocks in the pending extent, totfrags its fragment count, firstblk
  * its first block, lastblk the last fragment of the previously printed
  * extent and lastindirblk the last fragment of the previously printed
  * indirect block.
  *
  * lbn is the logical block being reported, blkno its disk address and
  * numfrags its length in fragments.  lastlbn selects the mode:
  *   > 0   a data block; callers pass the number of logical blocks;
  *   <= 0  flush the pending extent; unless blkno is 0 with an extent
  *         pending, blkno is then printed as an indirect block named by
  *         indirname[-lastlbn].
  */
 static void
-printblk(fs, lbn, blkno, numfrags, lastlbn)
-	struct fs *fs;
-	ufs_lbn_t lbn;
-	ufs2_daddr_t blkno;
-	int numfrags;
-	ufs_lbn_t lastlbn;
+printblk(struct fs *fs, ufs_lbn_t lbn, ufs2_daddr_t blkno, int numfrags,
+	ufs_lbn_t lastlbn)
 {
 	static int seq;
 	static ufs2_daddr_t totfrags, lastindirblk, lastblk, firstblk;
 
 	if (lastlbn <= 0)
 		goto flush;
 	/* Nothing pending: this block starts a new extent. */
 	if (seq == 0) {
 		seq = howmany(numfrags, fs->fs_frag);
 		totfrags = numfrags;
 		firstblk = blkno;
 		return;
 	}
 	/* Logical block 0 starts over: discard all remembered state. */
 	if (lbn == 0) {
 		seq = howmany(numfrags, fs->fs_frag);
 		totfrags = numfrags;
 		lastblk = 0;
 		firstblk = blkno;
 		lastindirblk = 0;
 		return;
 	}
 	/*
 	 * Extend the pending extent when this block continues it: either
 	 * the same kind of hole/BLK_NOCOPY/BLK_SNAP marker, or the disk
 	 * block immediately following the extent.
 	 */
 	if (lbn < lastlbn && ((firstblk == 0 && blkno == 0) ||
 	    (firstblk == BLK_NOCOPY && blkno == BLK_NOCOPY) ||
 	    (firstblk == BLK_SNAP && blkno == BLK_SNAP) ||
 	    blkno == firstblk + seq * fs->fs_frag)) {
 		seq += howmany(numfrags, fs->fs_frag);
 		totfrags += numfrags;
 		return;
 	}
 flush:
 	if (seq == 0)
 		goto prtindir;
 	/*
 	 * Print the pending extent.
 	 * NOTE(review): the <= test presumably relies on 0, BLK_NOCOPY and
 	 * BLK_SNAP being the only values not above BLK_SNAP -- confirm
 	 * against their definitions.
 	 */
 	if (firstblk <= BLK_SNAP) {
 		if (seq == 1)
 			printf("\tlbn %jd %s\n", (intmax_t)(lbn - seq),
 			    firstblk == 0 ? "hole" :
 			    firstblk == BLK_NOCOPY ? "nocopy" :
 			    "snapblk");
 		else
 			printf("\tlbn %jd-%jd %s\n",
 			    (intmax_t)lbn - seq, (intmax_t)lbn - 1,
 			    firstblk == 0 ? "hole" :
 			    firstblk == BLK_NOCOPY ? "nocopy" :
 			    "snapblk");
 	} else if (seq == 1) {
 		if (totfrags == 1)
 			printf("\tlbn %jd blkno %jd%s\n", (intmax_t)(lbn - seq),
 			   (intmax_t)firstblk, distance(fs, lastblk, firstblk));
 		else
 			printf("\tlbn %jd blkno %jd-%jd%s\n",
 			    (intmax_t)(lbn - seq), (intmax_t)firstblk,
 			    (intmax_t)(firstblk + totfrags - 1),
 			    distance(fs, lastblk, firstblk));
 		lastblk = firstblk + totfrags - 1;
 	} else {
 		printf("\tlbn %jd-%jd blkno %jd-%jd%s\n", (intmax_t)(lbn - seq),
 		    (intmax_t)(lbn - 1), (intmax_t)firstblk,
 		    (intmax_t)(firstblk + totfrags - 1),
 		    distance(fs, lastblk, firstblk));
 		lastblk = firstblk + totfrags - 1;
 	}
 	/*
 	 * A data block (or a zero blkno, as in the caller's final dummy
 	 * flush) becomes the start of the next pending extent.
 	 */
 	if (lastlbn > 0 || blkno == 0) {
 		seq = 1;
 		totfrags = numfrags;
 		firstblk = blkno;
 		return;
 	}
 prtindir:
 	/*
 	 * If an extent was just printed, measure the indirect block's
 	 * distance from it when fs_metaspace is 0 or no indirect block has
 	 * been printed yet; otherwise measure from the previous indirect.
 	 */
 	if (seq != 0 && (fs->fs_metaspace == 0 || lastindirblk == 0))
 		lastindirblk = lastblk;
 	printf("%s-level indirect, blkno %jd-%jd%s\n", indirname[-lastlbn],
 	    (intmax_t)blkno, (intmax_t)(blkno + numfrags - 1),
 	    distance(fs, lastindirblk, blkno));
 	lastindirblk = blkno + numfrags - 1;
 	if (fs->fs_metaspace == 0)
 		lastblk = lastindirblk;
 	/* No extent is pending after an indirect block line. */
 	seq = 0;
 }