repair/phase2.c - pub/scm/linux/kernel/git/djwong/xfsprogs-dev - Git at Google

 // SPDX-License-Identifier: GPL-2.0
 /*
  * Copyright (c) 2000-2002,2005 Silicon Graphics, Inc.
  * All Rights Reserved.
  */

 #include "libxfs.h"
 #include "libxlog.h"
 #include "avl.h"
 #include "globals.h"
 #include "agheader.h"
 #include "protos.h"
 #include "err_protos.h"
 #include "incore.h"
 #include "progress.h"
 #include "scan.h"

 /* workaround craziness in the xlog routines */
 int xlog_recover_do_trans(struct xlog *log, struct xlog_recover *t, int p)
 {
 	return 0;
 }

 static void
 zero_log(
 	struct xfs_mount	*mp)
 {
 	int			error;
 	xfs_daddr_t		head_blk;
 	xfs_daddr_t		tail_blk;
 	struct xlog		*log = mp->m_log;

 	xlog_init(mp, mp->m_log);

 	/*
 	 * Find the log head and tail and alert the user to the situation if the
 	 * log appears corrupted or contains data. In either case, we do not
 	 * proceed past this point unless the user explicitly requests to zap
 	 * the log.
 	 */
 	error = xlog_find_tail(log, &head_blk, &tail_blk);
 	if (error) {
 		do_warn(
 		_("zero_log: cannot find log head/tail (xlog_find_tail=%d)\n"),
 			error);
 		if (!no_modify && !zap_log) {
 			do_warn(_(
 "ERROR: The log head and/or tail cannot be discovered. Attempt to mount the\n"
 "filesystem to replay the log or use the -L option to destroy the log and\n"
 "attempt a repair.\n"));
 			exit(2);
 		}
 	} else {
 		if (verbose) {
 			do_log(
 	_("zero_log: head block %" PRId64 " tail block %" PRId64 "\n"),
 				head_blk, tail_blk);
 		}
 		if (head_blk != tail_blk) {
 			if (!no_modify && zap_log) {
 				do_warn(_(
 "ALERT: The filesystem has valuable metadata changes in a log which is being\n"
 "destroyed because the -L option was used.\n"));
 			} else if (no_modify) {
 				do_warn(_(
 "ALERT: The filesystem has valuable metadata changes in a log which is being\n"
 "ignored because the -n option was used.  Expect spurious inconsistencies\n"
 "which may be resolved by first mounting the filesystem to replay the log.\n"));
 			} else {
 				do_warn(_(
 "ERROR: The filesystem has valuable metadata changes in a log which needs to\n"
 "be replayed.  Mount the filesystem to replay the log, and unmount it before\n"
 "re-running xfs_repair.  If you are unable to mount the filesystem, then use\n"
 "the -L option to destroy the log and attempt a repair.\n"
 "Note that destroying the log may cause corruption -- please attempt a mount\n"
 "of the filesystem before doing this.\n"));
 				exit(2);
 			}
 		}
 	}

 	/*
 	 * Only clear the log when explicitly requested. Doing so is unnecessary
 	 * unless something is wrong. Further, this resets the current LSN of
 	 * the filesystem and creates more work for repair of v5 superblock
 	 * filesystems.
 	 */
 	if (!no_modify && zap_log) {
 		libxfs_log_clear(log->l_dev, NULL,
 			XFS_FSB_TO_DADDR(mp, mp->m_sb.sb_logstart),
 			(xfs_extlen_t)XFS_FSB_TO_BB(mp, mp->m_sb.sb_logblocks),
 			&mp->m_sb.sb_uuid,
 			xfs_has_logv2(mp) ? 2 : 1,
 			mp->m_sb.sb_logsunit, XLOG_FMT, XLOG_INIT_CYCLE, true);

 		/* update the log data structure with new state */
 		error = xlog_find_tail(log, &head_blk, &tail_blk);
 		if (error || head_blk != tail_blk)
 			do_error(_("failed to clear log"));
 	}

 	/* And we are now magically complete! */
 	PROG_RPT_INC(prog_rpt_done[0], mp->m_sb.sb_logblocks);

 	/*
 	 * Finally, seed the max LSN from the current state of the log if this
 	 * is a v5 filesystem.
 	 */
 	if (xfs_has_crc(mp))
 		libxfs_max_lsn = atomic64_read(&log->l_last_sync_lsn);
 }

 static bool
 set_inobtcount(
 	struct xfs_mount	*mp,
 	struct xfs_sb		*new_sb)
 {
 	if (!xfs_has_crc(mp)) {
 		printf(
 	_("Inode btree count feature only supported on V5 filesystems.\n"));
 		exit(0);
 	}

 	if (!xfs_has_finobt(mp)) {
 		printf(
 	_("Inode btree count feature requires free inode btree.\n"));
 		exit(0);
 	}

 	if (xfs_has_inobtcounts(mp)) {
 		printf(_("Filesystem already has inode btree counts.\n"));
 		exit(0);
 	}

 	printf(_("Adding inode btree counts to filesystem.\n"));
 	new_sb->sb_features_ro_compat |= XFS_SB_FEAT_RO_COMPAT_INOBTCNT;
 	new_sb->sb_features_incompat |= XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR;
 	return true;
 }

 static bool
 set_bigtime(
 	struct xfs_mount	*mp,
 	struct xfs_sb		*new_sb)
 {
 	if (!xfs_has_crc(mp)) {
 		printf(
 	_("Large timestamp feature only supported on V5 filesystems.\n"));
 		exit(0);
 	}

 	if (xfs_has_bigtime(mp)) {
 		printf(_("Filesystem already supports large timestamps.\n"));
 		exit(0);
 	}

 	printf(_("Adding large timestamp support to filesystem.\n"));
 	new_sb->sb_features_incompat |= (XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR |
 					 XFS_SB_FEAT_INCOMPAT_BIGTIME);
 	return true;
 }

 static bool
 set_nrext64(
 	struct xfs_mount	*mp,
 	struct xfs_sb		*new_sb)
 {
 	if (!xfs_has_crc(mp)) {
 		printf(
 	_("Nrext64 only supported on V5 filesystems.\n"));
 		exit(0);
 	}

 	if (xfs_has_large_extent_counts(mp)) {
 		printf(_("Filesystem already supports nrext64.\n"));
 		exit(0);
 	}

 	printf(_("Adding nrext64 to filesystem.\n"));
 	new_sb->sb_features_incompat |= XFS_SB_FEAT_INCOMPAT_NREXT64;
 	new_sb->sb_features_incompat |= XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR;
 	return true;
 }

 static bool
 set_exchrange(
 	struct xfs_mount	*mp,
 	struct xfs_sb		*new_sb)
 {
 	if (xfs_has_exchange_range(mp)) {
 		printf(_("Filesystem already supports exchange-range.\n"));
 		exit(0);
 	}

 	if (!xfs_has_crc(mp)) {
 		printf(
 	_("File exchange-range feature only supported on V5 filesystems.\n"));
 		exit(0);
 	}

 	if (!xfs_has_reflink(mp)) {
 		printf(
 	_("File exchange-range feature cannot be added without reflink.\n"));
 		exit(0);
 	}

 	printf(_("Adding file exchange-range support to filesystem.\n"));
 	new_sb->sb_features_incompat |= XFS_SB_FEAT_INCOMPAT_EXCHRANGE;
 	new_sb->sb_features_incompat |= XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR;
 	return true;
 }

 struct check_state {
 	struct xfs_sb		sb;
 	uint64_t		features;
 	bool			finobt_nores;
 };

 static inline void
 capture_old_state(
 	struct check_state	*old_state,
 	const struct xfs_mount	*mp)
 {
 	memcpy(&old_state->sb, &mp->m_sb, sizeof(struct xfs_sb));
 	old_state->finobt_nores = mp->m_finobt_nores;
 	old_state->features = mp->m_features;
 }

 static inline void
 restore_old_state(
 	struct xfs_mount		*mp,
 	const struct check_state	*old_state)
 {
 	memcpy(&mp->m_sb, &old_state->sb, sizeof(struct xfs_sb));
 	mp->m_finobt_nores = old_state->finobt_nores;
 	mp->m_features = old_state->features;
 	libxfs_compute_all_maxlevels(mp);
 	libxfs_trans_init(mp);
 }

 static inline void
 install_new_state(
 	struct xfs_mount	*mp,
 	struct xfs_sb		*new_sb)
 {
 	memcpy(&mp->m_sb, new_sb, sizeof(struct xfs_sb));
 	mp->m_features |= libxfs_sb_version_to_features(new_sb);
 	libxfs_compute_all_maxlevels(mp);
 	libxfs_trans_init(mp);
 }

 #define GIGABYTES(count, blog)     ((uint64_t)(count) << (30 - (blog)))
 static inline bool
 check_free_space(
 	struct xfs_mount	*mp,
 	unsigned long long	avail,
 	unsigned long long	total)
 {
 	/* Ok if there's more than 10% free. */
 	if (avail >= total / 10)
 		return true;

 	/* Not ok if there's less than 5% free. */
 	if (avail < total / 5)
 		return false;

 	/* Let it slide if there's at least 10GB free. */
 	return avail > GIGABYTES(10, mp->m_sb.sb_blocklog);
 }

 static void
 check_fs_free_space(
 	struct xfs_mount		*mp,
 	const struct check_state	*old,
 	struct xfs_sb			*new_sb)
 {
 	struct xfs_perag		*pag = NULL;
 	int				error;

 	/* Make sure we have enough space for per-AG reservations. */
 	while ((pag = xfs_perag_next(mp, pag))) {
 		struct xfs_trans	*tp;
 		struct xfs_agf		*agf;
 		struct xfs_buf		*agi_bp, *agf_bp;
 		unsigned int		avail, agblocks;

 		/* Put back the old super so that we can read AG headers. */
 		restore_old_state(mp, old);

 		/*
 		 * Create a dummy transaction so that we can load the AGI and
 		 * AGF buffers in memory with the old fs geometry and pin them
 		 * there while we try to make a per-AG reservation with the new
 		 * geometry.
 		 */
 		error = -libxfs_trans_alloc_empty(mp, &tp);
 		if (error)
 			do_error(
 	_("Cannot reserve resources for upgrade check, err=%d.\n"),
 					error);

 		error = -libxfs_ialloc_read_agi(pag, tp, 0, &agi_bp);
 		if (error)
 			do_error(
 	_("Cannot read AGI %u for upgrade check, err=%d.\n"),
 					pag_agno(pag), error);

 		error = -libxfs_alloc_read_agf(pag, tp, 0, &agf_bp);
 		if (error)
 			do_error(
 	_("Cannot read AGF %u for upgrade check, err=%d.\n"),
 					pag_agno(pag), error);
 		agf = agf_bp->b_addr;
 		agblocks = be32_to_cpu(agf->agf_length);

 		/*
 		 * Install the new superblock and try to make a per-AG space
 		 * reservation with the new geometry.  We pinned the AG header
 		 * buffers to the transaction, so we shouldn't hit any
 		 * corruption errors on account of the new geometry.
 		 */
 		install_new_state(mp, new_sb);

 		error = -libxfs_ag_resv_init(pag, tp);
 		if (error == ENOSPC) {
 			printf(
 	_("Not enough free space would remain in AG %u for metadata.\n"),
 					pag_agno(pag));
 			exit(1);
 		}
 		if (error)
 			do_error(
 	_("Error %d while checking AG %u space reservation.\n"),
 					error, pag_agno(pag));

 		/*
 		 * Would the post-upgrade filesystem have enough free space in
 		 * this AG after making per-AG reservations?
 		 */
 		avail = pag->pagf_freeblks + pag->pagf_flcount;
 		avail -= pag->pag_meta_resv.ar_reserved;
 		avail -= pag->pag_rmapbt_resv.ar_asked;

 		if (!check_free_space(mp, avail, agblocks)) {
 			printf(
 	_("AG %u will be low on space after upgrade.\n"),
 					pag_agno(pag));
 			exit(1);
 		}
 		libxfs_trans_cancel(tp);
 	}

 	/*
 	 * Would the post-upgrade filesystem have enough free space on the data
 	 * device after making per-AG reservations?
 	 */
 	if (!check_free_space(mp, mp->m_sb.sb_fdblocks, mp->m_sb.sb_dblocks)) {
 		printf(_("Filesystem will be low on space after upgrade.\n"));
 		exit(1);
 	}

 	/*
 	 * Release the per-AG reservations and mark the per-AG structure as
 	 * uninitialized so that we don't trip over stale cached counters
 	 * after the upgrade/
 	 */
 	while ((pag = xfs_perag_next(mp, pag))) {
 		libxfs_ag_resv_free(pag);
 		clear_bit(XFS_AGSTATE_AGF_INIT, &pag->pag_opstate);
 		clear_bit(XFS_AGSTATE_AGI_INIT, &pag->pag_opstate);
 	}
 }

 static bool
 need_check_fs_free_space(
 	struct xfs_mount		*mp,
 	const struct check_state	*old)
 {
 	return false;
 }

 /*
  * Make sure we can actually upgrade this (v5) filesystem without running afoul
  * of root inode or log size requirements that would prevent us from mounting
  * the filesystem.  If everything checks out, commit the new geometry.
  */
 static void
 install_new_geometry(
 	struct xfs_mount	*mp,
 	struct xfs_sb		*new_sb)
 {
 	struct check_state	old;
 	xfs_ino_t		rootino;
 	int			min_logblocks;

 	capture_old_state(&old, mp);
 	install_new_state(mp, new_sb);

 	/*
 	 * The existing log must be large enough to satisfy the new minimum log
 	 * size requirements.
 	 */
 	min_logblocks = libxfs_log_calc_minimum_size(mp);
 	if (old.sb.sb_logblocks < min_logblocks) {
 		printf(
 	_("Filesystem log too small to upgrade filesystem; need %u blocks, have %u.\n"),
 				min_logblocks, old.sb.sb_logblocks);
 		exit(1);
 	}

 	/*
 	 * The root inode must be where xfs_repair will expect it to be with
 	 * the new geometry.
 	 */
 	rootino = libxfs_ialloc_calc_rootino(mp, new_sb->sb_unit);
 	if (old.sb.sb_rootino != rootino) {
 		printf(
 	_("Cannot upgrade filesystem, root inode (%llu) cannot be moved to %llu.\n"),
 				(unsigned long long)old.sb.sb_rootino,
 				(unsigned long long)rootino);
 		exit(1);
 	}

 	if (need_check_fs_free_space(mp, &old))
 		check_fs_free_space(mp, &old, new_sb);

 	/*
 	 * Restore the old state to get everything back to a clean state,
 	 * upgrade the featureset one more time, and recompute the btree max
 	 * levels for this filesystem.
 	 */
 	restore_old_state(mp, &old);
 	install_new_state(mp, new_sb);
 }

 /* Perform the user's requested upgrades on filesystem. */
 static void
 upgrade_filesystem(
 	struct xfs_mount	*mp)
 {
 	struct xfs_sb		new_sb;
 	struct xfs_buf		*bp;
 	bool			dirty = false;
 	int			error;

 	memcpy(&new_sb, &mp->m_sb, sizeof(struct xfs_sb));

 	if (add_inobtcount)
 		dirty |= set_inobtcount(mp, &new_sb);
 	if (add_bigtime)
 		dirty |= set_bigtime(mp, &new_sb);
 	if (add_nrext64)
 		dirty |= set_nrext64(mp, &new_sb);
 	if (add_exchrange)
 		dirty |= set_exchrange(mp, &new_sb);
 	if (!dirty)
 		return;

 	install_new_geometry(mp, &new_sb);
 	if (no_modify)
 		return;

 	bp = libxfs_getsb(mp);
 	if (!bp || bp->b_error)
 		do_error(
 	_("couldn't get superblock for feature upgrade, err=%d\n"),
 				bp ? bp->b_error : ENOMEM);

 	libxfs_sb_to_disk(bp->b_addr, &mp->m_sb);

 	/*
 	 * Write the primary super to disk immediately so that needsrepair will
 	 * be set if repair doesn't complete.
 	 */
 	error = -libxfs_bwrite(bp);
 	if (error)
 		do_error(
 	_("filesystem feature upgrade failed, err=%d\n"),
 				error);

 	libxfs_buf_relse(bp);
 	features_changed = true;
 }

 /*
  * ok, at this point, the fs is mounted but the root inode may be
  * trashed and the ag headers haven't been checked.  So we have
  * a valid xfs_mount_t and superblock but that's about it.  That
  * means we can use macros that use mount/sb fields in calculations
  * but I/O or btree routines that depend on space maps or inode maps
  * being correct are verboten.
  */

 void
 phase2(
 	struct xfs_mount	*mp,
 	int			scan_threads)
 {
 	ino_tree_node_t		*ino_rec;
 	unsigned int		inuse = xfs_rootrec_inodes_inuse(mp), j;

 	/* now we can start using the buffer cache routines */
 	set_mp(mp);

 	/* Check whether this fs has internal or external log */
 	if (mp->m_sb.sb_logstart == 0) {
 		if (!x.log.name)
 			do_error(_("This filesystem has an external log.  "
 				   "Specify log device with the -l option.\n"));

 		do_log(_("Phase 2 - using external log on %s\n"), x.log.name);
 	} else
 		do_log(_("Phase 2 - using internal log\n"));

 	/*
 	 * Now that we've set up the buffer cache the way we want it, try to
 	 * grab our own reference to the primary sb so that the hooks will not
 	 * have to call out to the buffer cache.
 	 */
 	if (mp->m_buf_writeback_fn)
 		retain_primary_sb(mp);

 	/* Zero log if applicable */
 	do_log(_("        - zero log...\n"));

 	set_progress_msg(PROG_FMT_ZERO_LOG, (uint64_t)mp->m_sb.sb_logblocks);
 	zero_log(mp);
 	print_final_rpt();

 	do_log(_("        - scan filesystem freespace and inode maps...\n"));

 	bad_ino_btree = 0;

 	set_progress_msg(PROG_FMT_SCAN_AG, (uint64_t) glob_agcount);

 	scan_ags(mp, scan_threads);

 	print_final_rpt();

 	/*
 	 * make sure we know about the root inode chunk
 	 */
 	if ((ino_rec = find_inode_rec(mp, 0, mp->m_sb.sb_rootino)) == NULL)  {
 		struct xfs_sb	*sb = &mp->m_sb;

 		if (xfs_has_metadir(mp))
 			ASSERT(sb->sb_metadirino == sb->sb_rootino + 1 &&
 			       sb->sb_rbmino  == sb->sb_rootino + 2 &&
 			       sb->sb_rsumino == sb->sb_rootino + 3);
 		else
 			ASSERT(sb->sb_rbmino  == sb->sb_rootino + 1 &&
 			       sb->sb_rsumino == sb->sb_rootino + 2);
 		do_warn(_("root inode chunk not found\n"));

 		/*
 		 * mark the first 3-4 inodes used, the rest are free
 		 */
 		ino_rec = set_inode_used_alloc(mp, 0,
 				XFS_INO_TO_AGINO(mp, sb->sb_rootino));
 		for (j = 1; j < inuse; j++) {
 			set_inode_used(ino_rec, j);
 			set_inode_is_meta(ino_rec, j);
 		}

 		for (j = inuse; j < XFS_INODES_PER_CHUNK; j++)
 			set_inode_free(ino_rec, j);

 		/*
 		 * also mark blocks
 		 */
 		set_bmap_ext(0, XFS_INO_TO_AGBNO(mp, sb->sb_rootino),
 			     M_IGEO(mp)->ialloc_blks, XR_E_INO);
 	} else  {
 		do_log(_("        - found root inode chunk\n"));
 		j = 0;

 		/*
 		 * blocks are marked, just make sure they're in use
 		 */
 		if (is_inode_free(ino_rec, j)) {
 			do_warn(_("root inode marked free, "));
 			set_inode_used(ino_rec, j);
 			if (!no_modify)
 				do_warn(_("correcting\n"));
 			else
 				do_warn(_("would correct\n"));
 		}
 		j++;

 		if (xfs_has_metadir(mp)) {
 			if (is_inode_free(ino_rec, j))  {
 				do_warn(_("metadata root inode marked free, "));
 				set_inode_used(ino_rec, j);
 				if (!no_modify)
 					do_warn(_("correcting\n"));
 				else
 					do_warn(_("would correct\n"));
 			}
 			set_inode_is_meta(ino_rec, j);
 			j++;
 		}

 		if (is_inode_free(ino_rec, j))  {
 			do_warn(_("realtime bitmap inode marked free, "));
 			set_inode_used(ino_rec, j);
 			if (!no_modify)
 				do_warn(_("correcting\n"));
 			else
 				do_warn(_("would correct\n"));
 		}
 		set_inode_is_meta(ino_rec, j);
 		j++;

 		if (is_inode_free(ino_rec, j))  {
 			do_warn(_("realtime summary inode marked free, "));
 			set_inode_used(ino_rec, j);
 			if (!no_modify)
 				do_warn(_("correcting\n"));
 			else
 				do_warn(_("would correct\n"));
 		}
 		set_inode_is_meta(ino_rec, j);
 		j++;
 	}

 	/*
 	 * Upgrade the filesystem now that we've done a preliminary check of
 	 * the superblocks, the AGs, the log, and the metadata inodes.
 	 */
 	upgrade_filesystem(mp);
 }
	// SPDX-License-Identifier: GPL-2.0
	/*
	* Copyright (c) 2000-2002,2005 Silicon Graphics, Inc.
	* All Rights Reserved.
	*/

	#include "libxfs.h"
	#include "libxlog.h"
	#include "avl.h"
	#include "globals.h"
	#include "agheader.h"
	#include "protos.h"
	#include "err_protos.h"
	#include "incore.h"
	#include "progress.h"
	#include "scan.h"

	/* workaround craziness in the xlog routines */
	int xlog_recover_do_trans(struct xlog log, struct xlog_recover t, int p)
	{
	return 0;
	}

	static void
	zero_log(
	struct xfs_mount *mp)
	{
	int error;
	xfs_daddr_t head_blk;
	xfs_daddr_t tail_blk;
	struct xlog *log = mp->m_log;

	xlog_init(mp, mp->m_log);

	/*
	* Find the log head and tail and alert the user to the situation if the
	* log appears corrupted or contains data. In either case, we do not
	* proceed past this point unless the user explicitly requests to zap
	* the log.
	*/
	error = xlog_find_tail(log, &head_blk, &tail_blk);
	if (error) {
	do_warn(
	_("zero_log: cannot find log head/tail (xlog_find_tail=%d)\n"),
	error);
	if (!no_modify && !zap_log) {
	do_warn(_(
	"ERROR: The log head and/or tail cannot be discovered. Attempt to mount the\n"
	"filesystem to replay the log or use the -L option to destroy the log and\n"
	"attempt a repair.\n"));
	exit(2);
	}
	} else {
	if (verbose) {
	do_log(
	_("zero_log: head block %" PRId64 " tail block %" PRId64 "\n"),
	head_blk, tail_blk);
	}
	if (head_blk != tail_blk) {
	if (!no_modify && zap_log) {
	do_warn(_(
	"ALERT: The filesystem has valuable metadata changes in a log which is being\n"
	"destroyed because the -L option was used.\n"));
	} else if (no_modify) {
	do_warn(_(
	"ALERT: The filesystem has valuable metadata changes in a log which is being\n"
	"ignored because the -n option was used. Expect spurious inconsistencies\n"
	"which may be resolved by first mounting the filesystem to replay the log.\n"));
	} else {
	do_warn(_(
	"ERROR: The filesystem has valuable metadata changes in a log which needs to\n"
	"be replayed. Mount the filesystem to replay the log, and unmount it before\n"
	"re-running xfs_repair. If you are unable to mount the filesystem, then use\n"
	"the -L option to destroy the log and attempt a repair.\n"
	"Note that destroying the log may cause corruption -- please attempt a mount\n"
	"of the filesystem before doing this.\n"));
	exit(2);
	}
	}
	}

	/*
	* Only clear the log when explicitly requested. Doing so is unnecessary
	* unless something is wrong. Further, this resets the current LSN of
	* the filesystem and creates more work for repair of v5 superblock
	* filesystems.
	*/
	if (!no_modify && zap_log) {
	libxfs_log_clear(log->l_dev, NULL,
	XFS_FSB_TO_DADDR(mp, mp->m_sb.sb_logstart),
	(xfs_extlen_t)XFS_FSB_TO_BB(mp, mp->m_sb.sb_logblocks),
	&mp->m_sb.sb_uuid,
	xfs_has_logv2(mp) ? 2 : 1,
	mp->m_sb.sb_logsunit, XLOG_FMT, XLOG_INIT_CYCLE, true);

	/* update the log data structure with new state */
	error = xlog_find_tail(log, &head_blk, &tail_blk);
	if (error \|\| head_blk != tail_blk)
	do_error(_("failed to clear log"));
	}

	/* And we are now magically complete! */
	PROG_RPT_INC(prog_rpt_done[0], mp->m_sb.sb_logblocks);

	/*
	* Finally, seed the max LSN from the current state of the log if this
	* is a v5 filesystem.
	*/
	if (xfs_has_crc(mp))
	libxfs_max_lsn = atomic64_read(&log->l_last_sync_lsn);
	}

	static bool
	set_inobtcount(
	struct xfs_mount *mp,
	struct xfs_sb *new_sb)
	{
	if (!xfs_has_crc(mp)) {
	printf(
	_("Inode btree count feature only supported on V5 filesystems.\n"));
	exit(0);
	}

	if (!xfs_has_finobt(mp)) {
	printf(
	_("Inode btree count feature requires free inode btree.\n"));
	exit(0);
	}

	if (xfs_has_inobtcounts(mp)) {
	printf(_("Filesystem already has inode btree counts.\n"));
	exit(0);
	}

	printf(_("Adding inode btree counts to filesystem.\n"));
	new_sb->sb_features_ro_compat \|= XFS_SB_FEAT_RO_COMPAT_INOBTCNT;
	new_sb->sb_features_incompat \|= XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR;
	return true;
	}

	static bool
	set_bigtime(
	struct xfs_mount *mp,
	struct xfs_sb *new_sb)
	{
	if (!xfs_has_crc(mp)) {
	printf(
	_("Large timestamp feature only supported on V5 filesystems.\n"));
	exit(0);
	}

	if (xfs_has_bigtime(mp)) {
	printf(_("Filesystem already supports large timestamps.\n"));
	exit(0);
	}

	printf(_("Adding large timestamp support to filesystem.\n"));
	new_sb->sb_features_incompat \|= (XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR \|
	XFS_SB_FEAT_INCOMPAT_BIGTIME);
	return true;
	}

	static bool
	set_nrext64(
	struct xfs_mount *mp,
	struct xfs_sb *new_sb)
	{
	if (!xfs_has_crc(mp)) {
	printf(
	_("Nrext64 only supported on V5 filesystems.\n"));
	exit(0);
	}

	if (xfs_has_large_extent_counts(mp)) {
	printf(_("Filesystem already supports nrext64.\n"));
	exit(0);
	}

	printf(_("Adding nrext64 to filesystem.\n"));
	new_sb->sb_features_incompat \|= XFS_SB_FEAT_INCOMPAT_NREXT64;
	new_sb->sb_features_incompat \|= XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR;
	return true;
	}

	static bool
	set_exchrange(
	struct xfs_mount *mp,
	struct xfs_sb *new_sb)
	{
	if (xfs_has_exchange_range(mp)) {
	printf(_("Filesystem already supports exchange-range.\n"));
	exit(0);
	}

	if (!xfs_has_crc(mp)) {
	printf(
	_("File exchange-range feature only supported on V5 filesystems.\n"));
	exit(0);
	}

	if (!xfs_has_reflink(mp)) {
	printf(
	_("File exchange-range feature cannot be added without reflink.\n"));
	exit(0);
	}

	printf(_("Adding file exchange-range support to filesystem.\n"));
	new_sb->sb_features_incompat \|= XFS_SB_FEAT_INCOMPAT_EXCHRANGE;
	new_sb->sb_features_incompat \|= XFS_SB_FEAT_INCOMPAT_NEEDSREPAIR;
	return true;
	}

	struct check_state {
	struct xfs_sb sb;
	uint64_t features;
	bool finobt_nores;
	};

	static inline void
	capture_old_state(
	struct check_state *old_state,
	const struct xfs_mount *mp)
	{
	memcpy(&old_state->sb, &mp->m_sb, sizeof(struct xfs_sb));
	old_state->finobt_nores = mp->m_finobt_nores;
	old_state->features = mp->m_features;
	}

	static inline void
	restore_old_state(
	struct xfs_mount *mp,
	const struct check_state *old_state)
	{
	memcpy(&mp->m_sb, &old_state->sb, sizeof(struct xfs_sb));
	mp->m_finobt_nores = old_state->finobt_nores;
	mp->m_features = old_state->features;
	libxfs_compute_all_maxlevels(mp);
	libxfs_trans_init(mp);
	}

	static inline void
	install_new_state(
	struct xfs_mount *mp,
	struct xfs_sb *new_sb)
	{
	memcpy(&mp->m_sb, new_sb, sizeof(struct xfs_sb));
	mp->m_features \|= libxfs_sb_version_to_features(new_sb);
	libxfs_compute_all_maxlevels(mp);
	libxfs_trans_init(mp);
	}

	#define GIGABYTES(count, blog) ((uint64_t)(count) << (30 - (blog)))
	static inline bool
	check_free_space(
	struct xfs_mount *mp,
	unsigned long long avail,
	unsigned long long total)
	{
	/* Ok if there's more than 10% free. */
	if (avail >= total / 10)
	return true;

	/* Not ok if there's less than 5% free. */
	if (avail < total / 5)
	return false;

	/* Let it slide if there's at least 10GB free. */
	return avail > GIGABYTES(10, mp->m_sb.sb_blocklog);
	}

	static void
	check_fs_free_space(
	struct xfs_mount *mp,
	const struct check_state *old,
	struct xfs_sb *new_sb)
	{
	struct xfs_perag *pag = NULL;
	int error;

	/* Make sure we have enough space for per-AG reservations. */
	while ((pag = xfs_perag_next(mp, pag))) {
	struct xfs_trans *tp;
	struct xfs_agf *agf;
	struct xfs_buf agi_bp, agf_bp;
	unsigned int avail, agblocks;

	/* Put back the old super so that we can read AG headers. */
	restore_old_state(mp, old);

	/*
	* Create a dummy transaction so that we can load the AGI and
	* AGF buffers in memory with the old fs geometry and pin them
	* there while we try to make a per-AG reservation with the new
	* geometry.
	*/
	error = -libxfs_trans_alloc_empty(mp, &tp);
	if (error)
	do_error(
	_("Cannot reserve resources for upgrade check, err=%d.\n"),
	error);

	error = -libxfs_ialloc_read_agi(pag, tp, 0, &agi_bp);
	if (error)
	do_error(
	_("Cannot read AGI %u for upgrade check, err=%d.\n"),
	pag_agno(pag), error);

	error = -libxfs_alloc_read_agf(pag, tp, 0, &agf_bp);
	if (error)
	do_error(
	_("Cannot read AGF %u for upgrade check, err=%d.\n"),
	pag_agno(pag), error);
	agf = agf_bp->b_addr;
	agblocks = be32_to_cpu(agf->agf_length);

	/*
	* Install the new superblock and try to make a per-AG space
	* reservation with the new geometry. We pinned the AG header
	* buffers to the transaction, so we shouldn't hit any
	* corruption errors on account of the new geometry.
	*/
	install_new_state(mp, new_sb);

	error = -libxfs_ag_resv_init(pag, tp);
	if (error == ENOSPC) {
	printf(
	_("Not enough free space would remain in AG %u for metadata.\n"),
	pag_agno(pag));
	exit(1);
	}
	if (error)
	do_error(
	_("Error %d while checking AG %u space reservation.\n"),
	error, pag_agno(pag));

	/*
	* Would the post-upgrade filesystem have enough free space in
	* this AG after making per-AG reservations?
	*/
	avail = pag->pagf_freeblks + pag->pagf_flcount;
	avail -= pag->pag_meta_resv.ar_reserved;
	avail -= pag->pag_rmapbt_resv.ar_asked;

	if (!check_free_space(mp, avail, agblocks)) {
	printf(
	_("AG %u will be low on space after upgrade.\n"),
	pag_agno(pag));
	exit(1);
	}
	libxfs_trans_cancel(tp);
	}

	/*
	* Would the post-upgrade filesystem have enough free space on the data
	* device after making per-AG reservations?
	*/
	if (!check_free_space(mp, mp->m_sb.sb_fdblocks, mp->m_sb.sb_dblocks)) {
	printf(_("Filesystem will be low on space after upgrade.\n"));
	exit(1);
	}

	/*
	* Release the per-AG reservations and mark the per-AG structure as
	* uninitialized so that we don't trip over stale cached counters
	* after the upgrade/
	*/
	while ((pag = xfs_perag_next(mp, pag))) {
	libxfs_ag_resv_free(pag);
	clear_bit(XFS_AGSTATE_AGF_INIT, &pag->pag_opstate);
	clear_bit(XFS_AGSTATE_AGI_INIT, &pag->pag_opstate);
	}
	}

	static bool
	need_check_fs_free_space(
	struct xfs_mount *mp,
	const struct check_state *old)
	{
	return false;
	}

	/*
	* Make sure we can actually upgrade this (v5) filesystem without running afoul
	* of root inode or log size requirements that would prevent us from mounting
	* the filesystem. If everything checks out, commit the new geometry.
	*/
	static void
	install_new_geometry(
	struct xfs_mount *mp,
	struct xfs_sb *new_sb)
	{
	struct check_state old;
	xfs_ino_t rootino;
	int min_logblocks;

	capture_old_state(&old, mp);
	install_new_state(mp, new_sb);

	/*
	* The existing log must be large enough to satisfy the new minimum log
	* size requirements.
	*/
	min_logblocks = libxfs_log_calc_minimum_size(mp);
	if (old.sb.sb_logblocks < min_logblocks) {
	printf(
	_("Filesystem log too small to upgrade filesystem; need %u blocks, have %u.\n"),
	min_logblocks, old.sb.sb_logblocks);
	exit(1);
	}

	/*
	* The root inode must be where xfs_repair will expect it to be with
	* the new geometry.
	*/
	rootino = libxfs_ialloc_calc_rootino(mp, new_sb->sb_unit);
	if (old.sb.sb_rootino != rootino) {
	printf(
	_("Cannot upgrade filesystem, root inode (%llu) cannot be moved to %llu.\n"),
	(unsigned long long)old.sb.sb_rootino,
	(unsigned long long)rootino);
	exit(1);
	}

	if (need_check_fs_free_space(mp, &old))
	check_fs_free_space(mp, &old, new_sb);

	/*
	* Restore the old state to get everything back to a clean state,
	* upgrade the featureset one more time, and recompute the btree max
	* levels for this filesystem.
	*/
	restore_old_state(mp, &old);
	install_new_state(mp, new_sb);
	}

	/* Perform the user's requested upgrades on filesystem. */
	static void
	upgrade_filesystem(
	struct xfs_mount *mp)
	{
	struct xfs_sb new_sb;
	struct xfs_buf *bp;
	bool dirty = false;
	int error;

	memcpy(&new_sb, &mp->m_sb, sizeof(struct xfs_sb));

	if (add_inobtcount)
	dirty \|= set_inobtcount(mp, &new_sb);
	if (add_bigtime)
	dirty \|= set_bigtime(mp, &new_sb);
	if (add_nrext64)
	dirty \|= set_nrext64(mp, &new_sb);
	if (add_exchrange)
	dirty \|= set_exchrange(mp, &new_sb);
	if (!dirty)
	return;

	install_new_geometry(mp, &new_sb);
	if (no_modify)
	return;

	bp = libxfs_getsb(mp);
	if (!bp \|\| bp->b_error)
	do_error(
	_("couldn't get superblock for feature upgrade, err=%d\n"),
	bp ? bp->b_error : ENOMEM);

	libxfs_sb_to_disk(bp->b_addr, &mp->m_sb);

	/*
	* Write the primary super to disk immediately so that needsrepair will
	* be set if repair doesn't complete.
	*/
	error = -libxfs_bwrite(bp);
	if (error)
	do_error(
	_("filesystem feature upgrade failed, err=%d\n"),
	error);

	libxfs_buf_relse(bp);
	features_changed = true;
	}

	/*
	* ok, at this point, the fs is mounted but the root inode may be
	* trashed and the ag headers haven't been checked. So we have
	* a valid xfs_mount_t and superblock but that's about it. That
	* means we can use macros that use mount/sb fields in calculations
	* but I/O or btree routines that depend on space maps or inode maps
	* being correct are verboten.
	*/

	void
	phase2(
	struct xfs_mount *mp,
	int scan_threads)
	{
	ino_tree_node_t *ino_rec;
	unsigned int inuse = xfs_rootrec_inodes_inuse(mp), j;

	/* now we can start using the buffer cache routines */
	set_mp(mp);

	/* Check whether this fs has internal or external log */
	if (mp->m_sb.sb_logstart == 0) {
	if (!x.log.name)
	do_error(_("This filesystem has an external log. "
	"Specify log device with the -l option.\n"));

	do_log(_("Phase 2 - using external log on %s\n"), x.log.name);
	} else
	do_log(_("Phase 2 - using internal log\n"));

	/*
	* Now that we've set up the buffer cache the way we want it, try to
	* grab our own reference to the primary sb so that the hooks will not
	* have to call out to the buffer cache.
	*/
	if (mp->m_buf_writeback_fn)
	retain_primary_sb(mp);

	/* Zero log if applicable */
	do_log(_(" - zero log...\n"));

	set_progress_msg(PROG_FMT_ZERO_LOG, (uint64_t)mp->m_sb.sb_logblocks);
	zero_log(mp);
	print_final_rpt();

	do_log(_(" - scan filesystem freespace and inode maps...\n"));

	bad_ino_btree = 0;

	set_progress_msg(PROG_FMT_SCAN_AG, (uint64_t) glob_agcount);

	scan_ags(mp, scan_threads);

	print_final_rpt();

	/*
	* make sure we know about the root inode chunk
	*/
	if ((ino_rec = find_inode_rec(mp, 0, mp->m_sb.sb_rootino)) == NULL) {
	struct xfs_sb *sb = &mp->m_sb;

	if (xfs_has_metadir(mp))
	ASSERT(sb->sb_metadirino == sb->sb_rootino + 1 &&
	sb->sb_rbmino == sb->sb_rootino + 2 &&
	sb->sb_rsumino == sb->sb_rootino + 3);
	else
	ASSERT(sb->sb_rbmino == sb->sb_rootino + 1 &&
	sb->sb_rsumino == sb->sb_rootino + 2);
	do_warn(_("root inode chunk not found\n"));

	/*
	* mark the first 3-4 inodes used, the rest are free
	*/
	ino_rec = set_inode_used_alloc(mp, 0,
	XFS_INO_TO_AGINO(mp, sb->sb_rootino));
	for (j = 1; j < inuse; j++) {
	set_inode_used(ino_rec, j);
	set_inode_is_meta(ino_rec, j);
	}

	for (j = inuse; j < XFS_INODES_PER_CHUNK; j++)
	set_inode_free(ino_rec, j);

	/*
	* also mark blocks
	*/
	set_bmap_ext(0, XFS_INO_TO_AGBNO(mp, sb->sb_rootino),
	M_IGEO(mp)->ialloc_blks, XR_E_INO);
	} else {
	do_log(_(" - found root inode chunk\n"));
	j = 0;

	/*
	* blocks are marked, just make sure they're in use
	*/
	if (is_inode_free(ino_rec, j)) {
	do_warn(_("root inode marked free, "));
	set_inode_used(ino_rec, j);
	if (!no_modify)
	do_warn(_("correcting\n"));
	else
	do_warn(_("would correct\n"));
	}
	j++;

	if (xfs_has_metadir(mp)) {
	if (is_inode_free(ino_rec, j)) {
	do_warn(_("metadata root inode marked free, "));
	set_inode_used(ino_rec, j);
	if (!no_modify)
	do_warn(_("correcting\n"));
	else
	do_warn(_("would correct\n"));
	}
	set_inode_is_meta(ino_rec, j);
	j++;
	}

	if (is_inode_free(ino_rec, j)) {
	do_warn(_("realtime bitmap inode marked free, "));
	set_inode_used(ino_rec, j);
	if (!no_modify)
	do_warn(_("correcting\n"));
	else
	do_warn(_("would correct\n"));
	}
	set_inode_is_meta(ino_rec, j);
	j++;

	if (is_inode_free(ino_rec, j)) {
	do_warn(_("realtime summary inode marked free, "));
	set_inode_used(ino_rec, j);
	if (!no_modify)
	do_warn(_("correcting\n"));
	else
	do_warn(_("would correct\n"));
	}
	set_inode_is_meta(ino_rec, j);
	j++;
	}

	/*
	* Upgrade the filesystem now that we've done a preliminary check of
	* the superblocks, the AGs, the log, and the metadata inodes.
	*/
	upgrade_filesystem(mp);
	}