# tests/xfs/057 - pub/scm/linux/kernel/git/dgc/xfstests-dev - Git at Google

 #! /bin/bash
 # FS QA Test No. 057
 #
 # Attempt to reproduce log recovery failure by writing corrupt log records over
 # the last good tail in the log. The tail is force pinned while a workload runs
 # the head as close as possible behind the tail. Once the head is pinned,
 # corrupted log records are written to the log and the filesystem shuts down.
 #
 # While log recovery should handle the corrupted log records, it has historical
 # problems dealing with the situation where the corrupted log records may have
 # overwritten the tail of the previous good record in the log. If this occurs,
 # log recovery may fail.
 #
 # This can be reproduced more reliably under non-default conditions such as with
 # the smallest supported FSB sizes and/or largest supported log buffer sizes and
 # counts (logbufs and logbsize mount options).
 #
 # Note that this test requires a DEBUG mode kernel.
 #
 #-----------------------------------------------------------------------
 # Copyright (c) 2017 Red Hat, Inc. All Rights Reserved.
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License as
 # published by the Free Software Foundation.
 #
 # This program is distributed in the hope that it would be useful,
 # but WITHOUT ANY WARRANTY; without even the implied warranty of
 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 # GNU General Public License for more details.
 #
 # You should have received a copy of the GNU General Public License
 # along with this program; if not, write the Free Software Foundation,
 # Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 #-----------------------------------------------------------------------
 #

 # Name this test after the script file; $seqres is the path prefix for its
 # result files (e.g. $seqres.full).
 seq=$(basename $0)
 seqres=${RESULT_DIR}/${seq}
 echo "QA output created by $seq"

 # Remember the starting directory and choose a per-process temp file prefix.
 here=$(pwd)
 tmp=/tmp/$$
 # Assume failure until the end of the script explicitly sets status=0.
 status=1
 # Run _cleanup and exit with $status on shell exit or on HUP/INT/QUIT/TERM.
 # The \$ defers reading $status until the trap actually fires.
 trap "_cleanup; exit \$status" EXIT HUP INT QUIT TERM

 # Trap handler body: undo whatever the test may have left behind.
 _cleanup()
 {
 	# step out to / and drop this test's temp files
 	cd /
 	rm -f $tmp.*

 	# make sure no fsstress processes are left running
 	$KILLALL_PROG -9 fsstress > /dev/null 2>&1

 	# Clear the log_item_pin error tag if its sysfs knob exists --
 	# presumably so a still-blocked workload can finish before the wait.
 	if [ -e /sys/fs/xfs/$sdev/errortag/log_item_pin ]; then
 		echo 0 > /sys/fs/xfs/$sdev/errortag/log_item_pin
 	fi

 	# reap any remaining background children
 	wait > /dev/null 2>&1
 }

 # Remove any stale $seqres.full from an earlier run; output is appended to
 # it later in this test.
 rm -f $seqres.full

 # get standard environment, filters and checks
 . ./common/rc
 # NOTE(review): the error injection helpers used below are presumably
 # defined in common/inject -- confirm.
 . ./common/inject

 # real QA test starts here

 # Prerequisites: XFS on Linux, the two XFS error injection tags this test
 # sets (log_item_pin, log_bad_crc), a scratch device, and the killall
 # program that _cleanup invokes.
 _supported_fs xfs
 _supported_os Linux
 _require_xfs_io_error_injection log_item_pin
 _require_xfs_io_error_injection log_bad_crc
 _require_scratch
 _require_command "$KILLALL_PROG" killall

 # fixed line of expected test output
 echo "Silence is golden."

 # Short name of the scratch device; it is the directory component used
 # under /sys/fs/xfs/ for the errortag and log attributes.
 sdev=$(_short_dev $SCRATCH_DEV)

 # Use a small log fs: make a 500MB scratch filesystem, sending mkfs output
 # to the .full log, and abort the test if mkfs fails.
 if ! _scratch_mkfs_sized $((500 * 1024 * 1024)) >> $seqres.full 2>&1; then
 	_fail "mkfs failed"
 fi
 _scratch_mount

 # Populate the fs with some data, then cycle the mount to reset the log
 # head/tail before the real workload starts.
 $FSSTRESS_PROG -d $SCRATCH_MNT -z -fcreat=1 -p 4 -n 100000 >/dev/null 2>&1
 if ! _scratch_cycle_mount; then
 	_fail "cycle mount failed"
 fi

 # Pin the tail and start a file removal workload. File removal tends to
 # reproduce the corruption more reliably.
 _scratch_inject_error log_item_pin 1

 # Run the removal in the background. ${SCRATCH_MNT:?} makes the expansion
 # fail if the variable is unset or empty, so the glob can never become "/*".
 rm -rf "${SCRATCH_MNT:?}"/* > /dev/null 2>&1 &
 workpid=$!

 # Wait for the head to stop pushing forward: sample log_head_lsn every five
 # seconds until two consecutive samples are identical.
 prevhead=-1
 head=$(cat /sys/fs/xfs/$sdev/log/log_head_lsn)
 while [ "$head" != "$prevhead" ]; do
 	sleep 5
 	prevhead=$head
 	head=$(cat /sys/fs/xfs/$sdev/log/log_head_lsn)
 done

 # Once the head is pinned behind the tail, enable log record corruption and
 # unpin the tail. All subsequent log buffer writes end up corrupted on-disk and
 # result in log I/O errors.
 _scratch_inject_error log_bad_crc 1
 _scratch_inject_error log_item_pin 0

 # wait for fs shutdown to kill the workload
 wait "$workpid"

 # Cycle the mount to test log recovery. This mount is the operation under
 # test, so fail explicitly instead of falling through to status=0.
 _scratch_cycle_mount || _fail "cycle mount after log corruption failed"

 # success, all done
 status=0
 exit
	#! /bin/bash
	# FS QA Test No. 057
	#
	# Attempt to reproduce log recovery failure by writing corrupt log records over
	# the last good tail in the log. The tail is force pinned while a workload runs
	# the head as close as possible behind the tail. Once the head is pinned,
	# corrupted log records are written to the log and the filesystem shuts down.
	#
	# While log recovery should handle the corrupted log records, it has historical
	# problems dealing with the situation where the corrupted log records may have
	# overwritten the tail of the previous good record in the log. If this occurs,
	# log recovery may fail.
	#
	# This can be reproduced more reliably under non-default conditions such as with
	# the smallest supported FSB sizes and/or largest supported log buffer sizes and
	# counts (logbufs and logbsize mount options).
	#
	# Note that this test requires a DEBUG mode kernel.
	#
	#-----------------------------------------------------------------------
	# Copyright (c) 2017 Red Hat, Inc. All Rights Reserved.
	#
	# This program is free software; you can redistribute it and/or
	# modify it under the terms of the GNU General Public License as
	# published by the Free Software Foundation.
	#
	# This program is distributed in the hope that it would be useful,
	# but WITHOUT ANY WARRANTY; without even the implied warranty of
	# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	# GNU General Public License for more details.
	#
	# You should have received a copy of the GNU General Public License
	# along with this program; if not, write the Free Software Foundation,
	# Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
	#-----------------------------------------------------------------------
	#

	# The test is named after this script; $seqres prefixes its result files.
	seq=$(basename $0)
	seqres=${RESULT_DIR}/${seq}
	echo "QA output created by $seq"

	# starting directory and per-process temp file prefix
	here=$(pwd)
	tmp=/tmp/$$
	# failure is the default until the script sets status=0 at the end
	status=1
	# On shell exit or HUP/INT/QUIT/TERM, run _cleanup and exit with $status
	# (the \$ makes $status be read when the trap fires).
	trap "_cleanup; exit \$status" EXIT HUP INT QUIT TERM

	# Cleanup routine invoked from the exit/signal trap.
	_cleanup()
	{
		# move to / and remove this test's temp files
		cd /
		rm -f $tmp.*

		# kill any fsstress processes that are still around
		$KILLALL_PROG -9 fsstress > /dev/null 2>&1

		# reset the log_item_pin error tag when its sysfs file is present
		if [ -e /sys/fs/xfs/$sdev/errortag/log_item_pin ]; then
			echo 0 > /sys/fs/xfs/$sdev/errortag/log_item_pin
		fi

		# collect background children before returning
		wait > /dev/null 2>&1
	}

	# Remove any stale $seqres.full from an earlier run; output is appended to
	# it later in this test.
	rm -f $seqres.full

	# get standard environment, filters and checks
	. ./common/rc
	# NOTE(review): the error injection helpers used below are presumably
	# defined in common/inject -- confirm.
	. ./common/inject

	# real QA test starts here

	# Prerequisites: XFS on Linux, the two XFS error injection tags this test
	# sets (log_item_pin, log_bad_crc), a scratch device, and the killall
	# program that _cleanup invokes.
	_supported_fs xfs
	_supported_os Linux
	_require_xfs_io_error_injection log_item_pin
	_require_xfs_io_error_injection log_bad_crc
	_require_scratch
	_require_command "$KILLALL_PROG" killall

	# fixed line of expected test output
	echo "Silence is golden."

	# Short name of the scratch device; used as the directory name under
	# /sys/fs/xfs/ for the errortag and log attributes.
	sdev=$(_short_dev $SCRATCH_DEV)

	# use a small log fs; abort the test only if mkfs actually fails
	_scratch_mkfs_sized $((1024 * 1024 * 500)) >> $seqres.full 2>&1 ||
		_fail "mkfs failed"
	_scratch_mount

	# populate the fs with some data and cycle the mount to reset the log head/tail
	$FSSTRESS_PROG -d $SCRATCH_MNT -z -fcreat=1 -p 4 -n 100000 > /dev/null 2>&1
	_scratch_cycle_mount || _fail "cycle mount failed"

	# Pin the tail and start a file removal workload. File removal tends to
	# reproduce the corruption more reliably.
	_scratch_inject_error log_item_pin 1

	# Background removal. ${SCRATCH_MNT:?} makes the expansion fail when the
	# variable is unset or empty, so the glob can never turn into "/*".
	rm -rf "${SCRATCH_MNT:?}"/* > /dev/null 2>&1 &
	workpid=$!

	# Wait for the head to stop pushing forward: re-read log_head_lsn every
	# five seconds until two consecutive reads match.
	prevhead=-1
	head=$(cat /sys/fs/xfs/$sdev/log/log_head_lsn)
	while [ "$head" != "$prevhead" ]; do
		sleep 5
		prevhead=$head
		head=$(cat /sys/fs/xfs/$sdev/log/log_head_lsn)
	done

	# Once the head is pinned behind the tail, enable log record corruption and
	# unpin the tail. All subsequent log buffer writes end up corrupted on-disk and
	# result in log I/O errors.
	_scratch_inject_error log_bad_crc 1
	_scratch_inject_error log_item_pin 0

	# wait for fs shutdown to kill the workload
	wait "$workpid"

	# Cycle the mount to test log recovery. This mount is the operation under
	# test, so fail explicitly instead of falling through to status=0.
	_scratch_cycle_mount || _fail "cycle mount after log corruption failed"

	# success, all done
	status=0
	exit