blob: 715de458268ebc4f13875ffcd50f5f03ae7867c1 [file] [log] [blame]
#! /bin/bash
# SPDX-License-Identifier: GPL-2.0
# Copyright (c) 2025 IBM Corporation. All Rights Reserved.
#
# FS QA Test No. 778
#
# Test multi block atomic writes with sudden FS shutdowns to ensure
# the FS is not tearing the write operation
# Pull in the shared fstests preamble and the atomic write helper library.
. ./common/preamble
. ./common/atomicwrites
_begin_fstest auto atomicwrites
# Prerequisites. NOTE(review): by fstests convention each _require_* helper
# is expected to skip the test when its requirement is not met; the helpers
# are defined outside this file, so confirm the exact checks there.
_require_scratch_write_atomic_multi_fsblock
_require_atomic_write_test_commands
_require_scratch_shutdown
_require_xfs_io_command "truncate"
# Make and mount the scratch filesystem; tool output is appended to
# $seqres.full.
_scratch_mkfs >> $seqres.full 2>&1
_scratch_mount >> $seqres.full
# The single file that every atomic write in this test targets.
testfile=$SCRATCH_MNT/testfile
touch $testfile
# Sentinel files shared by atomic_write_loop() and kill_awloop():
# the run file exists while the loop is active, the kill file asks it to stop.
awloop_runfile=$tmp.awloop_running
awloop_killfile=$tmp.awloop_kill
# awu_max is used below as the size of every atomic write and as the
# granularity of the torn-write verification; blksz is the block size
# reported for the scratch mount.
awu_max=$(_get_atomic_write_unit_max $testfile)
blksz=$(_get_block_size $SCRATCH_MNT)
echo "Awu max: $awu_max" >> $seqres.full
# Number of blocks covered by one atomic write. Not referenced anywhere else
# in the visible part of this file.
num_blocks=$((awu_max / blksz))
# Keep the initial value high (10 GiB) for the dry run so the write loop
# cannot finish before the shutdown. dry_run() replaces it with a value
# derived from the measured device write speed.
filesize=$(( 10 * 1024 * 1024 * 1024 ))
# Test-specific cleanup hook: stop the background atomic write loop and then
# remove this test's temporary files.
#
# NOTE(review): defining _cleanup here replaces whatever default the fstests
# preamble provides. That default is understood to do "cd /; rm -r -f $tmp.*",
# so the same steps are repeated explicitly - confirm against common/preamble.
_cleanup() {
	# Stop the writer first: kill_awloop communicates through sentinel
	# files under $tmp, which are deleted below.
	kill_awloop
	cd /
	# Never let the glob degrade to ".*" if $tmp is somehow empty.
	if [ -n "$tmp" ]; then
		rm -r -f "$tmp".*
	fi
}
# Writer body, meant to be run in the background.
#
# Issues sequential atomic writes of $awu_max bytes (filled with 0x61) to
# $testfile, starting at offset 0, until $filesize bytes have been covered,
# the file stops being writable, or the kill sentinel appears. After every
# write that is followed by a successful check, the end offset reached so far
# is appended to $tmp.aw as "Written to offset: <bytes>".
#
# $awloop_runfile exists for as long as the loop is active.
atomic_write_loop() {
	local off=0
	local size=$awu_max

	rm -f $awloop_killfile
	touch $awloop_runfile

	i=0
	while (( i < filesize / size )); do
		# A sudden shutdown makes xfs_io report errors; those are
		# expected, so they are only kept in seqres.full.
		$XFS_IO_PROG -c "open -fsd $testfile" \
			-c "pwrite -S 0x61 -DA -V1 -b $size $off $size" \
			>> /dev/null 2>>$seqres.full

		# Stop without recording progress once the file is no longer
		# writable or a stop has been requested.
		if [[ ! -w $testfile || -e $awloop_killfile ]]; then
			break
		fi

		off=$((off + size))
		echo "Written to offset: $off" >> $tmp.aw
		i=$((i + 1))
	done

	rm -f $awloop_runfile
}
# Use sentinel files to control the loop execution because we don't know the
# pid of the xfs_io process and so we can't wait for it directly. A bare
# wait command won't wait for a D-state xfs_io process so we can't do that
# either. We can't use killall because check-parallel, and we can't pkill
# because the pid namespacing code was removed without fixing check-parallel.
kill_awloop() {
	# Ask a running atomic_write_loop to stop and wait for it to exit.
	#
	# Returns immediately when the run sentinel does not exist. Otherwise
	# creates the kill sentinel and polls every 0.1s, at most 300 times
	# (about 30 seconds), until the loop removes its run sentinel.
	#
	# The counter is local so that callers which use their own "i" are
	# not affected through bash's dynamic scoping.
	local tries

	# Quoted on purpose: an unquoted empty path would turn this into
	# "test -e", which is true, and the loop below would spin until the
	# full timeout expires.
	test -e "$awloop_runfile" || return

	touch "$awloop_killfile"
	for ((tries = 0; tries < 300; tries++)); do
		test -e "$awloop_runfile" || break
		sleep 0.1
	done
}
# Start atomic_write_loop in the background, wait until it has recorded at
# least one completed write in $tmp.aw, then shut the scratch filesystem down
# underneath it and stop the loop.
#
# Calls _notrun if no progress record shows up within the polling budget
# (101 polls of 0.2s each).
start_atomic_write_and_shutdown() {
	local max_loops=100
	local i=0

	atomic_write_loop &

	# Wait for at least the first write to be recorded, or give up once
	# too much time has passed.
	while [[ ! -f $tmp.aw ]] && (( i <= max_loops )); do
		i=$((i + 1))
		sleep 0.2
	done

	# Decide on the file itself rather than on the counter: a record that
	# shows up during the very last poll still counts, and the progress
	# file is never read when it does not exist.
	if [[ ! -f $tmp.aw ]]; then
		_notrun "atomic write process took too long to start"
	fi
	cat $tmp.aw >> $seqres.full

	echo >> $seqres.full
	echo "# Shutting down filesystem while write is running" >> $seqres.full
	_scratch_shutdown
	kill_awloop
}
# This test has the following flow:
# 1. Start doing sequential atomic writes in background, up to $filesize
# 2. Sleep for 0.2s and shutdown the FS
# 3. kill the atomic write process
# 4. verify the writes were not torn
#
# We ideally want the shutdown to happen while an atomic write is ongoing
# but this gets tricky since faster devices can actually finish the whole
# atomic write loop before sleep 0.2s completes, resulting in the shutdown
# happening after the write loop which is not what we want. A simple solution
# to this is to increase $filesize so step 1 takes long enough but a big
# $filesize leads to create_mixed_mappings() taking very long, which is not
# ideal.
#
# Hence, use the dry_run function to figure out the rough device speed and set
# $filesize accordingly.
dry_run() {
	# Calibration pass: run one write-and-shutdown cycle, read how many
	# bytes the writer managed to record, and set the global $filesize to
	# three times that amount. Also sets the global $bytes_written.
	local last_record

	{
		echo
		echo "# Estimating ideal filesize..."
	} >> $seqres.full

	start_atomic_write_and_shutdown

	# Progress records look like "Written to offset: <bytes>"; the final
	# field of the newest record is how far the writer got.
	last_record=$(tail -n 1 $tmp.aw)
	bytes_written=${last_record##* }
	echo "# Bytes written in 0.2s: $bytes_written" >> $seqres.full

	filesize=$((bytes_written * 3))
	echo "# Setting \$filesize=$filesize" >> $seqres.full

	# Drop the progress log and remount so the next phase starts clean.
	rm $tmp.aw
	sleep 0.5
	_scratch_cycle_mount
}
# Fill a file so that its blocks alternate between written and unwritten.
#
# Arguments: $1 - file to create/fill
#            $2 - size in bytes (0 means: do nothing beyond logging)
# Globals:   blksz (read), XFS_IO_PROG (read), seqres (read)
#
# The whole range is preallocated once, then every even-numbered block is
# overwritten; odd-numbered blocks are left as preallocated.
create_mixed_mappings() {
	local file=$1
	local size_bytes=$2
	local nr_blocks blk
	local cmds=()

	echo "# Filling file $file with alternate mappings till size $size_bytes" >> $seqres.full

	test $size_bytes -eq 0 && return

	# fallocate the whole file once because preallocating single blocks
	# with individual xfs_io invocations is really slow and the allocator
	# usually gives out consecutive blocks anyway
	$XFS_IO_PROG -f -c "falloc 0 $size_bytes" "$file"

	# Only even-numbered blocks get written, so step over the odd ones
	# instead of visiting them.
	nr_blocks=$((size_bytes / blksz))
	for ((blk = 0; blk < nr_blocks; blk += 2)); do
		cmds+=(-c "pwrite -b $blksz $((blk * blksz)) $blksz")

		# batch the write commands into larger xfs_io invocations to
		# amortize the fork overhead (128 words = 64 pwrite commands)
		if [ "${#cmds[@]}" -ge 128 ]; then
			$XFS_IO_PROG "${cmds[@]}" "$file" >> /dev/null
			cmds=()
		fi
	done

	# Flush whatever is left over from the last partial batch.
	if [ "${#cmds[@]}" -gt 0 ]; then
		$XFS_IO_PROG "${cmds[@]}" "$file" >> /dev/null
	fi

	sync "$file"
}
# Build reference files of $awu_max bytes next to $testfile and capture their
# hex dumps in globals, for later comparison by verify_data_blocks:
#   expected_data_old_mixed  - alternating written/unwritten blocks
#   expected_data_old_zeroes - preallocated, never written
#   expected_data_old_mapped - written with xfs_io's default pwrite pattern
#   expected_data_new        - written with 0x61, as the atomic writes do
populate_expected_data() {
	local hexdump=(od -An -t x1 -j 0 -N $awu_max)
	local ref=$testfile.exp

	# reference copies of the possible "old" contents
	create_mixed_mappings ${ref}_old_mixed $awu_max
	expected_data_old_mixed=$("${hexdump[@]}" ${ref}_old_mixed)

	$XFS_IO_PROG -fc "falloc 0 $awu_max" ${ref}_old_zeroes >> $seqres.full
	expected_data_old_zeroes=$("${hexdump[@]}" ${ref}_old_zeroes)

	$XFS_IO_PROG -fc "pwrite -b $awu_max 0 $awu_max" ${ref}_old_mapped >> $seqres.full
	expected_data_old_mapped=$("${hexdump[@]}" ${ref}_old_mapped)

	# reference copy of the "new" contents
	$XFS_IO_PROG -fc "pwrite -S 0x61 -b $awu_max 0 $awu_max" ${ref}_new >> $seqres.full
	expected_data_new=$("${hexdump[@]}" ${ref}_new)
}
# Check $testfile for torn writes in the byte range [$1, $2).
#
# Arguments: $1 - first offset to check
#            $2 - offset at which checking stops (exclusive)
#            $3 - hex dump of one $awu_max sized chunk of old data
#            $4 - hex dump of one $awu_max sized chunk of new data
#
# The range is walked in $awu_max sized chunks. Each chunk must be entirely
# old or entirely new; anything else is dumped to stdout and reported through
# _fail. Matches are logged to seqres.full. The global $actual_data holds the
# hex dump of the chunk checked last.
verify_data_blocks() {
	local verify_start=$1
	local verify_end=$2
	local expected_data_old="$3"
	local expected_data_new="$4"
	local off verdict

	{
		echo
		echo "# Checking for torn write from $verify_start to $verify_end"
	} >> $seqres.full

	for ((off = verify_start; off < verify_end; off += awu_max)); do
		actual_data=$(od -An -t x1 -j $off -N $awu_max $testfile)

		# New data is tested first, so a chunk for which old and new
		# are identical is reported as "matched new".
		case "$actual_data" in
		"$expected_data_new")
			verdict="matched new"
			;;
		"$expected_data_old")
			verdict="matched old"
			;;
		*)
			verdict=""
			printf '%s\n' \
				"Checksum match failed at off: $off size: $awu_max" \
				"Expected contents: (Either of the 2 below):" \
				"" \
				"Old: " \
				"$expected_data_old" \
				"" \
				"New: " \
				"$expected_data_new" \
				"" \
				"Actual contents: " \
				"$actual_data"
			_fail
			;;
		esac

		echo -n "Check at offset $off succeeded! " >> $seqres.full
		if [[ -n $verdict ]]; then
			echo "$verdict" >> $seqres.full
		fi
	done
}
# Test torn writes on the file by shutting down in between atomic writes.
#
# Runs one write-and-shutdown cycle, remounts, and works out which byte range
# of $testfile needs checking. Results are left in globals for the caller:
#   last_offset  - last offset the writer recorded (0 if none)
#   verify_start - last_offset minus 5 atomic write units, clamped to 0
#   verify_end   - last_offset plus 5 atomic write units, clamped to $filesize
test_torn_write() {
	echo >> $seqres.full
	echo "# Writing atomically to file in background" >> $seqres.full
	start_atomic_write_and_shutdown

	last_offset=$(tail -n 1 $tmp.aw | cut -d" " -f4)
	if [[ -z $last_offset ]]; then
		last_offset=0
	fi
	echo >> $seqres.full
	echo "# Last offset of atomic write: $last_offset" >> $seqres.full

	rm $tmp.aw
	sleep 0.5
	_scratch_cycle_mount

	# we want to verify all blocks around which the shutdown happened
	verify_start=$(( last_offset - (awu_max * 5) ))
	# Compare numerically: inside [[ ]] the "<" operator is a string
	# comparison that depends on the current locale's collation order.
	if (( verify_start < 0 )); then
		verify_start=0
	fi

	verify_end=$(( last_offset + (awu_max * 5) ))
	if (( verify_end > filesize )); then
		verify_end=$filesize
	fi
}
# Torn-write check over a file whose blocks alternate between written and
# unwritten: the old contents must match $expected_data_old_mixed.
test_torn_write_mixed() {
	# start from an empty file
	$XFS_IO_PROG -fc "truncate 0" $testfile >> $seqres.full

	printf '\n%s\n' "# Creating testfile with mixed mappings" >> $seqres.full
	create_mixed_mappings $testfile $filesize

	# test_torn_write leaves the range to check in verify_start/verify_end
	test_torn_write
	verify_data_blocks $verify_start $verify_end \
		"$expected_data_old_mixed" "$expected_data_new"
}
# Torn-write check over a file that is completely written before the atomic
# writes start: the old contents must match $expected_data_old_mapped.
test_torn_write_written() {
	# start from an empty file
	$XFS_IO_PROG -fc "truncate 0" $testfile >> $seqres.full

	printf '\n%s\n' "# Creating testfile with fully written mapping" >> $seqres.full
	$XFS_IO_PROG -c "pwrite -b $filesize 0 $filesize" $testfile >> $seqres.full
	sync $testfile

	# test_torn_write leaves the range to check in verify_start/verify_end
	test_torn_write
	verify_data_blocks $verify_start $verify_end \
		"$expected_data_old_mapped" "$expected_data_new"
}
# Torn-write check over a file that is preallocated but never written: the
# old contents must match $expected_data_old_zeroes.
test_torn_write_unwritten() {
	# start from an empty file
	$XFS_IO_PROG -fc "truncate 0" $testfile >> $seqres.full

	printf '\n%s\n' "# Creating testfile with fully unwritten mappings" >> $seqres.full
	$XFS_IO_PROG -c "falloc 0 $filesize" $testfile >> $seqres.full
	sync $testfile

	# test_torn_write leaves the range to check in verify_start/verify_end
	test_torn_write
	verify_data_blocks $verify_start $verify_end \
		"$expected_data_old_zeroes" "$expected_data_new"
}
# Torn-write check over a file that is extended to $filesize by truncate only,
# so it has no mappings: the old contents must match $expected_data_old_zeroes.
test_torn_write_hole() {
	# start from an empty file
	$XFS_IO_PROG -fc "truncate 0" $testfile >> $seqres.full

	printf '\n%s\n' "# Creating testfile with no mappings" >> $seqres.full
	$XFS_IO_PROG -c "truncate $filesize" $testfile >> $seqres.full
	sync $testfile

	# test_torn_write leaves the range to check in verify_start/verify_end
	test_torn_write
	verify_data_blocks $verify_start $verify_end \
		"$expected_data_old_zeroes" "$expected_data_new"
}
# Torn-write check for appending atomic writes.
#
# Empties $testfile, lets the background writer extend it with atomic writes,
# shuts the filesystem down mid-run and remounts. Afterwards the file size
# must be a multiple of $awu_max and the last (up to) 5 atomic write units
# must contain only new data.
#
# Sets the global verify_start; everything else is kept local.
test_append_torn_write() {
	local last_offset
	local verify_end
	# Here the blocks should always match new data hence, for simplicity
	# of code, just poison the old-data buffer so it never matches
	local expected_data_old="POISON"

	$XFS_IO_PROG -c "truncate 0" $testfile >> $seqres.full
	echo >> $seqres.full
	echo "# Performing append atomic writes over file in background" >> $seqres.full
	start_atomic_write_and_shutdown

	last_offset=$(tail -n 1 $tmp.aw | cut -d" " -f4)
	if [[ -z $last_offset ]]; then
		last_offset=0
	fi
	echo >> $seqres.full
	echo "# Last offset of atomic write: $last_offset" >> $seqres.full

	rm $tmp.aw
	sleep 0.5
	_scratch_cycle_mount

	# Deliberately declared only now: the background writer started above
	# reads the global $filesize, and an earlier "local filesize" would
	# hide it from the writer through dynamic scoping. Declaration and
	# assignment are split so "local" does not mask the helper's status.
	local filesize
	filesize=$(_get_filesize $testfile)
	echo >> $seqres.full
	echo "# Filesize after shutdown: $filesize" >> $seqres.full

	# To confirm that the write went atomically, we check:
	# 1. The file size should be a multiple of awu_max
	# 2. The tail of the file should be completely new data
	if (( filesize % awu_max )); then
		echo "Filesize after shutdown ($filesize) not a multiple of atomic write unit ($awu_max)"
	fi

	verify_start=$(( filesize - (awu_max * 5) ))
	# Compare numerically: inside [[ ]] the "<" operator is a string
	# comparison that depends on the current locale's collation order.
	if (( verify_start < 0 )); then
		verify_start=0
	fi
	verify_end=$filesize

	verify_data_blocks $verify_start $verify_end "$expected_data_old" "$expected_data_new"
}
# Start from an empty test file and let dry_run() size $filesize for this
# device before the reference buffers are built.
$XFS_IO_PROG -fc "truncate 0" $testfile >> $seqres.full
dry_run
{
	echo
	echo "# Populating expected data buffers"
} >> $seqres.full
populate_expected_data

# Sub-tests run in every iteration, in this order.
# Each entry is "<function>|<banner logged before the function runs>".
torn_write_cases=(
	"test_torn_write_mixed|# Starting torn write test for atomic writes over mixed mapping"
	"test_torn_write_written|# Starting torn write test for atomic writes over fully written mapping"
	"test_torn_write_unwritten|# Starting torn write test for atomic writes over fully unwritten mapping"
	"test_torn_write_hole|# Starting torn write test for atomic writes over holes"
	"test_append_torn_write|# Starting shutdown torn write test for append atomic writes"
)

# Loop to shake out any races due to shutdown
iter=0
while _soak_loop_running $TIME_FACTOR; do
	printf '\n%s\n' "------ Iteration $iter ------" >> $seqres.full
	for torn_write_case in "${torn_write_cases[@]}"; do
		printf '\n%s\n' "${torn_write_case#*|}" >> $seqres.full
		"${torn_write_case%%|*}"
	done
	iter=$((iter + 1))
done

echo "Silence is golden"
status=0
exit