4 # Run fsstress and fio(dio/aio and mmap) and simulate disk failure
5 # check filesystem consistency at the end.
7 #-----------------------------------------------------------------------
8 # (c) 2013 Dmitry Monakhov
10 # This program is free software; you can redistribute it and/or
11 # modify it under the terms of the GNU General Public License as
12 # published by the Free Software Foundation.
14 # This program is distributed in the hope that it would be useful,
15 # but WITHOUT ANY WARRANTY; without even the implied warranty of
16 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 # GNU General Public License for more details.
19 # You should have received a copy of the GNU General Public License
20 # along with this program; if not, write the Free Software Foundation,
21 # Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
23 #-----------------------------------------------------------------------
26 owner=dmonakhov@openvz.org
29 echo "QA output created by $seq"
33 status=1 # failure is the default!
35 # get standard environment, filters and checks
38 _supported_fs ext3 ext4 xfs btrfs reiserfs
42 _require_fail_make_request
44 # TODO: Function are common enough to be moved to common.blkdev
45 SCRATCH_REAL_DEV=`readlink -f $SCRATCH_DEV`
46 SCRATCH_BDEV=`basename $SCRATCH_REAL_DEV`
48 allow_fail_make_request()
50 echo "Allow global fail_make_request feature"
51 echo 100 > $DEBUGFS_MNT/fail_make_request/probability
52 echo 9999999 > $DEBUGFS_MNT/fail_make_request/times
53 echo 0 > /sys/kernel/debug/fail_make_request/verbose
56 disallow_fail_make_request()
58 echo "Disallow global fail_make_request feature"
59 echo 0 > $DEBUGFS_MNT/fail_make_request/probability
60 echo 0 > $DEBUGFS_MNT/fail_make_request/times
63 start_fail_scratch_dev()
65 echo "Force SCRATCH_DEV device failure"
66 echo " echo 1 > /sys/block/$SCRATCH_BDEV/make-it-fail" >> $here/$seq.full
67 echo 1 > /sys/block/$SCRATCH_BDEV/make-it-fail
71 stop_fail_scratch_dev()
73 echo "Make SCRATCH_DEV device operable again"
74 echo " echo 0 > /sys/block/$SCRATCH_BDEV/make-it-fail" >> $here/$seq.full
75 echo 0 > /sys/block/$SCRATCH_BDEV/make-it-fail
82 disallow_fail_make_request
84 trap "_cleanup; exit \$status" 1 2 3 15
86 RUN_TIME=$((20+10*$TIME_FACTOR))
87 NUM_JOBS=$((4*LOAD_FACTOR))
88 BLK_DEV_SIZE=`blockdev --getsz $SCRATCH_DEV`
89 FILE_SIZE=$((BLK_DEV_SIZE * 512))
91 cat >$tmp-$seq.fio <<EOF
93 # $seq test's fio activity
94 # Filenames derived from jobsname and jobid like follows:
95 # ${JOB_NAME}.${JOB_ID}.${ITERATION_ID}
99 directory=${SCRATCH_MNT}
100 filesize=${FILE_SIZE}
102 continue_on_error=write
103 ignore_error=EIO,ENOSPC:EIO
106 [stress_dio_aio_activity]
109 iodepth=128*${LOAD_FACTOR}
114 runtime=40+${RUN_TIME}
117 [stress_mmap_activity]
126 runtime=40+${RUN_TIME}
131 _require_fio $tmp-$seq.fio
133 # Disable all sync operations to get higher load
134 FSSTRESS_AVOID="$FSSTRESS_AVOID -ffsync=0 -fsync=0 -ffdatasync=0 -f setattr=1"
138 out=$SCRATCH_MNT/fsstress.$$
139 args=`_scale_fsstress_args -p 1 -n999999999 -f setattr=0 $FSSTRESS_AVOID -d $out`
141 echo "Start fsstress.."
143 echo "fsstress $args" >> $here/$seq.full
144 $FSSTRESS_PROG $args > /dev/null 2>&1 &
147 cat $tmp-$seq.fio >> $seq.full
148 $FIO_PROG $tmp-$seq.fio >> $here/$seq.full 2>&1 &
151 # Let's it work for awhile, and force device failure
153 start_fail_scratch_dev
154 # After device turns in to failed state filesystem may yet not know about
155 # that so buffered write(2) may succeed, but any integrity operations
156 # such as (sync, fsync, fdatasync, direct-io) should fail.
157 dd if=/dev/zero of=$SCRATCH_MNT/touch_failed_filesystem count=1 bs=4k conv=fsync \
158 >> $here/$seq.full 2>&1 && \
159 _fail "failed: still able to perform integrity fsync on $SCRATCH_MNT"
165 # We expect that broken FS still can be umounted
166 run_check umount $SCRATCH_DEV
167 # Once filesystem was umounted no one is able to write to block device
168 # It is now safe to bring device back to normal state
169 stop_fail_scratch_dev
171 # In order to check that filesystem is able to recover journal on mount(2)
172 # perform mount/umount, after that all errors should be fixed
173 run_check _scratch_mount
174 run_check _scratch_unmount
178 # real QA test starts here
180 _scratch_mkfs >> $here/$seq.full 2>&1 || _fail "mkfs failed"
181 _scratch_mount || _fail "mount failed"
182 allow_fail_make_request
185 disallow_fail_make_request