--- /dev/null
+#!/bin/bash
+# vim:expandtab:shiftwidth=4:softtabstop=4:tabstop=4:
+#
+# Tests for multiple mount protection (MMP) feature.
+#
+# Run select tests by setting ONLY, or as arguments to the script.
+# Skip specific tests by setting EXCEPT.
+#
+# e.g. ONLY="5 6" or ONLY="`seq 8 11`" or EXCEPT="7"
+set -e
+
+ONLY=${ONLY:-"$*"}
+
+# bug number for skipped test:
+ALWAYS_EXCEPT=${ALWAYS_EXCEPT:-"$MMP_EXCEPT"}
+# UPDATE THE COMMENT ABOVE WITH BUG NUMBERS WHEN CHANGING ALWAYS_EXCEPT!
+
+SRCDIR=$(cd $(dirname $0); echo $PWD)
+export PATH=$PWD/$SRCDIR:$SRCDIR:$SRCDIR/../utils:$PATH:/sbin
+
+LUSTRE=${LUSTRE:-$(cd $(dirname $0)/..; echo $PWD)}
+. $LUSTRE/tests/test-framework.sh
+init_test_env $@
+. ${CONFIG:=$LUSTRE/tests/cfg/$NAME.sh}
+init_logging
+
+remote_mds_nodsh && skip "remote MDS with nodsh" && exit 0
+remote_ost_nodsh && skip "remote OST with nodsh" && exit 0
+
+# unmount and cleanup the Lustre filesystem
+MMP_RESTORE_MOUNT=false
+if is_mounted $MOUNT || is_mounted $MOUNT2; then
+ cleanupall
+ MMP_RESTORE_MOUNT=true
+fi
+
+SAVED_FAIL_ON_ERROR=$FAIL_ON_ERROR
+FAIL_ON_ERROR=false
+
+build_test_filter
+
+# Get the failover facet.
+get_failover_facet() {
+ local facet=$1
+ local failover_facet=${facet}failover
+
+ local host=$(facet_host $facet)
+ local failover_host=$(facet_host $failover_facet)
+
+ [ -z "$failover_host" -o "$host" = "$failover_host" ] && \
+ failover_facet=$facet
+
+ echo $failover_facet
+}
+
+# Initiate the variables for Lustre servers and targets.
+init_vars() {
+ MMP_MDS=${MMP_MDS:-$SINGLEMDS}
+ MMP_MDS_FAILOVER=$(get_failover_facet $MMP_MDS)
+
+ local mds_num=$(echo $MMP_MDS | tr -d "mds")
+ MMP_MDSDEV=$(mdsdevname $mds_num)
+
+ MMP_OSS=${MMP_OSS:-ost1}
+ MMP_OSS_FAILOVER=$(get_failover_facet $MMP_OSS)
+
+ local oss_num=$(echo $MMP_OSS | tr -d "ost")
+ MMP_OSTDEV=$(ostdevname $oss_num)
+}
+
+# Stop the MDS and OSS services on the primary or failover servers.
+stop_services() {
+ local flavor=$1
+ shift
+ local opts="$@"
+ local mds_facet
+ local oss_facet
+
+ if [ "$flavor" = "failover" ]; then
+ mds_facet=$MMP_MDS_FAILOVER
+ oss_facet=$MMP_OSS_FAILOVER
+ else
+ mds_facet=$MMP_MDS
+ oss_facet=$MMP_OSS
+ fi
+
+ stop $mds_facet $opts || return ${PIPESTATUS[0]}
+ stop $oss_facet $opts || return ${PIPESTATUS[0]}
+}
+
+# Enable the MMP feature.
+enable_mmp() {
+ local facet=$1
+ local device=$2
+
+ do_facet $facet "$TUNE2FS -O mmp $device"
+ return ${PIPESTATUS[0]}
+}
+
+# Disable the MMP feature.
+disable_mmp() {
+ local facet=$1
+ local device=$2
+
+ do_facet $facet "$TUNE2FS -O ^mmp $device"
+ return ${PIPESTATUS[0]}
+}
+
+# Reset the MMP block (if any) back to the clean state.
+reset_mmp_block() {
+ local facet=$1
+ local device=$2
+
+ do_facet $facet "$TUNE2FS -f -E clear-mmp $device"
+ return ${PIPESTATUS[0]}
+}
+
+# Check whether the MMP feature is enabled or not.
+mmp_is_enabled() {
+ local facet=$1
+ local device=$2
+
+ do_facet $facet "$DUMPE2FS -h $device | grep mmp"
+ return ${PIPESTATUS[0]}
+}
+
+# Get MMP update interval (in seconds) from the Lustre server target.
+get_mmp_update_interval() {
+ local facet=$1
+ local device=$2
+ local interval
+
+ interval=$(do_facet $facet "$DEBUGFS -c -R dump_mmp $device 2>/dev/null \
+ | grep 'MMP Update Interval' | cut -d' ' -f4")
+ [ -z "$interval" ] && interval=1
+
+ echo $interval
+}
+
+# Get MMP check interval (in seconds) from the Lustre server target.
+get_mmp_check_interval() {
+ local facet=$1
+ local device=$2
+ local interval
+
+ interval=$(do_facet $facet "$DEBUGFS -c -R dump_mmp $device 2>/dev/null \
+ | grep 'MMP Check Interval' | cut -d' ' -f4")
+ [ -z "$interval" ] && interval=5
+
+ echo $interval
+}
+
+# Enable the MMP feature on the Lustre server targets.
+mmp_init() {
+ init_vars
+
+ # The MMP feature is automatically enabled by mkfs.lustre for
+ # new file system at format time if failover is being used.
+ # Otherwise, the Lustre administrator has to manually enable
+ # this feature when the file system is unmounted.
+
+ if [ -z "$mdsfailover_HOST" ]; then
+ log "Failover is not used on MDS, enabling MMP manually..."
+ enable_mmp $MMP_MDS $MMP_MDSDEV || \
+ error "failed to enable MMP on $MMP_MDSDEV on $MMP_MDS"
+ fi
+
+ if [ -z "$ostfailover_HOST" ]; then
+ log "Failover is not used on OSS, enabling MMP manually..."
+ enable_mmp $MMP_OSS $MMP_OSTDEV || \
+ error "failed to enable MMP on $MMP_OSTDEV on $MMP_OSS"
+ fi
+
+ # check whether the MMP feature is enabled or not
+ mmp_is_enabled $MMP_MDS $MMP_MDSDEV || \
+ error "MMP was not enabled on $MMP_MDSDEV on $MMP_MDS"
+
+ mmp_is_enabled $MMP_OSS $MMP_OSTDEV || \
+ error "MMP was not enabled on $MMP_OSTDEV on $MMP_OSS"
+}
+
+# Disable the MMP feature on the Lustre server targets
+# which did not use failover.
+mmp_fini() {
+
+ if [ -z "$mdsfailover_HOST" ]; then
+ log "Failover is not used on MDS, disabling MMP manually..."
+ disable_mmp $MMP_MDS $MMP_MDSDEV || \
+ error "failed to disable MMP on $MMP_MDSDEV on $MMP_MDS"
+ mmp_is_enabled $MMP_MDS $MMP_MDSDEV && \
+ error "MMP was not disabled on $MMP_MDSDEV on $MMP_MDS"
+ fi
+
+ if [ -z "$ostfailover_HOST" ]; then
+ log "Failover is not used on OSS, disabling MMP manually..."
+ disable_mmp $MMP_OSS $MMP_OSTDEV || \
+ error "failed to disable MMP on $MMP_OSTDEV on $MMP_OSS"
+ mmp_is_enabled $MMP_OSS $MMP_OSTDEV && \
+ error "MMP was not disabled on $MMP_OSTDEV on $MMP_OSS"
+ fi
+
+ return 0
+}
+
+# Mount the shared target on the failover server after some interval it's
+# mounted on the primary server.
+mount_after_interval_sub() {
+ local interval=$1
+ shift
+ local device=$1
+ shift
+ local facet=$1
+ shift
+ local opts="$@"
+ local failover_facet=$(get_failover_facet $facet)
+
+ local mount_pid
+ local first_mount_rc=0
+ local second_mount_rc=0
+
+ log "Mounting $device on $facet..."
+ start $facet $device $opts &
+ mount_pid=$!
+
+ if [ $interval -ne 0 ]; then
+ log "sleep $interval..."
+ sleep $interval
+ fi
+
+ log "Mounting $device on $failover_facet..."
+ start $failover_facet $device $opts
+ second_mount_rc=${PIPESTATUS[0]}
+
+ wait $mount_pid
+ first_mount_rc=${PIPESTATUS[0]}
+
+ if [ $second_mount_rc -eq 0 -a $first_mount_rc -eq 0 ]; then
+ error_noexit "one mount delayed by mmp interval $interval should fail"
+ stop $facet || return ${PIPESTATUS[0]}
+ [ "$failover_facet" != "$facet" ] && stop $failover_facet || \
+ return ${PIPESTATUS[0]}
+ return 1
+ elif [ $second_mount_rc -ne 0 -a $first_mount_rc -ne 0 ]; then
+ error_noexit "failed to mount on the failover pair $facet,$failover_facet"
+ return $first_mount_rc
+ fi
+
+ return 0
+}
+
+mount_after_interval() {
+ local mdt_interval=$1
+ local ost_interval=$2
+ local rc=0
+
+ mount_after_interval_sub $mdt_interval $MMP_MDSDEV $MMP_MDS \
+ $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
+
+ echo
+ mount_after_interval_sub $ost_interval $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 0 ]; then
+ stop $MMP_MDS
+ return $rc
+ fi
+
+ return 0
+}
+
+# Mount the shared target on the failover server
+# during unmounting it on the primary server.
+mount_during_unmount() {
+ local device=$1
+ shift
+ local facet=$1
+ shift
+ local mnt_opts="$@"
+ local failover_facet=$(get_failover_facet $facet)
+
+ local unmount_pid
+ local unmount_rc=0
+ local mount_rc=0
+
+ log "Mounting $device on $facet..."
+ start $facet $device $mnt_opts || return ${PIPESTATUS[0]}
+
+ log "Unmounting $device on $facet..."
+ stop $facet &
+ unmount_pid=$!
+
+ log "Mounting $device on $failover_facet..."
+ start $failover_facet $device $mnt_opts
+ mount_rc=${PIPESTATUS[0]}
+
+ wait $unmount_pid
+ unmount_rc=${PIPESTATUS[0]}
+
+ if [ $mount_rc -eq 0 ]; then
+ error_noexit "mount during unmount of the first filesystem should fail"
+ stop $failover_facet || return ${PIPESTATUS[0]}
+ return 1
+ fi
+
+ if [ $unmount_rc -ne 0 ]; then
+ error_noexit "unmount the $device on $facet should succeed"
+ return $unmount_rc
+ fi
+
+ return 0
+}
+
+# Mount the shared target on the failover server
+# after clean unmounting it on the primary server.
+mount_after_unmount() {
+ local device=$1
+ shift
+ local facet=$1
+ shift
+ local mnt_opts="$@"
+ local failover_facet=$(get_failover_facet $facet)
+
+ log "Mounting $device on $facet..."
+ start $facet $device $mnt_opts || return ${PIPESTATUS[0]}
+
+ log "Unmounting $device on $facet..."
+ stop $facet || return ${PIPESTATUS[0]}
+
+ log "Mounting $device on $failover_facet..."
+ start $failover_facet $device $mnt_opts || return ${PIPESTATUS[0]}
+
+ return 0
+}
+
+# Mount the shared target on the failover server after rebooting
+# the primary server.
+mount_after_reboot() {
+ local device=$1
+ shift
+ local facet=$1
+ shift
+ local mnt_opts="$@"
+ local failover_facet=$(get_failover_facet $facet)
+ local rc=0
+
+ log "Mounting $device on $facet..."
+ start $facet $device $mnt_opts || return ${PIPESTATUS[0]}
+
+ if [ "$FAILURE_MODE" = "HARD" ]; then
+ shutdown_facet $facet
+ reboot_facet $facet
+ wait_for $facet
+ else
+ replay_barrier_nodf $facet
+ fi
+
+ log "Mounting $device on $failover_facet..."
+ start $failover_facet $device $mnt_opts
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 0 ]; then
+ error_noexit "mount $device on $failover_facet should succeed"
+ stop $facet || return ${PIPESTATUS[0]}
+ return $rc
+ fi
+
+ return 0
+}
+
+# Run e2fsck on the Lustre server target.
+run_e2fsck() {
+ local facet=$1
+ shift
+ local device=$1
+ shift
+ local opts="$@"
+
+ log "Running e2fsck on the device $device on $facet..."
+ do_facet $facet "$E2FSCK $opts $device"
+ return ${PIPESTATUS[0]}
+}
+
+# Check whether there are failover pairs for MDS and OSS servers.
+check_failover_pair() {
+ [ "$MMP_MDS" = "$MMP_MDS_FAILOVER" -o "$MMP_OSS" = "$MMP_OSS_FAILOVER" ] \
+ && { skip_env "failover pair is needed" && return 1; }
+ return 0
+}
+
+mmp_init
+
+# Test 1 - two mounts at the same time.
+test_1() {
+ check_failover_pair || return 0
+
+ mount_after_interval 0 0 || return ${PIPESTATUS[0]}
+ stop_services primary || return ${PIPESTATUS[0]}
+}
+run_test 1 "two mounts at the same time"
+
+# Test 2 - one mount delayed by mmp update interval.
+test_2() {
+ check_failover_pair || return 0
+
+ local mdt_interval=$(get_mmp_update_interval $MMP_MDS $MMP_MDSDEV)
+ local ost_interval=$(get_mmp_update_interval $MMP_OSS $MMP_OSTDEV)
+
+ mount_after_interval $mdt_interval $ost_interval || return ${PIPESTATUS[0]}
+ stop_services primary || return ${PIPESTATUS[0]}
+}
+run_test 2 "one mount delayed by mmp update interval"
+
+# Test 3 - one mount delayed by 2x mmp check interval.
+test_3() {
+ check_failover_pair || return 0
+
+ local mdt_interval=$(get_mmp_check_interval $MMP_MDS $MMP_MDSDEV)
+ local ost_interval=$(get_mmp_check_interval $MMP_OSS $MMP_OSTDEV)
+
+ mdt_interval=$((2 * $mdt_interval + 1))
+ ost_interval=$((2 * $ost_interval + 1))
+
+ mount_after_interval $mdt_interval $ost_interval || return ${PIPESTATUS[0]}
+ stop_services primary || return ${PIPESTATUS[0]}
+}
+run_test 3 "one mount delayed by 2x mmp check interval"
+
+# Test 4 - one mount delayed by > 2x mmp check interval.
+test_4() {
+ check_failover_pair || return 0
+
+ local mdt_interval=$(get_mmp_check_interval $MMP_MDS $MMP_MDSDEV)
+ local ost_interval=$(get_mmp_check_interval $MMP_OSS $MMP_OSTDEV)
+
+ mdt_interval=$((4 * $mdt_interval))
+ ost_interval=$((4 * $ost_interval))
+
+ mount_after_interval $mdt_interval $ost_interval || return ${PIPESTATUS[0]}
+ stop_services primary || return ${PIPESTATUS[0]}
+}
+run_test 4 "one mount delayed by > 2x mmp check interval"
+
+# Test 5 - mount during unmount of the first filesystem.
+test_5() {
+ local rc=0
+ check_failover_pair || return 0
+
+ mount_during_unmount $MMP_MDSDEV $MMP_MDS $MDS_MOUNT_OPTS || \
+ return ${PIPESTATUS[0]}
+
+ echo
+ start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
+ mount_during_unmount $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 0 ]; then
+ stop $MMP_MDS || return ${PIPESTATUS[0]}
+ return $rc
+ fi
+
+ stop $MMP_MDS || return ${PIPESTATUS[0]}
+}
+run_test 5 "mount during unmount of the first filesystem"
+
+# Test 6 - mount after clean unmount.
+test_6() {
+ local rc=0
+ check_failover_pair || return 0
+
+ mount_after_unmount $MMP_MDSDEV $MMP_MDS $MDS_MOUNT_OPTS || \
+ return ${PIPESTATUS[0]}
+
+ echo
+ mount_after_unmount $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 0 ]; then
+ stop $MMP_MDS_FAILOVER || return ${PIPESTATUS[0]}
+ return $rc
+ fi
+
+ stop_services failover || return ${PIPESTATUS[0]}
+}
+run_test 6 "mount after clean unmount"
+
+# Test 7 - mount after reboot.
+test_7() {
+ local rc=0
+ check_failover_pair || return 0
+
+ mount_after_reboot $MMP_MDSDEV $MMP_MDS $MDS_MOUNT_OPTS || \
+ return ${PIPESTATUS[0]}
+
+ echo
+ mount_after_reboot $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 0 ]; then
+ stop $MMP_MDS || return ${PIPESTATUS[0]}
+ stop $MMP_MDS_FAILOVER || return ${PIPESTATUS[0]}
+ return $rc
+ fi
+
+ stop_services failover || return ${PIPESTATUS[0]}
+ stop_services primary || return ${PIPESTATUS[0]}
+}
+run_test 7 "mount after reboot"
+
+# Test 8 - mount during e2fsck (should never succeed).
+test_8() {
+ local e2fsck_pid
+
+ run_e2fsck $MMP_MDS $MMP_MDSDEV "-fy" &
+ e2fsck_pid=$!
+ sleep 1
+
+ log "Mounting $MMP_MDSDEV on $MMP_MDS_FAILOVER..."
+ if start $MMP_MDS_FAILOVER $MMP_MDSDEV $MDS_MOUNT_OPTS; then
+ error_noexit "mount $MMP_MDSDEV on $MMP_MDS_FAILOVER should fail"
+ stop $MMP_MDS_FAILOVER || return ${PIPESTATUS[0]}
+ return 1
+ fi
+
+ wait $e2fsck_pid
+
+ echo
+ run_e2fsck $MMP_OSS $MMP_OSTDEV "-fy" &
+ e2fsck_pid=$!
+ sleep 1
+
+ log "Mounting $MMP_OSTDEV on $MMP_OSS_FAILOVER..."
+ if start $MMP_OSS_FAILOVER $MMP_OSTDEV $OST_MOUNT_OPTS; then
+ error_noexit "mount $MMP_OSTDEV on $MMP_OSS_FAILOVER should fail"
+ stop $MMP_OSS_FAILOVER || return ${PIPESTATUS[0]}
+ return 2
+ fi
+
+ wait $e2fsck_pid
+ return 0
+}
+run_test 8 "mount during e2fsck"
+
+# Test 9 - mount after aborted e2fsck (should never succeed).
+test_9() {
+ local e2fsck_pid
+ local mdt_mmp_check_interval
+ local ost_mmp_check_interval
+
+ start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
+ if ! start $MMP_OSS $MMP_OSTDEV $OST_MOUNT_OPTS; then
+ local rc=${PIPESTATUS[0]}
+ stop $MMP_MDS || return ${PIPESTATUS[0]}
+ return $rc
+ fi
+ stop_services primary || return ${PIPESTATUS[0]}
+
+ mdt_mmp_check_interval=$(get_mmp_check_interval $MMP_MDS $MMP_MDSDEV)
+ run_e2fsck $MMP_MDS_FAILOVER $MMP_MDSDEV "-fy" &
+ e2fsck_pid=$!
+ sleep $((2 * $mdt_mmp_check_interval + 1))
+ kill -s ABRT $e2fsck_pid
+
+ log "Mounting $MMP_MDSDEV on $MMP_MDS..."
+ if start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS; then
+ error_noexit "mount $MMP_MDSDEV on $MMP_MDS should fail"
+ stop $MMP_MDS || return ${PIPESTATUS[0]}
+ return 1
+ fi
+
+ reset_mmp_block $MMP_MDS $MMP_MDSDEV || return ${PIPESTATUS[0]}
+
+ echo
+ ost_mmp_check_interval=$(get_mmp_check_interval $MMP_OSS $MMP_OSTDEV)
+ run_e2fsck $MMP_OSS_FAILOVER $MMP_OSTDEV "-fy" &
+ e2fsck_pid=$!
+ sleep $((2 * $ost_mmp_check_interval + 1))
+ kill -s ABRT $e2fsck_pid
+
+ log "Mounting $MMP_OSTDEV on $MMP_OSS..."
+ if start $MMP_OSS $MMP_OSTDEV $OST_MOUNT_OPTS; then
+ error_noexit "mount $MMP_OSTDEV on $MMP_OSS should fail"
+ stop $MMP_OSS || return ${PIPESTATUS[0]}
+ return 2
+ fi
+
+ reset_mmp_block $MMP_OSS $MMP_OSTDEV || return ${PIPESTATUS[0]}
+ return 0
+}
+run_test 9 "mount after aborted e2fsck"
+
+# Test 10 - e2fsck with mounted filesystem.
+test_10() {
+ local rc=0
+
+ log "Mounting $MMP_MDSDEV on $MMP_MDS..."
+ start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
+
+ run_e2fsck $MMP_MDS_FAILOVER $MMP_MDSDEV "-fn"
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 8 ]; then
+ error_noexit "e2fsck $MMP_MDSDEV on $MMP_MDS_FAILOVER should return 8"
+ stop $MMP_MDS || return ${PIPESTATUS[0]}
+ [ $rc -ne 0 ] && return $rc || return 1
+ fi
+
+ log "Mounting $MMP_OSTDEV on $MMP_OSS..."
+ start $MMP_OSS $MMP_OSTDEV $OST_MOUNT_OPTS
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 0 ]; then
+ stop $MMP_MDS || return ${PIPESTATUS[0]}
+ return $rc
+ fi
+
+ run_e2fsck $MMP_OSS_FAILOVER $MMP_OSTDEV "-fn"
+ rc=${PIPESTATUS[0]}
+ if [ $rc -ne 8 ]; then
+ error_noexit "e2fsck $MMP_OSTDEV on $MMP_OSS_FAILOVER should return 8"
+ stop_services primary || return ${PIPESTATUS[0]}
+ [ $rc -ne 0 ] && return $rc || return 1
+ fi
+
+ stop_services primary || return ${PIPESTATUS[0]}
+ return 0
+}
+run_test 10 "e2fsck with mounted filesystem"
+
+mmp_fini
+FAIL_ON_ERROR=$SAVED_FAIL_ON_ERROR
+
+equals_msg $(basename $0): test complete
+$MMP_RESTORE_MOUNT && setupall
+[ -f "$TESTSUITELOG" ] && cat $TESTSUITELOG && \
+ grep -q FAIL $TESTSUITELOG && exit 1 || true
+echo "$0: completed"