2 # -*- mode: Bash; tab-width: 4; indent-tabs-mode: t; -*-
3 # vim:shiftwidth=4:softtabstop=4:tabstop=4:
5 # Tests for multiple mount protection (MMP) feature.
7 # Run select tests by setting ONLY, or as arguments to the script.
8 # Skip specific tests by setting EXCEPT.
10 # e.g. ONLY="5 6" or ONLY="`seq 8 11`" or EXCEPT="7"
# ALWAYS_EXCEPT (the always-skipped test list, per the comment below) keeps
# a value supplied by the caller; otherwise it falls back to $MMP_EXCEPT.
15 # bug number for skipped test:
16 ALWAYS_EXCEPT=${ALWAYS_EXCEPT:-"$MMP_EXCEPT"}
17 # UPDATE THE COMMENT ABOVE WITH BUG NUMBERS WHEN CHANGING ALWAYS_EXCEPT!
# Resolve the directory containing this script by cd-ing into it and
# printing $PWD.
19 SRCDIR=$(cd $(dirname $0); echo $PWD)
# Put the script directory and its ../utils sibling ahead of the existing
# PATH, and append /sbin.
20 export PATH=$PWD/$SRCDIR:$SRCDIR:$SRCDIR/../utils:$PATH:/sbin
# LUSTRE defaults to the parent of the script directory unless already set.
22 LUSTRE=${LUSTRE:-$(cd $(dirname $0)/..; echo $PWD)}
23 . $LUSTRE/tests/test-framework.sh
# ":=" assigns the default config path to CONFIG when it is unset or empty;
# the resulting file is then sourced.
25 . ${CONFIG:=$LUSTRE/tests/cfg/$NAME.sh}
# Leave the script with exit status 0 when remote_mds_nodsh or
# remote_ost_nodsh succeeds (and the skip call itself succeeds).
28 remote_mds_nodsh && skip "remote MDS with nodsh" && exit 0
29 remote_ost_nodsh && skip "remote OST with nodsh" && exit 0
31 # Unmount and clean up the Lustre filesystem.
# Start from "nothing to restore"; this flag is executed at the very end of
# the script to decide whether setupall is run.
32 MMP_RESTORE_MOUNT=false
33 if is_mounted $MOUNT || is_mounted $MOUNT2; then
# $MOUNT or $MOUNT2 is currently mounted, so request a restore afterwards.
35 MMP_RESTORE_MOUNT=true
# Remember the current FAIL_ON_ERROR; it is put back at the end of the script.
38 SAVED_FAIL_ON_ERROR=$FAIL_ON_ERROR
43 # Get the failover facet for a given facet.
# Builds the candidate name "<facet>failover" and looks up the hosts of both
# facets with facet_host.
# NOTE(review): $facet is presumably taken from the first argument and the
# result presumably printed on stdout (callers use command substitution);
# neither line is visible in this view -- confirm.
44 get_failover_facet() {
46 local failover_facet=${facet}failover
48 local host=$(facet_host $facet)
49 local failover_host=$(facet_host $failover_facet)
# True when no failover host is known or when it is the same host that
# serves $facet; the action taken in that case is on the continuation line.
51 [ -z "$failover_host" -o "$host" = "$failover_host" ] && \
57 # Initialize the variables for Lustre servers and targets.
# MDS facet under test: a caller-supplied MMP_MDS wins, else $SINGLEMDS.
59 MMP_MDS=${MMP_MDS:-$SINGLEMDS}
60 MMP_MDS_FAILOVER=$(get_failover_facet $MMP_MDS)
# tr -d deletes every 'm', 'd' and 's' character (it is a character set, not
# a substring), leaving e.g. "1" from "mds1"; the result is handed to
# mdsdevname to obtain MMP_MDSDEV.
62 local mds_num=$(echo $MMP_MDS | tr -d "mds")
63 MMP_MDSDEV=$(mdsdevname $mds_num)
# OSS facet under test: a caller-supplied MMP_OSS wins, else ost1.
65 MMP_OSS=${MMP_OSS:-ost1}
66 MMP_OSS_FAILOVER=$(get_failover_facet $MMP_OSS)
# Same extraction for the OST facet: 'o', 's' and 't' are deleted
# (e.g. "ost1" -> "1") and the result is handed to ostdevname.
68 local oss_num=$(echo $MMP_OSS | tr -d "ost")
69 MMP_OSTDEV=$(ostdevname $oss_num)
72 # Stop the MDS and OSS services on the primary or failover servers.
# NOTE(review): the assignments of $flavor, $opts and the default facets are
# not visible in this view -- confirm against the full function.
80 if [ "$flavor" = "failover" ]; then
# Target the failover facets.
81 mds_facet=$MMP_MDS_FAILOVER
82 oss_facet=$MMP_OSS_FAILOVER
# Stop the MDS facet first, then the OSS facet; give up at the first failure
# and return the exit status of the stop command that failed.
88 stop $mds_facet $opts || return ${PIPESTATUS[0]}
89 stop $oss_facet $opts || return ${PIPESTATUS[0]}
92 # Enable the MMP feature.
# Runs "$TUNE2FS -O mmp" against $device through do_facet for $facet and
# returns the exit status of that do_facet call.
# NOTE(review): $facet and $device are presumably the first and second
# arguments (callers pass facet, then device) -- confirm.
97 do_facet $facet "$TUNE2FS -O mmp $device"
98 return ${PIPESTATUS[0]}
101 # Disable the MMP feature.
# Runs "$TUNE2FS -O ^mmp" against $device through do_facet for $facet and
# returns the exit status of that do_facet call.  Assuming $TUNE2FS is
# tune2fs, the leading '^' requests that the feature be cleared.
106 do_facet $facet "$TUNE2FS -O ^mmp $device"
107 return ${PIPESTATUS[0]}
110 # Set the MMP block to 'fsck' state.
# Runs the mmp_mark.sh helper from $LUSTRE/tests against $device through
# do_facet for $facet and returns the exit status of that do_facet call.
115 do_facet $facet "$LUSTRE/tests/mmp_mark.sh $device"
116 return ${PIPESTATUS[0]}
119 # Reset the MMP block (if any) back to the clean state.
# Runs "$TUNE2FS -f -E clear-mmp" against $device through do_facet for
# $facet and returns the exit status of that do_facet call.
124 do_facet $facet "$TUNE2FS -f -E clear-mmp $device"
125 return ${PIPESTATUS[0]}
128 # Check whether the MMP feature is enabled or not.
# The whole "$DUMPE2FS -h ... | grep mmp" pipeline is passed to do_facet as
# one command string, so the value returned here is the status of do_facet
# itself.
# NOTE(review): presumably that status reflects whether grep found "mmp" in
# the dumped header -- confirm against do_facet.
133 do_facet $facet "$DUMPE2FS -h $device | grep mmp"
134 return ${PIPESTATUS[0]}
137 # Get MMP update interval (in seconds) from the Lustre server target.
# NOTE(review): $facet and $device are presumably the first and second
# arguments, and the result is presumably echoed (callers use command
# substitution); those lines are not visible in this view -- confirm.
138 get_mmp_update_interval() {
# Take the fourth space-separated field of the "MMP Update Interval" line
# printed by "$DEBUGFS -c -R dump_mmp"; its stderr is discarded.
143 interval=$(do_facet $facet "$DEBUGFS -c -R dump_mmp $device 2>/dev/null \
144 | grep 'MMP Update Interval' | cut -d' ' -f4")
# Fall back to 1 when nothing could be extracted.
145 [ -z "$interval" ] && interval=1
150 # Get MMP check interval (in seconds) from the Lustre server target.
# NOTE(review): $facet and $device are presumably the first and second
# arguments, and the result is presumably echoed (callers use command
# substitution); those lines are not visible in this view -- confirm.
151 get_mmp_check_interval() {
# Take the fourth space-separated field of the "MMP Check Interval" line
# printed by "$DEBUGFS -c -R dump_mmp"; its stderr is discarded.
156 interval=$(do_facet $facet "$DEBUGFS -c -R dump_mmp $device 2>/dev/null \
157 | grep 'MMP Check Interval' | cut -d' ' -f4")
# Fall back to 5 when nothing could be extracted.
158 [ -z "$interval" ] && interval=5
163 # Enable the MMP feature on the Lustre server targets.
# Both the MDS and the OSS facet must report the ldiskfs fstype; otherwise
# skip is called.
167 if [ $(facet_fstype $MMP_MDS) != ldiskfs ]; then
168 skip "Only applicable to ldiskfs-based MDTs"
172 if [ $(facet_fstype $MMP_OSS) != ldiskfs ]; then
173 skip "Only applicable to ldiskfs-based OSTs"
177 # The MMP feature is automatically enabled by mkfs.lustre for
178 # new file system at format time if failover is being used.
179 # Otherwise, the Lustre administrator has to manually enable
180 # this feature when the file system is unmounted.
# $var holds the NAME of the "<facet>failover_HOST" variable; ${!var} is the
# indirect expansion of that name.  An empty value is treated as "failover
# is not used" for that facet.
182 local var=${MMP_MDS}failover_HOST
183 if [ -z "${!var}" ]; then
184 log "Failover is not used on MDS, enabling MMP manually..."
185 enable_mmp $MMP_MDS $MMP_MDSDEV || \
186 error "failed to enable MMP on $MMP_MDSDEV on $MMP_MDS"
# Same check and manual enable for the OSS facet.
189 var=${MMP_OSS}failover_HOST
190 if [ -z "${!var}" ]; then
191 log "Failover is not used on OSS, enabling MMP manually..."
192 enable_mmp $MMP_OSS $MMP_OSTDEV || \
193 error "failed to enable MMP on $MMP_OSTDEV on $MMP_OSS"
196 # Verify that the MMP feature is now enabled on both targets.
197 mmp_is_enabled $MMP_MDS $MMP_MDSDEV || \
198 error "MMP was not enabled on $MMP_MDSDEV on $MMP_MDS"
200 mmp_is_enabled $MMP_OSS $MMP_OSTDEV || \
201 error "MMP was not enabled on $MMP_OSTDEV on $MMP_OSS"
204 # Disable the MMP feature on the Lustre server targets
205 # which did not use failover.
# $var holds the NAME of the "<facet>failover_HOST" variable; ${!var} is the
# indirect expansion of that name.  MMP is only turned off when that value
# is empty.
208 local var=${MMP_MDS}failover_HOST
209 if [ -z "${!var}" ]; then
210 log "Failover is not used on MDS, disabling MMP manually..."
211 disable_mmp $MMP_MDS $MMP_MDSDEV || \
212 error "failed to disable MMP on $MMP_MDSDEV on $MMP_MDS"
# mmp_is_enabled succeeding here means the feature is still on: an error.
213 mmp_is_enabled $MMP_MDS $MMP_MDSDEV && \
214 error "MMP was not disabled on $MMP_MDSDEV on $MMP_MDS"
# Same sequence for the OSS facet.
217 var=${MMP_OSS}failover_HOST
218 if [ -z "${!var}" ]; then
219 log "Failover is not used on OSS, disabling MMP manually..."
220 disable_mmp $MMP_OSS $MMP_OSTDEV || \
221 error "failed to disable MMP on $MMP_OSTDEV on $MMP_OSS"
222 mmp_is_enabled $MMP_OSS $MMP_OSTDEV && \
223 error "MMP was not disabled on $MMP_OSTDEV on $MMP_OSS"
229 # Mount the shared target on the failover server some interval after it
230 # has been mounted on the primary server.
# NOTE(review): the assignments of $interval, $device, $facet and $opts are
# not visible in this view; the caller passes them in that order -- confirm.
231 mount_after_interval_sub() {
239 local failover_facet=$(get_failover_facet $facet)
242 local first_mount_rc=0
243 local second_mount_rc=0
245 log "Mounting $device on $facet..."
# The first mount is launched in the background so that the second mount
# can be attempted while it is still in progress or already active.
246 start $facet $device $opts &
249 if [ $interval -ne 0 ]; then
250 log "sleep $interval..."
254 log "Mounting $device on $failover_facet..."
255 start $failover_facet $device $opts
256 second_mount_rc=${PIPESTATUS[0]}
# NOTE(review): presumably preceded by a wait on the background mount, whose
# status is captured here; that line is not visible -- confirm.
259 first_mount_rc=${PIPESTATUS[0]}
# Both mounts succeeding is a failure: report it, then stop the primary
# facet and (when it is a different facet) the failover facet.
261 if [ $second_mount_rc -eq 0 -a $first_mount_rc -eq 0 ]; then
262 error_noexit "one mount delayed by mmp interval $interval should fail"
263 stop $facet || return ${PIPESTATUS[0]}
264 [ "$failover_facet" != "$facet" ] && stop $failover_facet || \
265 return ${PIPESTATUS[0]}
# Both mounts failing is reported as an error too; the first mount's status
# is returned.
267 elif [ $second_mount_rc -ne 0 -a $first_mount_rc -ne 0 ]; then
268 error_noexit "mount failure on failover pair $facet,$failover_facet"
269 return $first_mount_rc
# Run the delayed double-mount check on the MDT, then on the OST.
#   $1 - interval passed for the MDT ($MMP_MDSDEV on $MMP_MDS)
#   $2 - interval passed for the OST ($MMP_OSTDEV on $MMP_OSS)
275 mount_after_interval() {
276 local mdt_interval=$1
277 local ost_interval=$2
# A failure on the MDT aborts immediately with that failure's status.
280 mount_after_interval_sub $mdt_interval $MMP_MDSDEV $MMP_MDS \
281 $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
284 mount_after_interval_sub $ost_interval $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
# NOTE(review): $rc is presumably the status of the OST call above, saved on
# a line that is not visible in this view -- confirm.
286 if [ $rc -ne 0 ]; then
294 # Mount the shared target on the failover server
295 # while it is being unmounted on the primary server.
# NOTE(review): the assignments of $device, $facet and $mnt_opts are not
# visible in this view; callers pass device, facet, mount options -- confirm.
296 mount_during_unmount() {
302 local failover_facet=$(get_failover_facet $facet)
308 log "Mounting $device on $facet..."
309 start $facet $device $mnt_opts || return ${PIPESTATUS[0]}
# NOTE(review): the unmount command itself is not visible here; presumably
# it is started in the background so the mount below overlaps it -- confirm.
311 log "Unmounting $device on $facet..."
315 log "Mounting $device on $failover_facet..."
316 start $failover_facet $device $mnt_opts
317 mount_rc=${PIPESTATUS[0]}
# NOTE(review): presumably captured after waiting for the unmount -- confirm.
320 unmount_rc=${PIPESTATUS[0]}
# The overlapping mount is expected to fail; if it succeeded, report that
# and stop the failover facet again.
322 if [ $mount_rc -eq 0 ]; then
323 error_noexit "mount during unmount of the first filesystem should fail"
324 stop $failover_facet || return ${PIPESTATUS[0]}
# The unmount on the primary facet is expected to succeed.
328 if [ $unmount_rc -ne 0 ]; then
329 error_noexit "unmount the $device on $facet should succeed"
336 # Mount the shared target on the failover server
337 # after cleanly unmounting it on the primary server.
# Each of the three steps returns the failing command's exit status as soon
# as it fails.
# NOTE(review): the assignments of $device, $facet and $mnt_opts are not
# visible in this view; callers pass device, facet, mount options -- confirm.
338 mount_after_unmount() {
344 local failover_facet=$(get_failover_facet $facet)
346 log "Mounting $device on $facet..."
347 start $facet $device $mnt_opts || return ${PIPESTATUS[0]}
349 log "Unmounting $device on $facet..."
350 stop $facet || return ${PIPESTATUS[0]}
352 log "Mounting $device on $failover_facet..."
353 start $failover_facet $device $mnt_opts || return ${PIPESTATUS[0]}
358 # Mount the shared target on the failover server after rebooting
359 # the primary server.
# NOTE(review): the assignments of $device, $facet and $mnt_opts are not
# visible in this view; callers pass device, facet, mount options -- confirm.
360 mount_after_reboot() {
366 local failover_facet=$(get_failover_facet $facet)
369 log "Mounting $device on $facet..."
370 start $facet $device $mnt_opts || return ${PIPESTATUS[0]}
# With FAILURE_MODE=HARD the facet is shut down and then waited for.
# NOTE(review): lines between these calls and the branch that leads to
# replay_barrier_nodf are not visible -- confirm the exact structure.
372 if [ "$FAILURE_MODE" = "HARD" ]; then
373 shutdown_facet $facet
375 wait_for_facet $facet
377 replay_barrier_nodf $facet
380 log "Mounting $device on $failover_facet..."
381 start $failover_facet $device $mnt_opts
# NOTE(review): $rc is presumably the status of the start above, saved on a
# line that is not visible in this view -- confirm.
383 if [ $rc -ne 0 ]; then
384 error_noexit "mount $device on $failover_facet should succeed"
385 stop $facet || return ${PIPESTATUS[0]}
392 # Run e2fsck on the Lustre server target.
# Runs "$E2FSCK $opts" against $device through do_facet for $facet and
# returns the exit status of that do_facet call.
# NOTE(review): callers pass facet, device and an option string in that
# order; the argument assignments are not visible in this view -- confirm.
400 log "Running e2fsck on the device $device on $facet..."
401 do_facet $facet "$E2FSCK $opts $device"
402 return ${PIPESTATUS[0]}
405 # Run delayed e2fsck on the Lustre server target.
# Runs the e2fsck.exp helper from $LUSTRE/tests against $device through
# do_facet for $facet and returns the exit status of that do_facet call.
411 do_facet $facet "$LUSTRE/tests/e2fsck.exp $device"
412 return ${PIPESTATUS[0]}
415 # Check whether there are failover pairs for MDS and OSS servers.
# If either facet is its own failover facet, skip_env is called and (when
# skip_env succeeds) the function returns 1.  Tests call this as
# "check_failover_pair || return 0".
416 check_failover_pair() {
417 [ "$MMP_MDS" = "$MMP_MDS_FAILOVER" -o "$MMP_OSS" = "$MMP_OSS_FAILOVER" ] \
418 && { skip_env "failover pair is needed" && return 1; }
424 # Test 1 - two mounts at the same time.
# Without a failover pair the test body ends early with status 0.
426 check_failover_pair || return 0
# Interval 0 for both the MDT and the OST.
428 mount_after_interval 0 0 || return ${PIPESTATUS[0]}
429 stop_services primary || return ${PIPESTATUS[0]}
431 run_test 1 "two mounts at the same time"
433 # Test 2 - one mount delayed by mmp update interval.
# Without a failover pair the test body ends early with status 0.
435 check_failover_pair || return 0
# Use each target's own MMP update interval as the delay.
437 local mdt_interval=$(get_mmp_update_interval $MMP_MDS $MMP_MDSDEV)
438 local ost_interval=$(get_mmp_update_interval $MMP_OSS $MMP_OSTDEV)
440 mount_after_interval $mdt_interval $ost_interval || return ${PIPESTATUS[0]}
441 stop_services primary || return ${PIPESTATUS[0]}
443 run_test 2 "one mount delayed by mmp update interval"
445 # Test 3 - one mount delayed by 2x mmp check interval.
# Without a failover pair the test body ends early with status 0.
447 check_failover_pair || return 0
449 local mdt_interval=$(get_mmp_check_interval $MMP_MDS $MMP_MDSDEV)
450 local ost_interval=$(get_mmp_check_interval $MMP_OSS $MMP_OSTDEV)
# Delay is twice the check interval plus one second.
452 mdt_interval=$((2 * $mdt_interval + 1))
453 ost_interval=$((2 * $ost_interval + 1))
455 mount_after_interval $mdt_interval $ost_interval || return ${PIPESTATUS[0]}
456 stop_services primary || return ${PIPESTATUS[0]}
458 run_test 3 "one mount delayed by 2x mmp check interval"
460 # Test 4 - one mount delayed by > 2x mmp check interval.
# Without a failover pair the test body ends early with status 0.
462 check_failover_pair || return 0
464 local mdt_interval=$(get_mmp_check_interval $MMP_MDS $MMP_MDSDEV)
465 local ost_interval=$(get_mmp_check_interval $MMP_OSS $MMP_OSTDEV)
# Delay is four times the check interval.
467 mdt_interval=$((4 * $mdt_interval))
468 ost_interval=$((4 * $ost_interval))
470 mount_after_interval $mdt_interval $ost_interval || return ${PIPESTATUS[0]}
471 stop_services primary || return ${PIPESTATUS[0]}
473 run_test 4 "one mount delayed by > 2x mmp check interval"
475 # Test 5 - mount during unmount of the first filesystem.
# Without a failover pair the test body ends early with status 0.
478 check_failover_pair || return 0
# MDT first; a failure ends the test with that status.
480 mount_during_unmount $MMP_MDSDEV $MMP_MDS $MDS_MOUNT_OPTS || \
481 return ${PIPESTATUS[0]}
# Bring the MDS up again on the primary facet before exercising the OST.
484 start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
485 mount_during_unmount $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
# NOTE(review): $rc is presumably the status of the OST check above, saved
# on a line that is not visible in this view -- confirm.  The MDS is stopped
# on both the failure path and the normal path.
487 if [ $rc -ne 0 ]; then
488 stop $MMP_MDS || return ${PIPESTATUS[0]}
492 stop $MMP_MDS || return ${PIPESTATUS[0]}
494 run_test 5 "mount during unmount of the first filesystem"
496 # Test 6 - mount after clean unmount.
# Without a failover pair the test body ends early with status 0.
499 check_failover_pair || return 0
# MDT first; a failure ends the test with that status.
501 mount_after_unmount $MMP_MDSDEV $MMP_MDS $MDS_MOUNT_OPTS || \
502 return ${PIPESTATUS[0]}
505 mount_after_unmount $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
# NOTE(review): $rc is presumably the status of the OST check above, saved
# on a line that is not visible in this view -- confirm.  On failure only
# the MDS failover facet is stopped here.
507 if [ $rc -ne 0 ]; then
508 stop $MMP_MDS_FAILOVER || return ${PIPESTATUS[0]}
# Normal path: stop the services on the failover facets.
512 stop_services failover || return ${PIPESTATUS[0]}
514 run_test 6 "mount after clean unmount"
516 # Test 7 - mount after reboot.
# Without a failover pair the test body ends early with status 0.
519 check_failover_pair || return 0
# MDT first; a failure ends the test with that status.
521 mount_after_reboot $MMP_MDSDEV $MMP_MDS $MDS_MOUNT_OPTS || \
522 return ${PIPESTATUS[0]}
525 mount_after_reboot $MMP_OSTDEV $MMP_OSS $OST_MOUNT_OPTS
# NOTE(review): $rc is presumably the status of the OST check above, saved
# on a line that is not visible in this view -- confirm.  On failure the MDS
# is stopped on both its primary and its failover facet.
527 if [ $rc -ne 0 ]; then
528 stop $MMP_MDS || return ${PIPESTATUS[0]}
529 stop $MMP_MDS_FAILOVER || return ${PIPESTATUS[0]}
# Normal path: stop the failover services, then the primary ones.
533 stop_services failover || return ${PIPESTATUS[0]}
534 stop_services primary || return ${PIPESTATUS[0]}
536 run_test 7 "mount after reboot"
538 # Test 8 - mount during e2fsck (should never succeed).
542 log "Force e2fsck checking on device $MMP_MDSDEV on $MMP_MDS"
# Write free_blocks_count=0 into the superblock with the debugfs "ssv"
# request; per the log message above this is what forces e2fsck to check.
543 do_facet $MMP_MDS "$DEBUGFS -w -R 'ssv free_blocks_count 0' $MMP_MDSDEV"
# The delayed e2fsck runs in the background while the mount is attempted.
544 run_delay_e2fsck $MMP_MDS $MMP_MDSDEV &
# A successful mount on the failover facet is the failure case; the facet is
# stopped again afterwards.
548 if start $MMP_MDS_FAILOVER $MMP_MDSDEV $MDS_MOUNT_OPTS; then
550 "mount $MMP_MDSDEV on $MMP_MDS_FAILOVER should fail"
551 stop $MMP_MDS_FAILOVER || return ${PIPESTATUS[0]}
# Same sequence for the OST.
558 log "Force e2fsck checking on device $MMP_OSTDEV on $MMP_OSS"
559 do_facet $MMP_OSS "$DEBUGFS -w -R 'ssv free_blocks_count 0' $MMP_OSTDEV"
560 run_delay_e2fsck $MMP_OSS $MMP_OSTDEV &
564 if start $MMP_OSS_FAILOVER $MMP_OSTDEV $OST_MOUNT_OPTS; then
566 "mount $MMP_OSTDEV on $MMP_OSS_FAILOVER should fail"
567 stop $MMP_OSS_FAILOVER || return ${PIPESTATUS[0]}
574 run_test 8 "mount during e2fsck"
576 # Test 9 - mount after aborted e2fsck (should never succeed).
# First start the MDS and the OSS on their primary facets, then stop them
# again; if the OSS cannot be started the MDS is stopped before bailing out.
578 start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
579 if ! start $MMP_OSS $MMP_OSTDEV $OST_MOUNT_OPTS; then
580 local rc=${PIPESTATUS[0]}
581 stop $MMP_MDS || return ${PIPESTATUS[0]}
584 stop_services primary || return ${PIPESTATUS[0]}
# Put the MDT's MMP block into the 'fsck' state via mark_mmp_block.
586 mark_mmp_block $MMP_MDS $MMP_MDSDEV || return ${PIPESTATUS[0]}
588 log "Mounting $MMP_MDSDEV on $MMP_MDS..."
# A successful mount is the failure case; the facet is stopped again.
589 if start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS; then
590 error_noexit "mount $MMP_MDSDEV on $MMP_MDS should fail"
591 stop $MMP_MDS || return ${PIPESTATUS[0]}
# Return the MDT's MMP block to the clean state.
595 reset_mmp_block $MMP_MDS $MMP_MDSDEV || return ${PIPESTATUS[0]}
# Same sequence for the OST.
597 mark_mmp_block $MMP_OSS $MMP_OSTDEV || return ${PIPESTATUS[0]}
599 log "Mounting $MMP_OSTDEV on $MMP_OSS..."
600 if start $MMP_OSS $MMP_OSTDEV $OST_MOUNT_OPTS; then
601 error_noexit "mount $MMP_OSTDEV on $MMP_OSS should fail"
602 stop $MMP_OSS || return ${PIPESTATUS[0]}
606 reset_mmp_block $MMP_OSS $MMP_OSTDEV || return ${PIPESTATUS[0]}
609 run_test 9 "mount after aborted e2fsck"
611 # Test 10 - e2fsck with mounted filesystem.
615 log "Mounting $MMP_MDSDEV on $MMP_MDS..."
616 start $MMP_MDS $MMP_MDSDEV $MDS_MOUNT_OPTS || return ${PIPESTATUS[0]}
# Run e2fsck with "-fn" from the failover facet while the MDT is mounted on
# the primary facet.
# NOTE(review): $rc below is presumably the status of this call, saved on a
# line that is not visible in this view -- confirm.
618 run_e2fsck $MMP_MDS_FAILOVER $MMP_MDSDEV "-fn"
621 # e2fsck is called with -n option (Open the filesystem read-only), so
622 # 0 (No errors) and 4 (File system errors left uncorrected) are the only
623 # acceptable exit codes in this case
624 if [ $rc -ne 0 ] && [ $rc -ne 4 ]; then
625 error_noexit "e2fsck $MMP_MDSDEV on $MMP_MDS_FAILOVER returned $rc"
626 stop $MMP_MDS || return ${PIPESTATUS[0]}
630 log "Mounting $MMP_OSTDEV on $MMP_OSS..."
631 start $MMP_OSS $MMP_OSTDEV $OST_MOUNT_OPTS
# If the OSS cannot be started, stop the MDS that is still running.
633 if [ $rc -ne 0 ]; then
634 stop $MMP_MDS || return ${PIPESTATUS[0]}
# Same read-only e2fsck check for the OST; again only 0 and 4 are accepted.
638 run_e2fsck $MMP_OSS_FAILOVER $MMP_OSTDEV "-fn"
640 if [ $rc -ne 0 ] && [ $rc -ne 4 ]; then
641 error_noexit "e2fsck $MMP_OSTDEV on $MMP_OSS_FAILOVER returned $rc"
644 stop_services primary || return ${PIPESTATUS[0]}
647 run_test 10 "e2fsck with mounted filesystem"
# Put back the FAIL_ON_ERROR value that was saved before the tests ran.
650 FAIL_ON_ERROR=$SAVED_FAIL_ON_ERROR
# Report completion with the script's base name and bash's elapsed-seconds
# counter.
652 complete $(basename $0) $SECONDS
# MMP_RESTORE_MOUNT holds the word "true" or "false" and is executed as a
# command, so setupall only runs when a mount was detected at startup.
653 $MMP_RESTORE_MOUNT && setupall