X-Git-Url: https://git.whamcloud.com/?a=blobdiff_plain;f=lustre%2Ftests%2Fracer.sh;h=892e9eae7927adefb4b6fc11637319513aa8f878;hb=d292fb12a0bdcb3d8dae22767929b20b10d1197e;hp=f862012e357a8036cf8e272a339126b8c1e24f26;hpb=e4cf956f93a4384d19ea73e601a6651710703492;p=fs%2Flustre-release.git diff --git a/lustre/tests/racer.sh b/lustre/tests/racer.sh index f862012..892e9ea 100644 --- a/lustre/tests/racer.sh +++ b/lustre/tests/racer.sh @@ -1,3 +1,183 @@ #!/bin/bash +#set -vx +set -e -bash $(dirname $0)/runracer $@ +ONLY=${ONLY:-"$*"} +LUSTRE=${LUSTRE:-$(cd $(dirname $0)/..; echo $PWD)} +. $LUSTRE/tests/test-framework.sh +init_test_env $@ +. ${CONFIG:=$LUSTRE/tests/cfg/$NAME.sh} +init_logging + +racer=$LUSTRE/tests/racer/racer.sh +echo racer: $racer with $MDSCOUNT MDTs + +if [ "$SLOW" = "no" ]; then + DURATION=${DURATION:-300} +else + DURATION=${DURATION:-900} +fi +MOUNT_2=${MOUNT_2:-"yes"} + +build_test_filter +check_and_setup_lustre + +CLIENTS=${CLIENTS:-$HOSTNAME} +RACERDIRS=${RACERDIRS:-"$DIR $DIR2"} +echo RACERDIRS=$RACERDIRS + +RACER_FAILOVER=${RACER_FAILOVER:-false} +FAIL_TARGETS=${FAIL_TARGETS:-"MDS OST"} +RACER_FAILOVER_PERIOD=${RACER_FAILOVER_PERIOD:-60} + +if $RACER_FAILOVER; then + declare -a victims + for target in $FAIL_TARGETS; do + victims=(${victims[@]} $(get_facets $target)) + done + echo Victim facets ${victims[@]} +fi + +#LU-4684 +RACER_ENABLE_MIGRATION=false + +if ((MDSCOUNT > 1 && "$MDS1_VERSION" >= $(version_code 2.8.0))); then + RACER_ENABLE_REMOTE_DIRS=${RACER_ENABLE_REMOTE_DIRS:-true} + RACER_ENABLE_STRIPED_DIRS=${RACER_ENABLE_STRIPED_DIRS:-true} + RACER_ENABLE_MIGRATION=${RACER_ENABLE_MIGRATION:-true} +elif ((MDSCOUNT > 1 && "$MDS1_VERSION" >= $(version_code 2.5.0))); then + RACER_ENABLE_REMOTE_DIRS=${RACER_ENABLE_REMOTE_DIRS:-true} +fi + +[[ "$MDS1_VERSION" -lt $(version_code 2.9.54) || + $(facet_fstype mgs) != zfs ]] && RACER_ENABLE_SNAPSHOT=false + +[[ "$MDS1_VERSION" -le $(version_code 2.9.55) ]] && + RACER_ENABLE_PFL=false + +[[ "$MDS1_VERSION" -le $(version_code 2.10.53) ]] && + RACER_ENABLE_DOM=false + +[[ "$MDS1_VERSION" -lt $(version_code 2.10.55) ]] && + RACER_ENABLE_FLR=false + +RACER_ENABLE_REMOTE_DIRS=${RACER_ENABLE_REMOTE_DIRS:-false} +RACER_ENABLE_STRIPED_DIRS=${RACER_ENABLE_STRIPED_DIRS:-false} +RACER_ENABLE_MIGRATION=${RACER_ENABLE_MIGRATION:-false} +RACER_ENABLE_SNAPSHOT=${RACER_ENABLE_SNAPSHOT:-true} +RACER_ENABLE_PFL=${RACER_ENABLE_PFL:-true} +RACER_ENABLE_DOM=${RACER_ENABLE_DOM:-true} +RACER_ENABLE_FLR=${RACER_ENABLE_FLR:-true} + +fail_random_facet () { + local facets=${victims[@]} + facets=${facets// /,} + + sleep $RACER_FAILOVER_PERIOD + while [ ! -f $racer_done ]; do + local facet=$(get_random_entry $facets) + facet_failover $facet + sleep $RACER_FAILOVER_PERIOD + done +} + +# run racer +test_1() { + local rrc=0 + local rc=0 + local clients=$CLIENTS + local RDIRS + local i + local racer_done=$TMP/racer_done + + rm -f $racer_done + + for d in ${RACERDIRS}; do + is_mounted $d || continue + + RDIRS="$RDIRS $d/racer" + mkdir -p $d/racer + # lfs setstripe $d/racer -c -1 + if [ $MDSCOUNT -ge 2 ]; then + for i in $(seq $((MDSCOUNT - 1))); do + RDIRS="$RDIRS $d/racer$i" + if [ ! -e $d/racer$i ]; then + $LFS mkdir -i $i $d/racer$i || + error "lfs mkdir $i failed" + fi + done + fi + done + + local rpids="" + for rdir in $RDIRS; do + do_nodes $clients "DURATION=$DURATION \ + MDSCOUNT=$MDSCOUNT OSTCOUNT=$OSTCOUNT\ + RACER_ENABLE_REMOTE_DIRS=$RACER_ENABLE_REMOTE_DIRS \ + RACER_ENABLE_STRIPED_DIRS=$RACER_ENABLE_STRIPED_DIRS \ + RACER_ENABLE_MIGRATION=$RACER_ENABLE_MIGRATION \ + RACER_ENABLE_PFL=$RACER_ENABLE_PFL \ + RACER_ENABLE_DOM=$RACER_ENABLE_DOM \ + RACER_ENABLE_FLR=$RACER_ENABLE_FLR \ + RACER_MAX_CLEANUP_WAIT=$RACER_MAX_CLEANUP_WAIT \ + LFS=$LFS \ + LCTL=$LCTL \ + $racer $rdir $NUM_RACER_THREADS" & + pid=$! + rpids="$rpids $pid" + done + + local failpid="" + if $RACER_FAILOVER; then + fail_random_facet & + failpid=$! + echo racers failpid: $failpid + fi + + local lss_pids="" + if $RACER_ENABLE_SNAPSHOT; then + lss_gen_conf + + $LUSTRE/tests/racer/lss_create.sh & + pid=$! + lss_pids="$lss_pids $pid" + + $LUSTRE/tests/racer/lss_destroy.sh & + pid=$! + lss_pids="$lss_pids $pid" + fi + + echo racers pids: $rpids + for pid in $rpids; do + wait $pid + rc=$? + echo "pid=$pid rc=$rc" + if [ $rc != 0 ]; then + rrc=$((rrc + 1)) + fi + done + + if $RACER_FAILOVER; then + touch $racer_done + wait $failpid + rrc=$((rrc + $?)) + fi + + if $RACER_ENABLE_SNAPSHOT; then + killall -q lss_create.sh + killall -q lss_destroy.sh + + for pid in $lss_pids; do + wait $pid + done + + lss_cleanup + fi + + return $rrc +} +run_test 1 "racer on clients: ${CLIENTS:-$(hostname)} DURATION=$DURATION" + +complete $SECONDS +check_and_cleanup_lustre +exit_status