#!/bin/bash
# vim:expandtab:shiftwidth=4:softtabstop=4:tabstop=4:
-trap 'print_summary && echo "test-framework exiting on error"' ERR
+trap 'print_summary && touch $TF_FAIL && \
+ echo "test-framework exiting on error"' ERR
set -e
#set -x
-
export REFORMAT=${REFORMAT:-""}
export WRITECONF=${WRITECONF:-""}
export VERBOSE=false
. $EXCEPT_LIST_FILE
fi
+# Pick a default modprobe configuration file unless the caller preset one.
+if [ -z "$MODPROBECONF" ]; then
+    # Prefer the single-file config; otherwise fall back to the Lustre drop-in.
+    if [ -f /etc/modprobe.conf ]; then
+        MODPROBECONF=/etc/modprobe.conf
+    elif [ -f /etc/modprobe.d/Lustre ]; then
+        MODPROBECONF=/etc/modprobe.d/Lustre
+    fi
+fi
+
assert_DIR () {
local failed=""
[[ $DIR/ = $MOUNT/* ]] || \
/sbin/lsmod | grep -q $1
}
+# Load a module on the system where this is running.
+#
+# Synopsis: load_module module_name [module arguments for insmod/modprobe]
+#
+# module_name may be a path relative to $LUSTRE (callers pass names such as
+# ../lnet/lnet/lnet); only its basename is used when looking up
+# MODOPTS_<MODULE> or the "options" line in modprobe.conf.
+#
+# If module arguments are not given but MODOPTS_<MODULE> is set, then its value
+# will be used as the arguments. Otherwise arguments will be obtained from
+# /etc/modprobe.conf, from /etc/modprobe.d/Lustre, or else none will be used.
+#
load_module() {
+ local optvar
EXT=".ko"
module=$1
shift
module_loaded ${BASE} && return
+ # If no module arguments were passed, get them from $MODOPTS_<MODULE>, else from
+ # modprobe.conf
+ if [ $# -eq 0 ]; then
+ # $MODOPTS_<MODULE>; we could use associative arrays, but that's not in
+ # Bash until 4.x, so we resort to eval.
+ optvar="MODOPTS_$(basename $module | tr a-z A-Z)"
+ eval set -- \$$optvar
+ if [ $# -eq 0 -a -n "$MODPROBECONF" ]; then
+ # Nothing in $MODOPTS_<MODULE>; try modprobe.conf.
+ # Match on the module's basename: $module is typically a path
+ # (e.g. ../lnet/lnet/lnet), which never appears on an "options" line.
+ set -- $(grep "^options\\s*\<$(basename $module)\>" $MODPROBECONF)
+ # Get rid of "options <module name>"
+ (($# > 0)) && shift 2
+
+ # Ensure we have accept=all for lnet
+ if [ $(basename $module) = lnet ]; then
+ # OK, this is a bit wordy...
+ local arg accept_all_present=false
+ for arg in "$@"; do
+ [ "$arg" = accept=all ] && accept_all_present=true
+ done
+ $accept_all_present || set -- "$@" accept=all
+ fi
+ fi
+ fi
+
+ [ $# -gt 0 ] && echo "${module} options: '$*'"
+
+ # Note that insmod will ignore anything in modprobe.conf, which is why we're
+ # passing options on the command-line.
if [ "$BASE" == "lnet_selftest" ] && \
[ -f ${LUSTRE}/../lnet/selftest/${module}${EXT} ]; then
insmod ${LUSTRE}/../lnet/selftest/${module}${EXT}
-
elif [ -f ${LUSTRE}/${module}${EXT} ]; then
- insmod ${LUSTRE}/${module}${EXT} $@
+ insmod ${LUSTRE}/${module}${EXT} "$@"
else
# must be testing a "make install" or "rpm" installation
# note failed to load ptlrpc_gss is considered not fatal
if [ "$BASE" == "ptlrpc_gss" ]; then
- modprobe $BASE $@ 2>/dev/null || echo "gss/krb5 is not supported"
+ modprobe $BASE "$@" 2>/dev/null || echo "gss/krb5 is not supported"
else
- modprobe $BASE $@
+ modprobe $BASE "$@"
fi
fi
}
load_modules_local() {
if [ -n "$MODPROBE" ]; then
# use modprobe
- return 0
- fi
- if [ "$HAVE_MODULES" = true ]; then
- # we already loaded
+ echo "Using modprobe to load modules"
return 0
fi
- HAVE_MODULES=true
echo Loading modules from $LUSTRE
load_module ../libcfs/libcfs/libcfs
[ "$PTLDEBUG" ] && lctl set_param debug="$PTLDEBUG"
[ "$SUBSYSTEM" ] && lctl set_param subsystem_debug="${SUBSYSTEM# }"
- local MODPROBECONF=
- [ -f /etc/modprobe.conf ] && MODPROBECONF=/etc/modprobe.conf
- [ ! "$MODPROBECONF" -a -d /etc/modprobe.d ] && MODPROBECONF=/etc/modprobe.d/Lustre
- [ -z "$LNETOPTS" -a "$MODPROBECONF" ] && \
- LNETOPTS=$(awk '/^options lnet/ { print $0}' $MODPROBECONF | sed 's/^options lnet //g')
- echo $LNETOPTS | grep -q "accept=all" || LNETOPTS="$LNETOPTS accept=all";
- echo "lnet options: '$LNETOPTS'"
- # note that insmod will ignore anything in modprobe.conf
- load_module ../lnet/lnet/lnet $LNETOPTS
+ load_module ../lnet/lnet/lnet
LNETLND=${LNETLND:-"socklnd/ksocklnd"}
load_module ../lnet/klnds/$LNETLND
load_module lvfs/lvfs
fi
fi
- HAVE_MODULES=false
-
check_mem_leak || return 254
echo "modules unloaded."
local list=$1
dname=$2
- do_nodes --verbose $list "num=\\\$(ps -o cmd -C $dname | grep $dname | wc -l);
+ do_nodesv $list "num=\\\$(ps -o cmd -C $dname | grep $dname | wc -l);
if [ \\\"\\\$num\\\" -ne 1 ]; then
echo \\\$num instance of $dname;
exit 1;
fi
}
+# Remount a facet: calls stop on it and then mount_facet.
+#
+# Arguments: $1 - facet name, passed unchanged to both stop and mount_facet
+remount_facet() {
+ local facet=$1
+
+ stop $facet
+ mount_facet $facet
+}
+
reboot_facet() {
facet=$1
if [ "$FAILURE_MODE" = HARD ]; then
testnum=$((nodenum % numloads))
start_client_load ${clients[nodenum]} ${CLIENT_LOADS[testnum]}
done
+ # bug 22169: wait for the background threads to start
+ sleep 2
}
# only for remote client
local facet=$1
# Use default policy if $2 is not passed by caller.
- #define OBD_RECOVERY_TIMEOUT (obd_timeout * 5 / 2)
- # as we are in process of changing obd_timeout in different ways
- # let's set MAX longer than that
- local MAX=${2:-$(( TIMEOUT * 4 ))}
+ local MAX=${2:-$(max_recovery_time)}
local var_svc=${facet}_svc
local procfile="*.${!var_svc}.recovery_status"
return ${PIPESTATUS[0]}
}
+# Shorthand for "do_node --verbose": forwards every argument unchanged.
+do_nodev() {
+ do_node --verbose "$@"
+}
+
single_local_node () {
[ "$1" = "$HOSTNAME" ]
}
+# Outputs environment variable assignments that should be passed to remote nodes.
+#
+# Every MODOPTS_* variable that is set is printed as ' NAME="value"', all on a
+# single line, so the output can be spliced in front of a remote command and
+# each assignment ends up in that command's environment.  (With one assignment
+# per line the remote shell would run all but the last as separate commands.)
+# Double quotes embedded in a value are backslash-escaped so they cannot end
+# the surrounding quotes early.  Prints nothing when no MODOPTS_* is set.
+get_env_vars() {
+    local var
+    local value
+
+    for var in ${!MODOPTS_*}; do
+        value=${!var}
+        value=${value//\"/\\\"}
+        printf ' %s="%s"' "$var" "$value"
+    done
+}
+
do_nodes() {
local verbose=false
# do not strip off hostname if verbose, bug 19215
if single_local_node $rnodes; then
if $verbose; then
- do_node --verbose $rnodes $@
+ do_nodev $rnodes "$@"
else
- do_node $rnodes $@
+ do_node $rnodes "$@"
fi
return $?
fi
fi
if $verbose ; then
- $myPDSH $rnodes "(PATH=\$PATH:$RLUSTRE/utils:$RLUSTRE/tests:/sbin:/usr/sbin; cd $RPWD; LUSTRE=\"$RLUSTRE\" sh -c \"$@\")"
+ $myPDSH $rnodes "(PATH=\$PATH:$RLUSTRE/utils:$RLUSTRE/tests:/sbin:/usr/sbin; cd $RPWD; LUSTRE=\"$RLUSTRE\" $(get_env_vars) sh -c \"$@\")"
else
- $myPDSH $rnodes "(PATH=\$PATH:$RLUSTRE/utils:$RLUSTRE/tests:/sbin:/usr/sbin; cd $RPWD; LUSTRE=\"$RLUSTRE\" sh -c \"$@\")" | sed -re "s/\w+:\s//g"
+ $myPDSH $rnodes "(PATH=\$PATH:$RLUSTRE/utils:$RLUSTRE/tests:/sbin:/usr/sbin; cd $RPWD; LUSTRE=\"$RLUSTRE\" $(get_env_vars) sh -c \"$@\")" | sed -re "s/\w+:\s//g"
fi
return ${PIPESTATUS[0]}
}
do_node $HOST "$@"
}
+# Shorthand for "do_nodes --verbose": forwards every argument unchanged.
+do_nodesv() {
+ do_nodes --verbose "$@"
+}
+
add() {
local facet=$1
shift
rm -f $TMP/ost${num}active
done
+ if ! combined_mgs_mds ; then
+ stop mgs
+ fi
+
return 0
}
test $nr = 1 && echo -n $MDS_MKFS_OPTS || echo -n $MDSn_MKFS_OPTS
}
+# Returns 0 when the MGS uses the same device and the same host as mds1,
+# non-zero otherwise.
+# Reads: MDSDEV1, MGSDEV, mds1_HOST, mgs_HOST
+combined_mgs_mds () {
+    # Quote the right-hand sides: inside [[ ]] an unquoted RHS of == is a glob
+    # pattern, so a value containing *, ? or [ would not be compared literally.
+    [[ "$MDSDEV1" == "$MGSDEV" && "$mds1_HOST" == "$mgs_HOST" ]]
+}
+
formatall() {
if [ "$IAMDIR" == "yes" ]; then
MDS_MKFS_OPTS="$MDS_MKFS_OPTS --iam-dir"
load_modules
[ "$CLIENTONLY" ] && return
echo Formatting mgs, mds, osts
- if [[ $MDSDEV1 != $MGSDEV ]] || [[ $mds1_HOST != $mgs_HOST ]]; then
+ if ! combined_mgs_mds ; then
add mgs $mgs_MKFS_OPTS $FSTYPE_OPT --reformat $MGSDEV || exit 10
fi
do_facet mds$num "lctl set_param -n mdt.$MDT.identity_upcall \"NONE\""
fi
- do_facet mds$num "lctl set_param -n mdt/$MDT/identity_flush \"-1\""
+ do_facet mds$num "lctl set_param -n mdt/$MDT/identity_flush=-1"
if [ $old = "NONE" ]; then
return 1
echo Setup mgs, mdt, osts
echo $WRITECONF | grep -q "writeconf" && \
writeconf_all
- if [[ $mds1_HOST != $mgs_HOST ]] || [[ $MDSDEV1 != $MGSDEV ]]; then
+ if ! combined_mgs_mds ; then
start mgs $MGSDEV $mgs_MOUNT_OPTS
fi
[ $period -lt $timeout ] || log "$count OST are inactive after $timeout seconds, give up"
}
-som_check() {
- SOM_ENABLED=$(do_facet $SINGLEMDS "$LCTL get_param mdt.*.som" | awk -F= ' {print $2}' | head -n 1)
- echo $SOM_ENABLED
-}
-
init_param_vars () {
if ! remote_ost_nodsh && ! remote_mds_nodsh; then
export MDSVER=$(do_facet $SINGLEMDS "lctl get_param version" | cut -d. -f1,2)
osc_ensure_active $SINGLEMDS M $TIMEOUT
osc_ensure_active client c $TIMEOUT
- if [ x"$(som_check)" = x"enabled" ]; then
- ENABLE_QUOTA=""
- echo "disable quota temporary when SOM enabled"
- fi
if [ $QUOTA_AUTO -ne 0 ]; then
if [ "$ENABLE_QUOTA" ]; then
echo "enable quota as required"
is_mounted () {
local mntpt=$1
+ [ -z $mntpt ] && return 1
local mounted=$(mounted_lustre_filesystems)
echo $mounted' ' | grep -w -q $mntpt' '
return 1
fi
done
- if [[ $MDSDEV1 != $MGSDEV ]]; then
- stop mgs
- fi
-
return 0
}
+# Pass all arguments to error_noexit, then exit with status 1.
+# With this change the exit is unconditional: FAIL_ON_ERROR is no longer
+# consulted here and reset_fail_loc is no longer called before exiting.
error() {
error_noexit "$@"
- if $FAIL_ON_ERROR; then
- reset_fail_loc
- exit 1
- fi
+ exit 1
}
+# Forwards all arguments to error, which reports them and exits with status 1.
error_exit() {
- error_noexit "$@"
- exit 1
+ error "$@"
}
# use only if we are ignoring failures for this test, bugno required.
# print a newline if the last test was skipped
export LAST_SKIPPED=
+#
+# Main entry into test-framework. This is called with the name and
+# description of a test. The name is used to find the function to run
+# the test using "test_$name".
+#
+# This supports a variety of methods of specifying which tests to
+# run or skip. These need to be documented...
+#
run_test() {
assert_DIR
return $?
}
-EQUALS="======================================================================"
+# Forwards its arguments, joined into a single string by "$*", to banner.
equals_msg() {
- msg="$@"
-
- local suffixlen=$((${#EQUALS} - ${#msg}))
- [ $suffixlen -lt 5 ] && suffixlen=5
- log `echo $(printf '===== %s %.*s\n' "$msg" $suffixlen $EQUALS)`
+ banner "$*"
}
log() {
echo done.
}
+
+#
+# Log a message (on all nodes) padded with "=" before and after.
+# Also appends a timestamp and prepends the testsuite name.
+#
+# Arguments: $* - message text
+# Reads:     TESTSUITE, EQUALS
+# The padded line is handed to log; nothing is returned.
+#
+
+EQUALS="===================================================================================================="
+banner() {
+    # Keep the working variables local so a caller's own $msg / $last
+    # are not overwritten.
+    local msg="== ${TESTSUITE} $*"
+    local last=${msg: -1:1}
+    local pad
+
+    # Separate the text from the padding unless it already ends in "=" or " ".
+    [[ $last != "=" && $last != " " ]] && msg="$msg "
+
+    # Pad out to the width of $EQUALS.  Clamp at zero: printf treats a
+    # negative precision as absent and would emit the whole of $EQUALS
+    # after a message that is already too long.
+    pad=$((${#EQUALS} - ${#msg}))
+    ((pad > 0)) || pad=0
+    msg=$(printf '%s%.*s' "$msg" "$pad" "$EQUALS")
+    # always include at least == after the message
+    log "$msg== $(date +"%H:%M:%S (%s)")"
+}
+
+#
+# Run a single test function and cleanup after it.
+#
+# This function should be run in a subshell so the test func can
+# exit() without stopping the whole script.
+#
run_one() {
local testnum=$1
local message=$2
- local start_tm=$3
tfile=f${testnum}
export tdir=d0.${TESTSUITE}/d${base}
export TESTNAME=test_$testnum
local SAVE_UMASK=`umask`
umask 0022
- log "== test $testnum: $message == `date +%H:%M:%S` ($start_tm)"
+ banner "test $testnum: $message"
test_${testnum} || error "test_$testnum failed with $?"
cd $SAVE_PWD
reset_fail_loc
return 0
}
+#
+# Wrapper around run_one to ensure:
+# - test runs in subshell
+# - output of test is saved to separate log file for error reporting
+# - test result is saved to data file
+#
run_one_logged() {
local BEFORE=`date +%s`
local TEST_ERROR
rm -rf $LOGDIR/err
echo
- run_one $1 "$2" $BEFORE 2>&1 | tee $test_log
+ log_sub_test_begin test_${1}
+ (run_one $1 "$2") 2>&1 | tee $test_log
local RC=${PIPESTATUS[0]}
[ $RC -ne 0 ] && [ ! -f $LOGDIR/err ] && \
duration=$((`date +%s` - $BEFORE))
pass "(${duration}s)"
[ -f $LOGDIR/err ] && TEST_ERROR=$(cat $LOGDIR/err)
- log_sub_test test_${1} $TEST_STATUS $duration "$RC" "$TEST_ERROR"
+ log_sub_test_end $TEST_STATUS $duration "$RC" "$TEST_ERROR"
if [ -f $LOGDIR/err ]; then
$FAIL_ON_ERROR && exit $RC
+# Write the comma-separated node list $1 to the file $2, one node per line.
+# The file is removed first; returns 1 (after printing a message) as soon as
+# a node cannot be appended.
generate_machine_file() {
local nodes=${1//,/ }
local machinefile=$2
- rm -f $machinefile || error "can't rm $machinefile"
+ rm -f $machinefile
for node in $nodes; do
- echo $node >>$machinefile
+ echo $node >>$machinefile || \
+ { echo "can not generate machinefile $machinefile" && return 1; }
done
}
rm -f $file
}
+# Run "lfs setstripe" (through do_nodev) on the NFS server that /proc/mounts
+# lists for a directory.
+#
+# Arguments: $1 - directory to look up; a mount matches when $1 matches its
+#                 mount point (used as a regex), its type contains "nfs" and
+#                 its mount point is not "/"
+#            $@ - all arguments, including $1, are passed to lfs setstripe
+# Returns:   1 if no such mount is found, otherwise the status of do_nodev
+setstripe_nfsserver () {
+    local dir=$1
+
+    # Hand $dir to awk with -v instead of splicing it into the program text,
+    # so a path containing spaces or quotes cannot break the awk program.
+    local nfsserver=$(awk -v dir="$dir" \
+        'dir ~ $2 && $3 ~ "nfs" && $2 != "/" { print $1 }' /proc/mounts |
+        cut -f 1 -d : | head -1)
+
+    if [ -z "$nfsserver" ]; then
+        echo "$dir is not nfs mounted"
+        return 1
+    fi
+
+    do_nodev "$nfsserver" lfs setstripe "$@"
+}
+
check_runas_id_ret() {
local myRC=0
local myRUNAS_UID=$1
echo $IFree
}
+# Print one less than the number reported by inodes_available.
+mdsrate_inodes_available () {
+    local avail=$(inodes_available)
+
+    echo $((avail - 1))
+}
+
# reset llite stat counters
clear_llite_stats(){
lctl set_param -n llite.*.stats 0
# generate a stream of formatted strings (<node> <param name>=<param value>)
+# $1 is the node list handed to do_nodesv; $2 is the parameter pattern given
+# to "lctl get_param" on those nodes. Each line read from it is echoed back.
save_lustre_params() {
local s
- do_nodes --verbose $1 "lctl get_param $2 | while read s; do echo \\\$s; done"
+ do_nodesv $1 "lctl get_param $2 | while read s; do echo \\\$s; done"
}
# restore lustre parameters from input stream, produced by save_lustre_params
# Add paths to lustre tests for 32 and 64 bit systems.
local RPATH="$RLUSTRE/tests:/usr/lib/lustre/tests:/usr/lib64/lustre/tests:$PATH"
- do_nodes --verbose $list "PATH=$RPATH sh rpc.sh $@ "
+ do_nodesv $list "PATH=$RPATH sh rpc.sh $@ "
}
wait_clients_import_state () {
return
fi
- do_nodes --verbose $list \
+ do_nodesv $list \
"$LCTL dk > ${prefix}.debug_log.\\\$(hostname).${suffix};
dmesg > ${prefix}.dmesg.\\\$(hostname).${suffix}"
if [ ! -f $LOGDIR/shared ]; then
return $rc
}
+# target_start_and_reset_recovery_timer()
+# service_time = at_est2timeout(service_time);
+# service_time += 2 * (CONNECTION_SWITCH_MAX + CONNECTION_SWITCH_INC +
+# INITIAL_CONNECT_TIMEOUT);
+# CONNECTION_SWITCH_MAX : min(25U, max(CONNECTION_SWITCH_MIN,obd_timeout))
+#define CONNECTION_SWITCH_INC 1
+#define INITIAL_CONNECT_TIMEOUT max(CONNECTION_SWITCH_MIN,obd_timeout/20)
+#define CONNECTION_SWITCH_MIN 5U
+
+# Print an upper bound (seconds) for recovery, computed as
+#   $(at_max_get client) + 2 * (25 + 1 + init_connect_timeout)
+# where init_connect_timeout is max(5, TIMEOUT / 20) and 25 is the cap of
+# CONNECTION_SWITCH_MAX.
+# Reads: TIMEOUT
+max_recovery_time () {
+    local init_connect_timeout=$(( TIMEOUT / 20 ))
+    # Compare numerically: inside [[ ]] the > operator compares strings, so
+    # "10" would sort below "5" and be clamped down to 5.
+    (( init_connect_timeout > 5 )) || init_connect_timeout=5
+
+    local service_time=$(( $(at_max_get client) + 2 * (25 + 1 + init_connect_timeout) ))
+
+    echo $service_time
+}
+
get_clients_mount_count () {
local clients=${CLIENTS:-`hostname`}
yml_log_test $1 >> $YAML_LOG
}
-log_sub_test() {
- yml_log_sub_test $@ >> $YAML_LOG
+# Append the output of yml_log_test_status, called with this function's
+# arguments, to $YAML_LOG.
+log_test_status() {
+    # "$@" keeps each argument as one word (embedded spaces, empty strings).
+    yml_log_test_status "$@" >> "$YAML_LOG"
+}
+
+# Append the output of yml_log_sub_test_begin, called with this function's
+# arguments, to $YAML_LOG.
+log_sub_test_begin() {
+    # "$@" keeps each argument as one word (embedded spaces, empty strings).
+    yml_log_sub_test_begin "$@" >> "$YAML_LOG"
+}
+
+# Append the output of yml_log_sub_test_end, called with this function's
+# arguments, to $YAML_LOG.
+log_sub_test_end() {
+    # "$@" keeps each argument as one word, so a multi-word error message
+    # passed as the last argument is not re-split.
+    yml_log_sub_test_end "$@" >> "$YAML_LOG"
}
+# Run "llverdev --force" on a device, adding -p (partial/fast mode) when the
+# device is larger than 10 GiB.
+#
+# Arguments: $1 - device to verify: a block device listed in
+#                 /proc/partitions, or something else whose size stat can
+#                 report (e.g. a backing file)
+run_llverdev()
+{
+    local dev=$1
+    local devname=$(basename $1)
+    # /proc/partitions gives the size in 1 KiB blocks.  Match the name column
+    # exactly and stop at the first hit so at most one number comes back.
+    local size=$(awk -v name="$devname" '$4 == name { print $3; exit }' \
+        /proc/partitions)
+
+    # loop devices aren't in /proc/partitions
+    if [ -z "$size" ]; then
+        # stat reports bytes; convert to KiB so both sources use one unit.
+        # NOTE(review): the previous "ls -l" fallback left the value in
+        # bytes, so the 10 GB threshold below acted as 10 MiB here.
+        size=$(stat -L -c %s "$dev" 2>/dev/null) || size=0
+        size=$((${size:-0} / 1024))
+    fi
+
+    size=$((size / 1024 / 1024)) # GiB
+
+    local partial_arg=""
+    # Run in partial (fast) mode if the size
+    # of a partition > 10 GB
+    if ((size > 10)); then
+        partial_arg="-p"
+    fi
+
+    # $partial_arg is left unquoted on purpose: when empty it must vanish.
+    llverdev --force $partial_arg "$dev"
+}