X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Ftests%2Fobdfilter-survey.sh;h=94a5182f620619b742b9060fc8afd8321f10717c;hp=1e1284b0978dfbae4a4a0c50c019bda5053a43cd;hb=e3d507eec50fc1ff79acf2a9f93d52d698c887d7;hpb=cec72a356891eaa729314a7bc89c4b2aaef0a31b diff --git a/lustre/tests/obdfilter-survey.sh b/lustre/tests/obdfilter-survey.sh index 1e1284b..94a5182 100644 --- a/lustre/tests/obdfilter-survey.sh +++ b/lustre/tests/obdfilter-survey.sh @@ -5,7 +5,6 @@ set -e LUSTRE=${LUSTRE:-`dirname $0`/..} . $LUSTRE/tests/test-framework.sh init_test_env $@ -init_logging nobjhi=${nobjhi:-1} thrhi=${thrhi:-16} @@ -13,6 +12,7 @@ size=${size:-1024} # the summary file a bit smaller than OSTSIZE . ${CONFIG:=$LUSTRE/tests/cfg/$NAME.sh} +init_logging [ "$SLOW" = no ] && { nobjhi=1; thrhi=4; } thrlo=${thrlo:-$(( thrhi / 2))} @@ -33,17 +33,24 @@ if [ $(( size * 1024 )) -ge $minsize ]; then echo min kbytesavail: $minsize using size=${size} MBytes per obd instance fi +get_devs() { + echo $(do_nodes $1 'lctl dl | grep obdfilter' | \ + awk '{print $4}' | sort -u) +} + get_targets () { local targets local devs + local nid local oss for oss in $(osts_nodes); do - devs=$(do_node $oss "lctl dl |grep obdfilter |sort" | awk '{print $4}') + devs=$(get_devs $oss) + nid=$(host_nids_address $oss $NETTYPE) for d in $devs; do # if oss is local -- obdfilter-survey needs dev wo/ host target=$d - [[ $oss = `hostname` ]] || target=$oss:$target + [[ $oss = `hostname` && "$1" == "disk" ]] || target=$nid:$target targets="$targets $target" done done @@ -56,9 +63,9 @@ obdflter_survey_targets () { local targets case $case in - disk) targets=$(get_targets);; - netdisk) targets=$(get_targets);; - network) targets="$(osts_nodes)";; + disk) targets=$(get_targets $case);; + netdisk) targets=$(get_targets $case);; + network) targets=$(host_nids_address $(comma_list $(osts_nodes)) $NETTYPE);; *) error "unknown obdflter-survey case!" ;; esac echo $targets @@ -87,7 +94,7 @@ print_jbd () { local varsvc=${facet}_svc local dev=$(ldiskfs_canon "*.${!varsvc}.mntdev" $facet) - # ext4: /proc/fs/jbd2/sda1:8/history + # ext4: /proc/fs/jbd2/sda1:8/history # ext3: /proc/fs/jbd/sdb1/history do_facet $facet cat /proc/fs/jbd*/${dev}*/$file @@ -96,11 +103,14 @@ print_jbd () { check_jbd_values () { local facet=$1 local thrhi=$2 + local rtime=$3 # last two lines from history # $4: run >= 5000 # $8: hndls >= thrhi * 2 - local hist=("$(print_jbd history $facet | tail -3 | head -2)") + # display history of rtime/4 before, in case obd cleanup consumes time + local tlines=$((rtime / 5 / 4 + 1)) + local hist=("$(print_jbd history $facet | tail -$tlines | head -n1)") echo "$hist" local run=($(echo "${hist[*]}" | awk '{print $4}')) local hndls=($(echo "${hist[*]}" | awk '{print $8}')) @@ -118,10 +128,11 @@ check_jbd_values () { check_jbd_values_facets () { local facets=$1 local thrhi=$2 + local rtime=$3 local facet local rc=0 for facet in ${facets//,/ }; do - check_jbd_values $facet $thrhi || rc=$((rc+$?)) + check_jbd_values $facet $thrhi $rtime || rc=$((rc+$?)) done return $rc } @@ -129,14 +140,21 @@ check_jbd_values_facets () { test_1b () { local param_file=$TMP/$tfile-params - do_nodesv $(comma_list $(osts_nodes)) lctl get_param obdfilter.${FSNAME}-*.sync_journal - - save_lustre_params $(comma_list $(osts_nodes)) "obdfilter.${FSNAME}-*.sync_journal" >$param_file - do_nodesv $(comma_list $(osts_nodes)) lctl set_param obdfilter.${FSNAME}-*.sync_journal=0 + do_nodesv $(comma_list $(osts_nodes)) \ + $LCTL get_param obdfilter.${FSNAME}-*.sync_journal + save_lustre_params $(get_facets OST) \ + "obdfilter.${FSNAME}-*.sync_journal" > $param_file + do_nodesv $(comma_list $(osts_nodes)) \ + $LCTL set_param obdfilter.${FSNAME}-*.sync_journal=0 + local stime=$(date +%s) thrlo=4 nobjhi=1 thrhi=4 obdflter_survey_run disk + local etime=$(date +%s) + # run time of obd survey + local rtime=$((etime - stime)) - check_jbd_values_facets $(get_facets OST) 4 || rc=$((rc+$?)) + echo "obd survey finished in $rtime seconds" + check_jbd_values_facets $(get_facets OST) 4 $rtime || rc=$((rc+$?)) restore_lustre_params < $param_file @@ -145,6 +163,12 @@ test_1b () { } run_test 1b "Object Storage Targets survey, async journal" +test_1c () { + nobjlo=1 nobjhi=1 thrlo=32 thrhi=32 rszlo=1024 rszhi=1024 size=8192\ + obdflter_survey_run disk +} +run_test 1c "Object Storage Targets survey, big batch" + test_2a () { obdflter_survey_run netdisk } @@ -153,14 +177,20 @@ run_test 2a "Stripe F/S over the Network" test_2b () { local param_file=$TMP/$tfile-params - do_nodesv $(comma_list $(osts_nodes)) lctl get_param obdfilter.${FSNAME}-*.sync_journal - - save_lustre_params $(comma_list $(osts_nodes)) "obdfilter.${FSNAME}-*.sync_journal" >$param_file - do_nodesv $(comma_list $(osts_nodes)) lctl set_param obdfilter.${FSNAME}-*.sync_journal=0 + do_nodesv $(comma_list $(osts_nodes)) \ + $LCTL get_param obdfilter.${FSNAME}-*.sync_journal + save_lustre_params $(get_facets OST) \ + "obdfilter.${FSNAME}-*.sync_journal" > $param_file + do_nodesv $(comma_list $(osts_nodes)) \ + $LCTL set_param obdfilter.${FSNAME}-*.sync_journal=0 + local stime=$(date +%s) thrlo=4 nobjhi=1 thrhi=4 obdflter_survey_run netdisk + local etime=$(date +%s) + local rtime=$((etime - stime)) - check_jbd_values_facets $(get_facets OST) 4 || rc=$((rc+$?)) + echo "obd survey finished in $rtime seconds" + check_jbd_values_facets $(get_facets OST) 4 $rtime || rc=$((rc+$?)) restore_lustre_params < $param_file @@ -184,7 +214,7 @@ test_3a () { } run_test 3a "Network survey" -complete $(basename $0) $SECONDS +complete $SECONDS cleanup_echo_devs check_and_cleanup_lustre exit_status