X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Ftests%2Fobdfilter-survey.sh;h=23e2156fedab0af539d06004f7701af0cc74b2e2;hp=66ec822d8e6644c6b5ee13a9499364c1df407327;hb=56f69854dae234fa974ab4f1dff909aea601a592;hpb=16ddb77519b26ea8df18b5abd84afb03d08c47dc

diff --git a/lustre/tests/obdfilter-survey.sh b/lustre/tests/obdfilter-survey.sh
index 66ec822..23e2156 100644
--- a/lustre/tests/obdfilter-survey.sh
+++ b/lustre/tests/obdfilter-survey.sh
@@ -1,34 +1,27 @@
 #!/bin/bash
-#set -x
 set -e
 
-LUSTRE=${LUSTRE:-`dirname $0`/..}
+LUSTRE=${LUSTRE:-$(dirname $0)/..}
 . $LUSTRE/tests/test-framework.sh
 init_test_env $@
+init_logging
 
-nobjhi=${nobjhi:-1}
-thrhi=${thrhi:-16}
-size=${size:-1024}
+# bug number for skipped test:
+ALWAYS_EXCEPT="$OBDFILTER_SURVEY_EXCEPT "
+# UPDATE THE COMMENT ABOVE WITH BUG NUMBERS WHEN CHANGING ALWAYS_EXCEPT!
 
-# the summary file a bit smaller than OSTSIZE
-. ${CONFIG:=$LUSTRE/tests/cfg/$NAME.sh}
+build_test_filter
 
 [ "$SLOW" = no ] && { nobjhi=1; thrhi=4; }
+nobjhi=${nobjhi:-1}
+thrhi=${thrhi:-16}
+size=${size:-1024}
 thrlo=${thrlo:-$(( thrhi / 2))}
 
-# Skip these tests
-# bug number   23791 23791
-ALWAYS_EXCEPT="1b    2b    $OBDFILTER_SURVEY_EXCEPT"
-
 OBDSURVEY=${OBDSURVEY:-$(which obdfilter-survey)}
 
-build_test_filter
 check_and_setup_lustre
 
-min_ost_size () {
-    $LCTL get_param -n osc.*.kbytesavail | sort -n | head -n1
-}
-
 # FIXME: the summary file a bit smaller than OSTSIZE, add estimation
 minsize=$(min_ost_size)
 if [ $(( size * 1024 )) -ge $minsize  ]; then
@@ -37,20 +30,27 @@ if [ $(( size * 1024 )) -ge $minsize  ]; then
 fi
 
 get_targets () {
-        local targets
-        local devs
-        local oss
-
-        for oss in $(osts_nodes); do
-                devs=$(do_node $oss "lctl dl |grep obdfilter |sort" | awk '{print $4}')
-                for d in $devs; do
-                        # if oss is local -- obdfilter-survey needs dev wo/ host
-                        target=$d
-                        [[ $oss = `hostname` ]] || target=$oss:$target
-                        targets="$targets $target"
-                done
-        done
-
+	local targets
+	local target
+	local dev
+	local nid
+	local osc
+
+	for osc in $($LCTL get_param -N osc.${FSNAME}-*osc-*); do
+		nid=$($LCTL get_param $osc.import |
+			awk '/current_connection:/ {sub(/@.*/,""); print $2}')
+		dev=$(echo $osc | sed -e 's/^osc\.//' -e 's/-osc.*//')
+		target=$dev
+
+		# For local disk obdfilter-survey requires target devs w/o nid.
+		# obdfilter-survey :
+		# case 1 (local disk):
+		#    $ nobjhi=2 thrhi=2 size=1024
+		#      targets="$nid:$FSNAME-OST0000 $nid:$FSNAME-OST0001 ..."
+		#                 ./obdfilter-survey
+		local_node && [ "$1" == "disk" ] || target=$nid:$target
+		targets="$targets $target"
+	done
 	echo $targets
 }
 
@@ -59,9 +59,9 @@ obdflter_survey_targets () {
 	local targets
 
 	case $case in
-		disk)    targets=$(get_targets);;
-		netdisk) targets=$(get_targets);;
-		network) targets="$(osts_nodes)";;
+		disk)    targets=$(get_targets $case);;
+		netdisk) targets=$(get_targets $case);;
+		network) targets=$(host_nids_address $(comma_list $(osts_nodes)) $NETTYPE);;
 		*) error "unknown obdflter-survey case!" ;;
 	esac
 	echo $targets
@@ -76,78 +76,46 @@ obdflter_survey_run () {
 	local cmd="NETTYPE=$NETTYPE thrlo=$thrlo nobjhi=$nobjhi thrhi=$thrhi size=$size case=$case rslt_loc=${TMP} targets=\"$targets\" $OBDSURVEY"
 	echo + $cmd
 	eval $cmd
+	local rc=$?
 
 	cat ${TMP}/obdfilter_survey*
+	[ $rc = 0 ] || error "$OBDSURVEY failed: $rc"
 }
+
 test_1a () {
 	obdflter_survey_run disk
 }
 run_test 1a "Object Storage Targets survey"
 
-print_jbd () {
-	local file=$1
-	local facet=$2
-	local varsvc=${facet}_svc
-	local dev=$(ldiskfs_canon "*.${!varsvc}.mntdev" $facet)
-
-	# ext4: /proc/fs/jbd2/sda1:8/history 
-	# ext3: /proc/fs/jbd/sdb1/history
-
-	do_facet $facet cat /proc/fs/jbd*/${dev}*/$file
-}
-
-check_jbd_values () {
-	local facet=$1
-	local thrhi=$2
-
-	# last two lines from history
-	# $4: run >= 5000
-	# $8: hndls >= thrhi * 2
-	local hist=("$(print_jbd history $facet | tail -3 | head -2)")
-	echo "$hist"
-	local run=($(echo "${hist[*]}" | awk '{print $4}'))
-	local hndls=($(echo "${hist[*]}" | awk '{print $8}'))
-
-	local rc=0
-	for (( i=0; i<1; i++)); do
-		[[ ${run[i]} -lt 5000 ]] && \
-			error "$facet: run expected 5000, have ${run[i]}" && rc=1
-		[[ ${hndls[i]} -lt $((thrhi * 2)) ]] && \
-			error "$facet: hndls expected > $((thrhi * 2)), have ${hndls[i]}" && rc=2
-	done
-	return $rc
-}
-
-check_jbd_values_facets () {
-	local facets=$1
-	local thrhi=$2
-	local facet
-	local rc=0
-	for facet in  ${facets//,/ }; do
-		check_jbd_values $facet $thrhi || rc=$((rc+$?))
-	done
-	return $rc
-}
-
 test_1b () {
 	local param_file=$TMP/$tfile-params
 
-	do_nodesv $(comma_list $(osts_nodes)) lctl get_param obdfilter.${FSNAME}-*.sync_journal
-
-	save_lustre_params $(comma_list $(osts_nodes)) "obdfilter.${FSNAME}-*.sync_journal" >$param_file
-	do_nodesv $(comma_list $(osts_nodes)) lctl set_param obdfilter.${FSNAME}-*.sync_journal=0
+	do_nodesv $(comma_list $(osts_nodes)) \
+		$LCTL get_param obdfilter.${FSNAME}-*.sync_journal
+	save_lustre_params $(get_facets OST) \
+		"obdfilter.${FSNAME}-*.sync_journal" > $param_file
+	do_nodesv $(comma_list $(osts_nodes)) \
+		$LCTL set_param obdfilter.${FSNAME}-*.sync_journal=0
 
+	local stime=$(date +%s)
 	thrlo=4 nobjhi=1 thrhi=4 obdflter_survey_run disk
+	local etime=$(date +%s)
+	# run time of obd survey
+	local rtime=$((etime - stime))
 
-	check_jbd_values_facets $(get_facets OST) 4 || rc=$((rc+$?))
-
+	echo "obd survey finished in $rtime seconds"
 	restore_lustre_params < $param_file
 
 	rm -f $param_file
-	return $rc
 }
 run_test 1b "Object Storage Targets survey, async journal"
 
+test_1c () {
+	nobjlo=1 nobjhi=1 thrlo=32 thrhi=32 rszlo=1024 rszhi=1024 size=8192\
+	obdflter_survey_run disk
+}
+run_test 1c "Object Storage Targets survey, big batch"
+
 test_2a () {
 	obdflter_survey_run netdisk
 }
@@ -156,29 +124,38 @@ run_test 2a "Stripe F/S over the Network"
 test_2b () {
 	local param_file=$TMP/$tfile-params
 
-	do_nodesv $(comma_list $(osts_nodes)) lctl get_param obdfilter.${FSNAME}-*.sync_journal
-
-	save_lustre_params $(comma_list $(osts_nodes)) "obdfilter.${FSNAME}-*.sync_journal" >$param_file
-	do_nodesv $(comma_list $(osts_nodes)) lctl set_param obdfilter.${FSNAME}-*.sync_journal=0
+	do_nodesv $(comma_list $(osts_nodes)) \
+		$LCTL get_param obdfilter.${FSNAME}-*.sync_journal
+	save_lustre_params $(get_facets OST) \
+		"obdfilter.${FSNAME}-*.sync_journal" > $param_file
+	do_nodesv $(comma_list $(osts_nodes)) \
+		$LCTL set_param obdfilter.${FSNAME}-*.sync_journal=0
 
+	local stime=$(date +%s)
 	thrlo=4 nobjhi=1 thrhi=4 obdflter_survey_run netdisk
+	local etime=$(date +%s)
+	local rtime=$((etime - stime))
 
-	check_jbd_values_facets $(get_facets OST) 4 || rc=$((rc+$?))
-
+	echo "obd survey finished in $rtime seconds"
 	restore_lustre_params < $param_file
 
 	rm -f $param_file
-	return $rc
 }
 run_test 2b "Stripe F/S over the Network, async journal"
 
 
 # README.obdfilter-survey: In network test only automated run is supported.
 test_3a () {
-	remote_servers || { skip "Local servers" && return 0; }
+	# obdfilter-survey Prerequisite:
+	#    For "network" case  you need to have all
+	#    modules (those llmount.sh loads) loaded in kernel. And the
+	#    'lctl dl' output must be blank.
+	# Skipping test for CLIENTONLY mode because of
+	# cleanupall()->stopall() does not cleanup the servers on this mode.
+	[ "$CLIENTONLY" ] && skip "CLIENTONLY mode"
+
+	remote_servers || skip "Local servers"
 
-	# The Network survey test needs:
-	# Start lctl and check for the device list. The device list must be empty.
 	cleanupall
 
 	obdflter_survey_run network
@@ -187,7 +164,7 @@ test_3a () {
 }
 run_test 3a "Network survey"
 
-equals_msg `basename $0`: test complete, cleaning up
+complete $SECONDS
 cleanup_echo_devs
 check_and_cleanup_lustre
-[ -f "$TESTSUITELOG" ] && cat $TESTSUITELOG && grep -q FAIL $TESTSUITELOG && exit 1 || true
+exit_status