X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Ftests%2Fsanity.sh;h=07527027bc0804704b406778774604fca04569ce;hp=a32da55cef426365bb326a9f84c38dbbebf0be62;hb=219e03a261e510e1551ab0695633cc4d2f5196fb;hpb=d88d6cfc5ae37da2ce4c834543a4afd980e04c4e diff --git a/lustre/tests/sanity.sh b/lustre/tests/sanity.sh index a32da55..0752702 100644 --- a/lustre/tests/sanity.sh +++ b/lustre/tests/sanity.sh @@ -1,4 +1,6 @@ #!/bin/bash +# -*- mode: Bash; tab-width: 4; indent-tabs-mode: t; -*- +# vim:autoindent:shiftwidth=4:tabstop=4: # # Run select tests by setting ONLY, or as arguments to the script. # Skip specific tests by setting EXCEPT. @@ -7,8 +9,8 @@ set -e ONLY=${ONLY:-"$*"} -# bug number for skipped test: 16823 13297 2108 9789 3637 9789 3561 12622 12653 12653 5188 10764 16260 -ALWAYS_EXCEPT=" 27s 27u 42a 42b 42c 42d 45 51d 65a 65e 68b 75 119d $SANITY_EXCEPT" +# bug number for skipped test: 13297 2108 9789 3637 9789 3561 12622 12653 12653 5188 16260 19742 +ALWAYS_EXCEPT=" 27u 42a 42b 42c 42d 45 51d 65a 65e 68b $SANITY_EXCEPT" # bug number for skipped test: 2108 9789 3637 9789 3561 5188/5749 1443 #ALWAYS_EXCEPT=${ALWAYS_EXCEPT:-"27m 42a 42b 42c 42d 45 68 76"} # UPDATE THE COMMENT ABOVE WITH BUG NUMBERS WHEN CHANGING ALWAYS_EXCEPT! @@ -40,7 +42,6 @@ GETSTRIPE=${GETSTRIPE:-"$LFS getstripe"} LSTRIPE=${LSTRIPE:-"$LFS setstripe"} LFIND=${LFIND:-"$LFS find"} LVERIFY=${LVERIFY:-ll_dirstripe_verify} -LSTRIPEINFO=${LSTRIPEINFO:-ll_getstripe_info} LCTL=${LCTL:-lctl} MCREATE=${MCREATE:-mcreate} OPENFILE=${OPENFILE:-openfile} @@ -71,8 +72,9 @@ LUSTRE=${LUSTRE:-$(cd $(dirname $0)/..; echo $PWD)} . $LUSTRE/tests/test-framework.sh init_test_env $@ . 
${CONFIG:=$LUSTRE/tests/cfg/${NAME}.sh} +init_logging -[ "$SLOW" = "no" ] && EXCEPT_SLOW="24o 27m 36f 36g 51b 51c 60c 63 64b 68 71 73 77f 78 101 103 115 120g 124b" +[ "$SLOW" = "no" ] && EXCEPT_SLOW="24o 24v 27m 36f 36g 36h 51b 51c 60c 63 64b 68 71 73 77f 78 101 103 115 120g 124b" SANITYLOG=${TESTSUITELOG:-$TMP/$(basename $0 .sh).log} FAIL_ON_ERROR=false @@ -90,11 +92,12 @@ setup() { } check_kernel_version() { - VERSION_FILE=version WANT_VER=$1 - GOT_VER=$(lctl get_param -n $VERSION_FILE | awk '/kernel:/ {print $2}') - [ $GOT_VER == "patchless" ] && return 0 - [ $GOT_VER -ge $WANT_VER ] && return 0 + GOT_VER=$(lctl get_param -n version | awk '/kernel:/ {print $2}') + case $GOT_VER in + patchless|patchless_client) return 0;; + *) [ $GOT_VER -ge $WANT_VER ] && return 0 ;; + esac log "test needs at least kernel version $WANT_VER, running $GOT_VER" return 1 } @@ -246,7 +249,7 @@ test_6a() { run_test 6a "touch .../f6a; chmod .../f6a ======================" test_6b() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return if [ ! -f $DIR/f6a ]; then touch $DIR/f6a chmod 0666 $DIR/f6a @@ -257,7 +260,7 @@ test_6b() { run_test 6b "$RUNAS chmod .../f6a (should return error) ==" test_6c() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return touch $DIR/f6c chown $RUNAS_ID $DIR/f6c || error $CHECKSTAT -t file -u \#$RUNAS_ID $DIR/f6c || error @@ -265,7 +268,7 @@ test_6c() { run_test 6c "touch .../f6c; chown .../f6c ======================" test_6d() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return if [ ! 
-f $DIR/f6c ]; then touch $DIR/f6c chown $RUNAS_ID $DIR/f6c @@ -276,7 +279,7 @@ test_6d() { run_test 6d "$RUNAS chown .../f6c (should return error) ==" test_6e() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return touch $DIR/f6e chgrp $RUNAS_ID $DIR/f6e || error $CHECKSTAT -t file -u \#$UID -g \#$RUNAS_ID $DIR/f6e || error @@ -284,7 +287,7 @@ test_6e() { run_test 6e "touch .../f6e; chgrp .../f6e ======================" test_6f() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return if [ ! -f $DIR/f6e ]; then touch $DIR/f6e chgrp $RUNAS_ID $DIR/f6e @@ -295,7 +298,7 @@ test_6f() { run_test 6f "$RUNAS chgrp .../f6e (should return error) ==" test_6g() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return mkdir $DIR/d6g || error chmod 777 $DIR/d6g || error $RUNAS mkdir $DIR/d6g/d || error @@ -306,7 +309,7 @@ test_6g() { run_test 6g "Is new dir in sgid dir inheriting group?" 
test_6h() { # bug 7331 - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return touch $DIR/f6h || error "touch failed" chown $RUNAS_ID:$RUNAS_ID $DIR/f6h || error "initial chown failed" $RUNAS -G$RUNAS_ID chown $RUNAS_ID:0 $DIR/f6h && error "chown worked" @@ -473,6 +476,26 @@ test_17g() { } run_test 17g "symlinks: really long symlink name ===============================" +test_17h() { #bug 17378 + mkdir -p $DIR/$tdir + $SETSTRIPE $DIR/$tdir -c -1 +#define OBD_FAIL_MDS_LOV_PREP_CREATE 0x141 + do_facet mds lctl set_param fail_loc=0x80000141 + touch $DIR/$tdir/$tfile || true +} +run_test 17h "create objects: lov_free_memmd() doesn't lbug" + +test_17i() { #bug 20018 + mkdir -p $DIR/$tdir + local foo=$DIR/$tdir/$tfile + ln -s $foo $foo || error "create symlink failed" +#define OBD_FAIL_MDS_READLINK_EPROTO 0x143 + do_facet mds lctl set_param fail_loc=0x80000143 + ls -l $foo && error "error not detected" + return 0 +} +run_test 17i "don't panic on short symlink" + test_18() { touch $DIR/f ls $DIR || error @@ -493,7 +516,7 @@ test_19b() { run_test 19b "ls -l .../f19 (should return error) ==============" test_19c() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return $RUNAS touch $DIR/f19 && error || true } run_test 19c "$RUNAS touch .../f19 (should return error) ==" @@ -541,7 +564,8 @@ test_22() { } run_test 22 "unpack tar archive as non-root user ===============" -test_23() { +# was test_23 +test_23a() { mkdir -p $DIR/$tdir local file=$DIR/$tdir/$tfile @@ -549,7 +573,19 @@ test_23() { openfile -f O_CREAT:O_EXCL $file && error "$file recreate succeeded" || true } -run_test 23 "O_CREAT|O_EXCL in subdir ==========================" +run_test 23a "O_CREAT|O_EXCL in subdir ==========================" + +test_23b() { # bug 18988 + mkdir -p $DIR/$tdir + local 
file=$DIR/$tdir/$tfile + + rm -f $file + echo foo > $file || error "write filed" + echo bar >> $file || error "append filed" + $CHECKSTAT -s 8 $file || error "wrong size" + rm $file +} +run_test 23b "O_APPEND check ==========================" test_24a() { echo '== rename sanity ==============================================' @@ -633,7 +669,7 @@ test_24i() { mrename $DIR/R9/f $DIR/R9/a $CHECKSTAT -t file $DIR/R9/f || error $CHECKSTAT -t dir $DIR/R9/a || error - $CHECKSTAT -a file $DIR/R9/a/f || error + $CHECKSTAT -a $DIR/R9/a/f || error } run_test 24i "rename file to dir error: touch f ; mkdir a ; rename f a" @@ -746,6 +782,21 @@ test_24u() { # bug12192 } run_test 24u "create stripe file" +test_24v() { + local NRFILES=100000 + local FREE_INODES=`lfs df -i|grep "filesystem summary" | awk '{print $5}'` + [ $FREE_INODES -lt $NRFILES ] && \ + skip "not enough free inodes $FREE_INODES required $NRFILES" && \ + return + + mkdir -p $DIR/d24v + createmany -m $DIR/d24v/$tfile $NRFILES + ls $DIR/d24v >/dev/null || error "error in listing large dir" + + rm $DIR/d24v -rf +} +run_test 24v "list directory with large files (handle hash collision, bug: 17560)" + test_25a() { echo '== symlink sanity =============================================' @@ -829,7 +880,7 @@ test_27a() { run_test 27a "one stripe file ==================================" test_27c() { - [ "$OSTCOUNT" -lt "2" ] && skip "skipping 2-stripe test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping 2-stripe test" && return mkdir -p $DIR/d27 $SETSTRIPE $DIR/d27/f01 -c 2 || error "lstripe failed" [ `$GETSTRIPE $DIR/d27/f01 | grep -A 10 obdidx | wc -l` -eq 4 ] || @@ -906,7 +957,7 @@ test_27l() { run_test 27l "check setstripe permissions (should return error)" test_27m() { - [ "$OSTCOUNT" -lt "2" ] && skip "$OSTCOUNT < 2 OSTs -- skipping" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "$OSTCOUNT < 2 OSTs -- skipping" && return if [ $ORIGFREE -gt $MAXFREE ]; then skip "$ORIGFREE > $MAXFREE skipping out-of-space 
test on OST0" return @@ -933,22 +984,30 @@ test_27m() { } run_test 27m "create file while OST0 was full ==================" -# osc's keep a NOSPC stick flag that gets unset with rmdir +sleep_maxage() { + local DELAY=$(do_facet mds lctl get_param -n lov.*.qos_maxage | head -n 1 | awk '{print $1 * 2}') + sleep $DELAY +} + +# OSCs keep a NOSPC flag that will be reset after ~5s (qos_maxage) +# if the OST isn't full anymore. reset_enospc() { - local FAIL_LOC=${1:-0} - local OSTIDX=${2:-""} + local OSTIDX=${1:-""} - mkdir -p $DIR/d27/nospc - rmdir $DIR/d27/nospc local list=$(comma_list $(osts_nodes)) [ "$OSTIDX" ] && list=$(facet_host ost$((OSTIDX + 1))) - do_nodes $list lctl set_param fail_loc=$FAIL_LOC + do_nodes $list lctl set_param fail_loc=0 + sleep_maxage } exhaust_precreations() { local OSTIDX=$1 - local MDSIDX=$(get_mds_dir "$DIR/d27") + local FAILLOC=$2 + local FAILIDX=${3:-$OSTIDX} + + mkdir -p $DIR/$tdir + local MDSIDX=$(get_mds_dir "$DIR/$tdir") echo OSTIDX=$OSTIDX MDSIDX=$MDSIDX local OST=$(lfs osts | grep ${OSTIDX}": " | \ @@ -960,111 +1019,111 @@ exhaust_precreations() { local last_id=$(do_facet mds${MDSIDX} lctl get_param -n osc.*${OST}-osc-${MDT_INDEX}.prealloc_last_id) local next_id=$(do_facet mds${MDSIDX} lctl get_param -n osc.*${OST}-osc-${MDT_INDEX}.prealloc_next_id) - echo ${OST}-osc-${MDT_INDEX}.prealloc_last_id=$last_id - echo ${OST}-osc-${MDT_INDEX}.prealloc_next_id=$next_id + do_facet mds${MDSIDX} lctl get_param osc.*OST*-osc-${MDT_INDEX}.prealloc* - mkdir -p $DIR/d27 - $SETSTRIPE $DIR/d27 -i $OSTIDX -c 1 + mkdir -p $DIR/$tdir/${OST} + $SETSTRIPE $DIR/$tdir/${OST} -i $OSTIDX -c 1 #define OBD_FAIL_OST_ENOSPC 0x215 + do_facet ost$((OSTIDX + 1)) lctl set_param fail_val=$FAILIDX do_facet ost$((OSTIDX + 1)) lctl set_param fail_loc=0x215 echo "Creating to objid $last_id on ost $OST..." 
- createmany -o $DIR/d27/${OST}-f $next_id $((last_id - next_id + 2)) - do_facet mds${MDSIDX} lctl get_param osc.*${OST}-osc-${MDT_INDEX}.prealloc* | grep '[0-9]' - reset_enospc $2 $OSTIDX + createmany -o $DIR/$tdir/${OST}/f $next_id $((last_id - next_id + 2)) + do_facet mds${MDSIDX} lctl get_param osc.*OST*-osc-${MDT_INDEX}.prealloc* + do_facet ost$((OSTIDX + 1)) lctl set_param fail_loc=$FAILLOC + sleep_maxage } exhaust_all_precreations() { local i for (( i=0; i < OSTCOUNT; i++ )) ; do - exhaust_precreations $i 0x215 + exhaust_precreations $i $1 -1 done - reset_enospc $1 } test_27n() { - [ "$OSTCOUNT" -lt "2" ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return remote_ost_nodsh && skip "remote OST with nodsh" && return reset_enospc - rm -f $DIR/d27/f27n - $SETSTRIPE $DIR/d27 -c 1 -i -1 + rm -f $DIR/$tdir/$tfile exhaust_precreations 0 0x80000215 - - touch $DIR/d27/f27n || error - + $SETSTRIPE -c -1 $DIR/$tdir + touch $DIR/$tdir/$tfile || error + $GETSTRIPE $DIR/$tdir/$tfile reset_enospc } run_test 27n "create file with some full OSTs ==================" test_27o() { - [ "$OSTCOUNT" -lt "2" ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return remote_ost_nodsh && skip "remote OST with nodsh" && return reset_enospc - rm -f $DIR/d27/f27o + rm -f $DIR/$tdir/$tfile exhaust_all_precreations 0x215 - sleep 5 - touch $DIR/d27/f27o && error "able to create $DIR/d27/f27o" + touch $DIR/$tdir/$tfile && error "able to create $DIR/$tdir/$tfile" reset_enospc - rm -rf $DIR/d27/* + rm -rf $DIR/$tdir/* } run_test 27o "create file with all full OSTs (should error) ====" test_27p() { - [ "$OSTCOUNT" -lt "2" ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return remote_ost_nodsh && 
skip "remote OST with nodsh" && return reset_enospc - rm -f $DIR/d27/f27p + rm -f $DIR/$tdir/$tfile + mkdir -p $DIR/$tdir - $MCREATE $DIR/d27/f27p || error "mcreate failed" - $TRUNCATE $DIR/d27/f27p 80000000 || error "truncate failed" - $CHECKSTAT -s 80000000 $DIR/d27/f27p || error "checkstat failed" + $MCREATE $DIR/$tdir/$tfile || error "mcreate failed" + $TRUNCATE $DIR/$tdir/$tfile 80000000 || error "truncate failed" + $CHECKSTAT -s 80000000 $DIR/$tdir/$tfile || error "checkstat failed" exhaust_precreations 0 0x80000215 - echo foo >> $DIR/d27/f27p || error "append failed" - $CHECKSTAT -s 80000004 $DIR/d27/f27p || error "checkstat failed" + echo foo >> $DIR/$tdir/$tfile || error "append failed" + $CHECKSTAT -s 80000004 $DIR/$tdir/$tfile || error "checkstat failed" + $LFS getstripe $DIR/$tdir/$tfile reset_enospc } run_test 27p "append to a truncated file with some full OSTs ===" test_27q() { - [ "$OSTCOUNT" -lt "2" ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return remote_ost_nodsh && skip "remote OST with nodsh" && return reset_enospc - rm -f $DIR/d27/f27q + rm -f $DIR/$tdir/$tfile - $MCREATE $DIR/d27/f27q || error "mcreate $DIR/d27/f27q failed" - $TRUNCATE $DIR/d27/f27q 80000000 ||error "truncate $DIR/d27/f27q failed" - $CHECKSTAT -s 80000000 $DIR/d27/f27q || error "checkstat failed" + $MCREATE $DIR/$tdir/$tfile || error "mcreate $DIR/$tdir/$tfile failed" + $TRUNCATE $DIR/$tdir/$tfile 80000000 ||error "truncate $DIR/$tdir/$tfile failed" + $CHECKSTAT -s 80000000 $DIR/$tdir/$tfile || error "checkstat failed" exhaust_all_precreations 0x215 - echo foo >> $DIR/d27/f27q && error "append succeeded" - $CHECKSTAT -s 80000000 $DIR/d27/f27q || error "checkstat 2 failed" + echo foo >> $DIR/$tdir/$tfile && error "append succeeded" + $CHECKSTAT -s 80000000 $DIR/$tdir/$tfile || error "checkstat 2 failed" reset_enospc } run_test 27q "append to truncated file with all OSTs 
full (should error) ===" test_27r() { - [ "$OSTCOUNT" -lt "2" ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return remote_ost_nodsh && skip "remote OST with nodsh" && return reset_enospc - rm -f $DIR/d27/f27r + rm -f $DIR/$tdir/$tfile exhaust_precreations 0 0x80000215 - $SETSTRIPE $DIR/d27/f27r -i 0 -c 2 # && error + $SETSTRIPE $DIR/$tdir/$tfile -i 0 -c 2 # && error reset_enospc } @@ -1074,7 +1133,7 @@ test_27s() { # bug 10725 mkdir -p $DIR/$tdir local stripe_size=$((4096 * 1024 * 1024)) # 2^32 local stripe_count=0 - [ $OSTCOUNT -eq 1 ] || stripe_count=2 + [ $OSTCOUNT -eq 1 ] || stripe_count=2 $SETSTRIPE $DIR/$tdir -s $stripe_size -c $stripe_count && \ error "stripe width >= 2^32 succeeded" || true @@ -1092,30 +1151,31 @@ test_27t() { # bug 10864 run_test 27t "check that utils parse path correctly" test_27u() { # bug 4900 - [ "$OSTCOUNT" -lt "2" ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return #define OBD_FAIL_MDS_OSC_PRECREATE 0x139 do_facet $SINGLEMDS lctl set_param fail_loc=0x139 - mkdir -p $DIR/d27u - createmany -o $DIR/d27u/t- 1000 + mkdir -p $DIR/$tdir + createmany -o $DIR/$tdir/t- 1000 do_facet $SINGLEMDS lctl set_param fail_loc=0 TLOG=$DIR/$tfile.getstripe - $GETSTRIPE $DIR/d27u > $TLOG + $GETSTRIPE $DIR/$tdir > $TLOG OBJS=`awk -vobj=0 '($1 == 0) { obj += 1 } END { print obj;}' $TLOG` - unlinkmany $DIR/d27u/t- 1000 + unlinkmany $DIR/$tdir/t- 1000 [ $OBJS -gt 0 ] && \ error "$OBJS objects created on OST-0. 
See $TLOG" || pass } run_test 27u "skip object creation on OSC w/o objects ==========" test_27v() { # bug 4900 - [ "$OSTCOUNT" -lt "2" ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return remote_ost_nodsh && skip "remote OST with nodsh" && return - exhaust_all_precreations + exhaust_all_precreations 0x215 + reset_enospc mkdir -p $DIR/$tdir $SETSTRIPE $DIR/$tdir -c 1 # 1 stripe / file @@ -1129,8 +1189,6 @@ test_27v() { # bug 4900 local START=`date +%s` createmany -o $DIR/$tdir/$tfile 32 - reset_enospc - local FINISH=`date +%s` local TIMEOUT=`lctl get_param -n timeout` [ $((FINISH - START)) -ge $((TIMEOUT / 2)) ] && \ @@ -1141,24 +1199,89 @@ test_27v() { # bug 4900 run_test 27v "skip object creation on slow OST =================" test_27w() { # bug 10997 - mkdir -p $DIR/d27w || error "mkdir failed" - $LSTRIPE $DIR/d27w/f0 -s 65536 || error "lstripe failed" - size=`$LSTRIPEINFO $DIR/d27w/f0 | awk {'print $1'}` + mkdir -p $DIR/$tdir || error "mkdir failed" + $LSTRIPE $DIR/$tdir/f0 -s 65536 || error "lstripe failed" + size=`$GETSTRIPE $DIR/$tdir/f0 -s` [ $size -ne 65536 ] && error "stripe size $size != 65536" || true + gsdir=$($LFS getstripe -d $DIR/$tdir) + [ $(echo $gsdir | grep -c stripe_count) -ne 1 ] && error "$LFS getstripe -d $DIR/$tdir failed" - [ "$OSTCOUNT" -lt "2" ] && skip "skipping multiple stripe count/offset test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping multiple stripe count/offset test" && return for i in `seq 1 $OSTCOUNT`; do offset=$(($i-1)) - $LSTRIPE $DIR/d27w/f$i -c $i -i $offset || error "lstripe -c $i -i $offset failed" - count=`$LSTRIPEINFO $DIR/d27w/f$i | awk {'print $2'}` - index=`$LSTRIPEINFO $DIR/d27w/f$i | awk {'print $3'}` + $LSTRIPE $DIR/$tdir/f$i -c $i -i $offset || error "lstripe -c $i -i $offset failed" + count=`$GETSTRIPE -c $DIR/$tdir/f$i` + index=`$GETSTRIPE -o $DIR/$tdir/f$i` [ $count -ne $i ] && error "stripe 
count $count != $i" || true [ $index -ne $offset ] && error "stripe offset $index != $offset" || true done } run_test 27w "check lfs setstripe -c -s -i options =============" -# createtest also checks that device nodes are created and +test_27x() { + [ "$OSTCOUNT" -lt "2" ] && skip_env "$OSTCOUNT < 2 OSTs" && return + OFFSET=$(($OSTCOUNT - 1)) + OSTIDX=0 + local OST=$(lfs osts | awk '/'${OSTIDX}': / { print $2 }' | sed -e 's/_UUID$//') + + mkdir -p $DIR/$tdir + $SETSTRIPE $DIR/$tdir -c 1 # 1 stripe per file + do_facet ost$((OSTIDX + 1)) lctl set_param -n obdfilter.$OST.degraded 1 + sleep_maxage + createmany -o $DIR/$tdir/$tfile $OSTCOUNT + for i in `seq 0 $OFFSET`; do + [ `$GETSTRIPE $DIR/$tdir/$tfile$i | grep -A 10 obdidx | awk '{print $1}' | grep -w "$OSTIDX"` ] && + error "OST0 was degraded but new created file still use it" + done + do_facet ost$((OSTIDX + 1)) lctl set_param -n obdfilter.$OST.degraded 0 +} +run_test 27x "create files while OST0 is degraded" + +test_27y() { + [ "$OSTCOUNT" -lt "2" ] && skip_env "$OSTCOUNT < 2 OSTs -- skipping" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return + + local last_id=$(do_facet $SINGLEMDS lctl get_param -n osc.*0000-osc-MDT0000.prealloc_last_id) + local next_id=$(do_facet $SINGLEMDS lctl get_param -n osc.*0000-osc-MDT0000.prealloc_next_id) + local fcount=$((last_id - next_id)) + [ $fcount -eq 0 ] && skip "not enough space on OST0" && return + [ $fcount -gt $OSTCOUNT ] && fcount=$OSTCOUNT + + MDS_OSCS=`do_facet mds lctl dl | awk '/[oO][sS][cC].*md[ts]/ { print $4 }'` + OFFSET=$(($OSTCOUNT-1)) + OST=-1 + for OSC in $MDS_OSCS; do + if [ $OST == -1 ]; then { + OST=`osc_to_ost $OSC` + } else { + echo $OSC "is Deactivate:" + do_facet mds lctl --device %$OSC deactivate + } fi + done + + OSTIDX=$(lfs osts | grep ${OST} | awk '{print $1}' | sed -e 's/://') + mkdir -p $DIR/$tdir + $SETSTRIPE $DIR/$tdir -c 1 # 1 stripe / file + + do_facet ost$OSTIDX lctl set_param -n obdfilter.$OST.degraded 1 + sleep_maxage + 
createmany -o $DIR/$tdir/$tfile $fcount + do_facet ost$OSTIDX lctl set_param -n obdfilter.$OST.degraded 0 + + for i in `seq 0 $OFFSET`; do + [ `$GETSTRIPE $DIR/$tdir/$tfile$i | grep -A 10 obdidx | awk '{print $1}'| grep -w "$OSTIDX"` ] || \ + error "files created on deactivated OSTs instead of degraded OST" + done + for OSC in $MDS_OSCS; do + [ `osc_to_ost $OSC` != $OST ] && { + echo $OSC "is activate" + do_facet mds lctl --device %$OSC activate + } + done +} +run_test 27y "create files while OST0 is degraded and the rest inactive" + +# createtest also checks that device nodes are created and # then visible correctly (#2091) test_28() { # bug 2091 mkdir $DIR/d28 @@ -1664,6 +1787,23 @@ test_34f() { # bug 6242, 6243 } run_test 34f "read from a file with no objects until EOF =======" +test_34g() { + dd if=/dev/zero of=$DIR/$tfile bs=1 count=100 seek=$TEST_34_SIZE || error + $TRUNCATE $DIR/$tfile $((TEST_34_SIZE / 2))|| error + $CHECKSTAT -s $((TEST_34_SIZE / 2)) $DIR/$tfile || error "truncate failed" + cancel_lru_locks osc + $CHECKSTAT -s $((TEST_34_SIZE / 2)) $DIR/$tfile || \ + error "wrong size after lock cancel" + + $TRUNCATE $DIR/$tfile $TEST_34_SIZE || error + $CHECKSTAT -s $TEST_34_SIZE $DIR/$tfile || \ + error "expanding truncate failed" + cancel_lru_locks osc + $CHECKSTAT -s $TEST_34_SIZE $DIR/$tfile || \ + error "wrong expanded size after lock cancel" +} +run_test 34g "truncate long file ===============================" + test_35a() { cp /bin/sh $DIR/f35a chmod 444 $DIR/f35a @@ -1701,7 +1841,7 @@ test_36d() { run_test 36d "non-root OST utime check (open, utime) ===========" test_36e() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return mkdir -p $DIR/$tdir touch $DIR/$tdir/$tfile $RUNAS utime $DIR/$tdir/$tfile && \ @@ -1709,13 +1849,15 @@ test_36e() { } run_test 36e "utime on non-owned file (should return error) ====" -test_36f() { +subr_36fh() { + 
local fl="$1" + local LANG_SAVE=$LANG + local LC_LANG_SAVE=$LC_LANG export LANG=C LC_LANG=C # for date language DATESTR="Dec 20 2000" mkdir -p $DIR/$tdir - #define OBD_FAIL_OST_BRW_PAUSE_BULK 0x214 - lctl set_param fail_loc=0x80000214 + lctl set_param fail_loc=$fl date; date +%s cp /etc/hosts $DIR/$tdir/$tfile sync & # write RPC generated with "current" inode timestamp, but delayed @@ -1730,6 +1872,13 @@ test_36f() { echo "AFTER : $LS_AFTER" && \ echo "WANT : $DATESTR" && \ error "$DIR/$tdir/$tfile timestamps changed" || true + + export LANG=$LANG_SAVE LC_LANG=$LC_LANG_SAVE +} + +test_36f() { + #define OBD_FAIL_OST_BRW_PAUSE_BULK 0x214 + subr_36fh "0x80000214" } run_test 36f "utime on file racing with OST BRW write ==========" @@ -1748,6 +1897,12 @@ test_36g() { } run_test 36g "filter mod data cache expiry =====================" +test_36h() { + #define OBD_FAIL_OST_BRW_PAUSE_BULK2 0x227 + subr_36fh "0x80000227" +} +run_test 36h "utime on file racing with OST BRW write ==========" + test_37() { mkdir -p $DIR/$tdir echo f > $DIR/$tdir/fbugfile @@ -1948,6 +2103,73 @@ test_42d() { } run_test 42d "test complete truncate of file with cached dirty data" +page_size() { + getconf PAGE_SIZE +} + +test_42e() { # bug22074 + local TDIR=$DIR/${tdir}e + local pagesz=$(page_size) + local pages=16 + local files=$((OSTCOUNT * 500)) # hopefully 500 files on each OST + local proc_osc0="osc.${FSNAME}-OST0000-osc-[^MDT]*" + local max_dirty_mb + local warmup_files + + mkdir -p $TDIR + $LFS setstripe -c 1 $TDIR + createmany -o $TDIR/f $files + + max_dirty_mb=$($LCTL get_param -n $proc_osc0/max_dirty_mb) + + # we assume that with $OSTCOUNT files, at least one of them will + # be allocated on OST0. + warmup_files=$((OSTCOUNT * max_dirty_mb)) + createmany -o $TDIR/w $warmup_files + + # write a large amount of data into one file and sync, to get good + # avail_grant number from OST. 
+ for ((i=0; i<$warmup_files; i++)); do + idx=$($LFS getstripe -i $TDIR/w$i) + [ $idx -ne 0 ] && continue + dd if=/dev/zero of=$TDIR/w$i bs="$max_dirty_mb"M count=1 + break + done + [ $i -gt $warmup_files ] && error "OST0 is still cold" + sync + $LCTL get_param $proc_osc0/cur_dirty_bytes + $LCTL get_param $proc_osc0/cur_grant_bytes + + # create as much dirty pages as we can while not to trigger the actual + # RPCs directly. but depends on the env, VFS may trigger flush during this + # period, hopefully we are good. + for ((i=0; i<$warmup_files; i++)); do + idx=$($LFS getstripe -i $TDIR/w$i) + [ $idx -ne 0 ] && continue + dd if=/dev/zero of=$TDIR/w$i bs=1M count=1 2>/dev/null + done + $LCTL get_param $proc_osc0/cur_dirty_bytes + $LCTL get_param $proc_osc0/cur_grant_bytes + + # perform the real test + $LCTL set_param $proc_osc0/rpc_stats 0 + for ((;i<$files; i++)); do + [ $($LFS getstripe -i $TDIR/f$i) -eq 0 ] || continue + dd if=/dev/zero of=$TDIR/f$i bs=$pagesz count=$pages 2>/dev/null + done + sync + $LCTL get_param $proc_osc0/rpc_stats + + $LCTL get_param $proc_osc0/rpc_stats | + while read PPR RRPC RPCT RCUM BAR WRPC WPCT WCUM; do + [ "$PPR" != "16:" ] && continue + [ $WPCT -lt 85 ] && error "$pages-page write RPCs only $WPCT% < 85%" + break # we only want the "pages per rpc" stat + done + rm -rf $TDIR +} +run_test 42e "verify sub-RPC writes are not done synchronously" + test_43() { mkdir -p $DIR/$tdir cp -p /bin/ls $DIR/$tdir/$tfile @@ -1995,7 +2217,7 @@ test_43c() { run_test 43c "md5sum of copy into lustre========================" test_44() { - [ "$OSTCOUNT" -lt "2" ] && skip "skipping 2-stripe test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping 2-stripe test" && return dd if=/dev/zero of=$DIR/f1 bs=4k count=1 seek=1023 dd if=$DIR/f1 bs=4k count=1 > /dev/null } @@ -2073,10 +2295,6 @@ test_45() { } run_test 45 "osc io page accounting ============================" -page_size() { - getconf PAGE_SIZE -} - # in a 2 stripe file (lov.sh), page 1023 maps 
to page 511 in its object. this # test tickles a bug where re-dirtying a page was failing to be mapped to the # objects offset and an assert hit when an rpc was built with 1023's mapped @@ -2094,7 +2312,7 @@ test_46() { } run_test 46 "dirtying a previously written page ================" -# test_47 is removed "Device nodes check" is moved to test_28 +# test_47 is removed "Device nodes check" is moved to test_28 test_48a() { # bug 2399 check_kernel_version 34 || return 0 @@ -2290,7 +2508,7 @@ test_51bb() { echo "mds $i: inodes count OLD ${OLDUSED[$i]} NEW ${NEWUSED[$i]}" [ ${OLDUSED[$i]} -lt ${NEWUSED[$i]} ] || rc=$((rc + 1)) done - + lctl set_param -n lmv.*.placement=$savePOLICY [ $rc -ne $MDSCOUNT ] || \ @@ -2308,7 +2526,7 @@ test_51c() { run_test 51c "rmdir .../t-0 --- .../t-$NUMTEST ====================" test_51d() { - [ "$OSTCOUNT" -lt "3" ] && skip "skipping test with few OSTs" && return + [ "$OSTCOUNT" -lt "3" ] && skip_env "skipping test with few OSTs" && return mkdir -p $DIR/d51d createmany -o $DIR/d51d/t- 1000 $LFS getstripe $DIR/d51d > $TMP/files @@ -2339,16 +2557,16 @@ test_52a() { [ -f $DIR/d52a/foo ] && chattr -a $DIR/d52a/foo mkdir -p $DIR/d52a touch $DIR/d52a/foo - chattr =a $DIR/d52a/foo || error "chattr =a failed" + chattr +a $DIR/d52a/foo || error "chattr +a failed" echo bar >> $DIR/d52a/foo || error "append bar failed" cp /etc/hosts $DIR/d52a/foo && error "cp worked" rm -f $DIR/d52a/foo 2>/dev/null && error "rm worked" link $DIR/d52a/foo $DIR/d52a/foo_link 2>/dev/null && error "link worked" echo foo >> $DIR/d52a/foo || error "append foo failed" mrename $DIR/d52a/foo $DIR/d52a/foo_ren && error "rename worked" - lsattr $DIR/d52a/foo | egrep -q "^-+a-+ $DIR/d52a/foo" || error "lsattr" + lsattr $DIR/d52a/foo | egrep -q "^-+a[-e]+ $DIR/d52a/foo" || error "lsattr" chattr -a $DIR/d52a/foo || error "chattr -a failed" - + cp -r $DIR/d52a /tmp/ rm -fr $DIR/d52a || error "cleanup rm failed" } run_test 52a "append-only flag test (should return errors) =====" 
@@ -2357,17 +2575,17 @@ test_52b() { [ -f $DIR/d52b/foo ] && chattr -i $DIR/d52b/foo mkdir -p $DIR/d52b touch $DIR/d52b/foo - chattr =i $DIR/d52b/foo || error - cat test > $DIR/d52b/foo && error - cp /etc/hosts $DIR/d52b/foo && error - rm -f $DIR/d52b/foo 2>/dev/null && error - link $DIR/d52b/foo $DIR/d52b/foo_link 2>/dev/null && error - echo foo >> $DIR/d52b/foo && error - mrename $DIR/d52b/foo $DIR/d52b/foo_ren && error + chattr +i $DIR/d52b/foo || error "chattr +i failed" + cat test > $DIR/d52b/foo && error "cat test worked" + cp /etc/hosts $DIR/d52b/foo && error "cp worked" + rm -f $DIR/d52b/foo 2>/dev/null && error "rm worked" + link $DIR/d52b/foo $DIR/d52b/foo_link 2>/dev/null && error "link worked" + echo foo >> $DIR/d52b/foo && error "echo worked" + mrename $DIR/d52b/foo $DIR/d52b/foo_ren && error "rename worked" [ -f $DIR/d52b/foo ] || error [ -f $DIR/d52b/foo_ren ] && error - lsattr $DIR/d52b/foo | egrep -q "^-+i-+ $DIR/d52b/foo" || error - chattr -i $DIR/d52b/foo || error + lsattr $DIR/d52b/foo | egrep -q "^-+i[-e]+ $DIR/d52b/foo" || error "lsattr" + chattr -i $DIR/d52b/foo || error "chattr failed" rm -fr $DIR/d52b || error } @@ -2399,8 +2617,8 @@ test_53() { run_test 53 "verify that MDS and OSTs agree on pre-creation ====" test_54a() { - [ ! -f "$SOCKETSERVER" ] && skip "no socketserver, skipping" && return - [ ! -f "$SOCKETCLIENT" ] && skip "no socketclient, skipping" && return + [ ! -f "$SOCKETSERVER" ] && skip_env "no socketserver, skipping" && return + [ ! 
-f "$SOCKETCLIENT" ] && skip_env "no socketclient, skipping" && return $SOCKETSERVER $DIR/socket $SOCKETCLIENT $DIR/socket || error $MUNLINK $DIR/socket @@ -2482,7 +2700,7 @@ check_fstype() { test_55() { rm -rf $DIR/d55 mkdir $DIR/d55 - check_fstype && skip "can't find fs $FSTYPE" && return + client_only && skip "Not a server" && return mount -t $FSTYPE -o loop,iopen $EXT2_DEV $DIR/d55 || error "mounting" touch $DIR/d55/foo $IOPENTEST1 $DIR/d55/foo $DIR/d55 || error "running $IOPENTEST1" @@ -2532,13 +2750,15 @@ test_56a() { # was test_56 error "lfs getstripe --obd wrong_uuid should return error message" [ "$OSTCOUNT" -lt 2 ] && \ - skip "skipping other lfs getstripe --obd test" && return - FILENUM=`$GETSTRIPE --recursive $DIR/d56 | sed -n '/^[ ]*1[ ]/p' | wc -l` - OBDUUID=`$GETSTRIPE --recursive $DIR/d56 | sed -n '/^[ ]*1:/p' | awk '{print $2}'` - FOUND=`$GETSTRIPE -r --obd $OBDUUID $DIR/d56 | wc -l` + skip_env "skipping other lfs getstripe --obd test" && return + OSTIDX=1 + OBDUUID=$(lfs osts | grep ${OSTIDX}": " | awk '{print $2}') + FILENUM=`$GETSTRIPE -ir $DIR/d56 | grep -x $OSTIDX | wc -l` + FOUND=`$GETSTRIPE -r --obd $OBDUUID $DIR/d56 | grep obdidx | wc -l` [ $FOUND -eq $FILENUM ] || \ error "lfs getstripe --obd wrong: found $FOUND, expected $FILENUM" - [ `$GETSTRIPE -r -v --obd $OBDUUID $DIR/d56 | sed '/^[ ]*1[ ]/d' |\ + [ `$GETSTRIPE -r -v --obd $OBDUUID $DIR/d56 | \ + sed '/^[ ]*'${OSTIDX}'[ ]/d' |\ sed -n '/^[ ]*[0-9][0-9]*[ ]/p' | wc -l` -eq 0 ] || \ error "lfs getstripe --obd wrong: should not show file on other obd" echo "lfs getstripe --obd passed." @@ -2618,7 +2838,7 @@ run_test 56h "check lfs find ! 
-name =============================" test_56i() { tdir=${tdir}i mkdir -p $DIR/$tdir - UUID=`$GETSTRIPE $DIR/$tdir | awk '/0: / { print $2 }'` + UUID=`$LFS osts | awk '/0: / { print $2 }'` OUT="`$LFIND -ost $UUID $DIR/$tdir`" [ "$OUT" ] && error "$LFIND returned directory '$OUT'" || true } @@ -2692,7 +2912,7 @@ test_56o() { run_test 56o "check lfs find -mtime for old files ==========================" test_56p() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return TDIR=$DIR/${tdir}g rm -rf $TDIR @@ -2715,7 +2935,7 @@ test_56p() { run_test 56p "check lfs find -uid and ! -uid ===============================" test_56q() { - [ $RUNAS_ID -eq $UID ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return TDIR=$DIR/${tdir}g rm -rf $TDIR @@ -2764,7 +2984,7 @@ test_57b() { mkdir -p $dir || error "creating $dir" local num=$(get_mds_dir $dir) local mymds=mds$num - + echo "mcreating $FILECOUNT files" createmany -m $dir/f 1 $FILECOUNT || \ error "creating files in $dir" @@ -2805,7 +3025,7 @@ test_57b() { run_test 57b "default LOV EAs are stored inside large inodes ===" test_58() { - [ -z "$(which wiretest 2>/dev/null)" ] && skip "could not find wiretest" && return + [ -z "$(which wiretest 2>/dev/null)" ] && skip_env "could not find wiretest" && return wiretest } run_test 58 "verify cross-platform wire constants ==============" @@ -2823,7 +3043,7 @@ run_test 59 "verify cancellation of llog records async =========" TEST60_HEAD="test_60 run $RANDOM" test_60a() { - [ ! -f run-llog.sh ] && skip "missing subtest run-llog.sh" && return + [ ! -f run-llog.sh ] && skip_env "missing subtest run-llog.sh" && return log "$TEST60_HEAD - from kernel mode" sh run-llog.sh } @@ -2942,7 +3162,7 @@ test_64a () { run_test 64a "verify filter grant calculations (in kernel) =====" test_64b () { - [ ! 
-f oos.sh ] && skip "missing subtest oos.sh" && return + [ ! -f oos.sh ] && skip_env "missing subtest oos.sh" && return sh oos.sh $MOUNT } run_test 64b "check out-of-space detection on client ===========" @@ -3056,7 +3276,7 @@ test_65j() { # bug6367 run_test 65j "set default striping on root directory (bug 6367)=" test_65k() { # bug11679 - [ "$OSTCOUNT" -lt 2 ] && skip "too few OSTs" && return + [ "$OSTCOUNT" -lt 2 ] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return echo "Check OST status: " @@ -3105,6 +3325,7 @@ test_66() { run_test 66 "update inode blocks count on client ===============" LLOOP= +LLITELOOPLOAD= cleanup_68() { trap 0 if [ ! -z "$LLOOP" ]; then @@ -3116,6 +3337,10 @@ cleanup_68() { rm -f $LLOOP unset LLOOP fi + if [ ! -z "$LLITELOOPLOAD" ]; then + rmmod llite_lloop + unset LLITELOOPLOAD + fi rm -f $DIR/f68* } @@ -3129,17 +3354,23 @@ swap_used() { # test case for lloop driver, basic function test_68a() { - [ "$UID" != 0 ] && skip "must run as root" && return + [ "$UID" != 0 ] && skip_env "must run as root" && return - grep -q llite_lloop /proc/modules - [ $? -ne 0 ] && skip "can't find module llite_lloop" && return + trap cleanup_68 EXIT + + if ! module_loaded llite_lloop; then + if load_module llite/llite_lloop; then + LLITELOOPLOAD=yes + else + skip_env "can't find module llite_lloop" + return + fi + fi LLOOP=$TMP/lloop.`date +%s`.`date +%N` dd if=/dev/zero of=$DIR/f68a bs=4k count=1024 $LCTL blockdev_attach $DIR/f68a $LLOOP || error "attach failed" - trap cleanup_68 EXIT - directio rdwr $LLOOP 0 1024 4096 || error "direct write failed" directio rdwr $LLOOP 0 1025 4096 && error "direct write should fail" @@ -3150,7 +3381,7 @@ run_test 68a "lloop driver - basic test ========================" # excercise swapping to lustre by adding a high priority swapfile entry # and then consuming memory until it is used. 
test_68b() { # was test_68 - [ "$UID" != 0 ] && skip "must run as root" && return + [ "$UID" != 0 ] && skip_env "must run as root" && return lctl get_param -n devices | grep -q obdfilter && \ skip "local OST" && return @@ -3221,11 +3452,11 @@ run_test 71 "Running dbench on lustre (don't segment fault) ====" test_72() { # bug 5695 - Test that on 2.6 remove_suid works properly check_kernel_version 43 || return 0 - [ "$RUNAS_ID" = "$UID" ] && skip "RUNAS_ID = UID = $UID -- skipping" && return + [ "$RUNAS_ID" = "$UID" ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return # Check that testing environment is properly set up. Skip if not FAIL_ON_ERROR=false check_runas_id_ret $RUNAS_ID $RUNAS_ID $RUNAS || { - skip "User $RUNAS_ID does not exist - skipping" + skip_env "User $RUNAS_ID does not exist - skipping" return 0 } # We had better clear the $DIR to get enough space for dd @@ -3301,113 +3532,6 @@ test_74b() { # bug 13310 } run_test 74b "ldlm_enqueue freed-export error path, touch (shouldn't LBUG)" -JOIN=${JOIN:-"lfs join"} -F75=$DIR/f75 -F128k=${F75}_128k -FHEAD=${F75}_head -FTAIL=${F75}_tail -export T75_PREP=no -test75_prep() { - [ $T75_PREP = "yes" ] && return - echo "using F75=$F75, F128k=$F128k, FHEAD=$FHEAD, FTAIL=$FTAIL" - - dd if=/dev/urandom of=${F75}_128k bs=128k count=1 || error "dd failed" - log "finished dd" - chmod 777 ${F128k} - T75_PREP=yes -} - -test_75a() { - test75_prep - - cp -p ${F128k} ${FHEAD} - log "finished cp to $FHEAD" - cp -p ${F128k} ${FTAIL} - log "finished cp to $FTAIL" - cat ${F128k} ${F128k} > ${F75}_sim_sim - - $JOIN ${FHEAD} ${FTAIL} || error "join ${FHEAD} ${FTAIL} error" - log "finished join $FHEAD to ${F75}_sim_sim" - cmp ${FHEAD} ${F75}_sim_sim || error "${FHEAD} ${F75}_sim_sim differ" - log "finished cmp $FHEAD to ${F75}_sim_sim" - $CHECKSTAT -a ${FTAIL} || error "tail ${FTAIL} still exist after join" -} -run_test 75a "TEST join file ====================================" - -test_75b() { - test75_prep - - cp -p ${F128k} 
${FTAIL} - cat ${F75}_sim_sim >> ${F75}_join_sim - cat ${F128k} >> ${F75}_join_sim - $JOIN ${FHEAD} ${FTAIL} || error "join ${FHEAD} ${FTAIL} error" - cmp ${FHEAD} ${F75}_join_sim || \ - error "${FHEAD} ${F75}_join_sim are different" - $CHECKSTAT -a ${FTAIL} || error "tail ${FTAIL} exist after join" -} -run_test 75b "TEST join file 2 ==================================" - -test_75c() { - test75_prep - - cp -p ${F128k} ${FTAIL} - cat ${F128k} >> ${F75}_sim_join - cat ${F75}_join_sim >> ${F75}_sim_join - $JOIN ${FTAIL} ${FHEAD} || error "join error" - cmp ${FTAIL} ${F75}_sim_join || \ - error "${FTAIL} ${F75}_sim_join are different" - $CHECKSTAT -a ${FHEAD} || error "tail ${FHEAD} exist after join" -} -run_test 75c "TEST join file 3 ==================================" - -test_75d() { - test75_prep - - cp -p ${F128k} ${FHEAD} - cp -p ${F128k} ${FHEAD}_tmp - cat ${F75}_sim_sim >> ${F75}_join_join - cat ${F75}_sim_join >> ${F75}_join_join - $JOIN ${FHEAD} ${FHEAD}_tmp || error "join ${FHEAD} ${FHEAD}_tmp error" - $JOIN ${FHEAD} ${FTAIL} || error "join ${FHEAD} ${FTAIL} error" - cmp ${FHEAD} ${F75}_join_join ||error "${FHEAD} ${F75}_join_join differ" $CHECKSTAT -a ${FHEAD}_tmp || error "${FHEAD}_tmp exist after join" - $CHECKSTAT -a ${FTAIL} || error "tail ${FTAIL} exist after join (2)" -} -run_test 75d "TEST join file 4 ==================================" - -test_75e() { - test75_prep - - rm -rf ${FHEAD} || "delete join file error" -} -run_test 75e "TEST join file 5 (remove joined file) =============" - -test_75f() { - test75_prep - - cp -p ${F128k} ${F75}_join_10_compare - cp -p ${F128k} ${F75}_join_10 - for ((i = 0; i < 10; i++)); do - cat ${F128k} >> ${F75}_join_10_compare - cp -p ${F128k} ${FTAIL} - $JOIN ${F75}_join_10 ${FTAIL} || \ - error "join ${F75}_join_10 ${FTAIL} error" - $CHECKSTAT -a ${FTAIL} || error "tail file exist after join" - done - cmp ${F75}_join_10 ${F75}_join_10_compare || \ - error "files ${F75}_join_10 ${F75}_join_10_compare differ" -} -run_test 
75f "TEST join file 6 (join 10 files) ==================" - -test_75g() { - [ ! -f ${F75}_join_10 ] && echo "${F75}_join_10 missing" && return - $LFS getstripe ${F75}_join_10 - - $OPENUNLINK ${F75}_join_10 ${F75}_join_10 || error "files unlink open" - - ls -l $F75* -} -run_test 75g "TEST join file 7 (open unlink) ====================" - num_inodes() { awk '/lustre_inode_cache/ {print $2; exit}' /proc/slabinfo } @@ -3484,7 +3608,6 @@ test_77b() { # bug 10889 error "dd error: $?" lctl set_param fail_loc=0 set_checksums 0 - rm -f $DIR/f77b } run_test 77b "checksum error on client write ====================" @@ -3502,6 +3625,7 @@ test_77c() { # bug 10889 done set_checksums 0 set_checksum_type $ORIG_CSUM_TYPE + rm -f $DIR/f77b } run_test 77c "checksum error on client read ===================" @@ -3616,7 +3740,9 @@ rm -f $F77_TMP unset F77_TMP test_78() { # bug 10901 - NSEQ=5 + remote_ost || { skip_env "local OST" && return; } + + NSEQ=5 F78SIZE=$(($(awk '/MemFree:/ { print $2 }' /proc/meminfo) / 1024)) echo "MemFree: $F78SIZE, Max file size: $MAXFREE" MEMTOTAL=$(($(awk '/MemTotal:/ { print $2 }' /proc/meminfo) / 1024)) @@ -3701,20 +3827,20 @@ test_80() { # bug 10718 run_test 80 "Page eviction is equally fast at high offsets too ====" test_99a() { - [ -z "$(which cvs 2>/dev/null)" ] && skip "could not find cvs" && \ + [ -z "$(which cvs 2>/dev/null)" ] && skip_env "could not find cvs" && \ return mkdir -p $DIR/d99cvsroot chown $RUNAS_ID $DIR/d99cvsroot local oldPWD=$PWD # bug 13584, use $TMP as working dir cd $TMP - + $RUNAS cvs -d $DIR/d99cvsroot init || error cd $oldPWD } run_test 99a "cvs init =========================================" test_99b() { - [ -z "$(which cvs 2>/dev/null)" ] && skip "could not find cvs" && return + [ -z "$(which cvs 2>/dev/null)" ] && skip_env "could not find cvs" && return [ ! 
-d $DIR/d99cvsroot ] && test_99a cd /etc/init.d # some versions of cvs import exit(1) when asked to import links or @@ -3727,7 +3853,7 @@ test_99b() { run_test 99b "cvs import =======================================" test_99c() { - [ -z "$(which cvs 2>/dev/null)" ] && skip "could not find cvs" && return + [ -z "$(which cvs 2>/dev/null)" ] && skip_env "could not find cvs" && return [ ! -d $DIR/d99cvsroot ] && test_99b cd $DIR mkdir -p $DIR/d99reposname @@ -3737,7 +3863,7 @@ test_99c() { run_test 99c "cvs checkout =====================================" test_99d() { - [ -z "$(which cvs 2>/dev/null)" ] && skip "could not find cvs" && return + [ -z "$(which cvs 2>/dev/null)" ] && skip_env "could not find cvs" && return [ ! -d $DIR/d99cvsroot ] && test_99c cd $DIR/d99reposname $RUNAS touch foo99 @@ -3746,7 +3872,7 @@ test_99d() { run_test 99d "cvs add ==========================================" test_99e() { - [ -z "$(which cvs 2>/dev/null)" ] && skip "could not find cvs" && return + [ -z "$(which cvs 2>/dev/null)" ] && skip_env "could not find cvs" && return [ ! -d $DIR/d99cvsroot ] && test_99c cd $DIR/d99reposname $RUNAS cvs update @@ -3754,7 +3880,7 @@ test_99e() { run_test 99e "cvs update =======================================" test_99f() { - [ -z "$(which cvs 2>/dev/null)" ] && skip "could not find cvs" && return + [ -z "$(which cvs 2>/dev/null)" ] && skip_env "could not find cvs" && return [ ! 
-d $DIR/d99cvsroot ] && test_99d cd $DIR/d99reposname $RUNAS cvs commit -m 'nomsg' foo99 @@ -3782,10 +3908,10 @@ test_100() { if [ $LPORT -ge 1024 ]; then echo "bad: $PROT $SND $RCV $LOCAL $REMOTE $STAT" netstat -tna - error "local: $LPORT > 1024, remote: $RPORT" + error_exit "local: $LPORT > 1024, remote: $RPORT" fi done - [ "$rc" = 0 ] || error "privileged port not found" ) + [ "$rc" = 0 ] || error_exit "privileged port not found" ) } run_test 100 "check local port using privileged port ===========" @@ -3894,7 +4020,7 @@ ra_check_101() { } test_101b() { - [ "$OSTCOUNT" -lt "2" ] && skip "skipping stride IO stride-ahead test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping stride IO stride-ahead test" && return local STRIPE_SIZE=1048576 local STRIDE_SIZE=$((STRIPE_SIZE*OSTCOUNT)) local FILE_LENGTH=$((STRIPE_SIZE*100)) @@ -3919,6 +4045,51 @@ test_101b() { } run_test 101b "check stride-io mode read-ahead =================" +set_read_ahead() { + lctl get_param -n llite.*.max_read_ahead_mb | head -n 1 + lctl set_param -n llite.*.max_read_ahead_mb $1 > /dev/null 2>&1 +} + +test_101d() { + local file=$DIR/$tfile + local size=${FILESIZE_101c:-500} + local ra_MB=${READAHEAD_MB:-40} + + local space=$(df -P $DIR | tail -n 1 | awk '{ print $4 }') + [ $space -gt $((size / 1024)) ] || + { skip "Need free space ${size}M, have $space" && return; } + + echo Creating ${size}M test file $file + dd if=/dev/zero of=$file bs=1M count=$size + echo Cancel LRU locks on lustre client to flush the client cache + cancel_lru_locks osc + + echo Disable read-ahead + local old_READAHEAD=$(set_read_ahead 0) + + echo Reading the test file $file with read-ahead disabled + time_ra_OFF=$(do_and_time "dd if=$file of=/dev/null bs=1M count=$size") + + echo Cancel LRU locks on lustre client to flush the client cache + cancel_lru_locks osc + echo Enable read-ahead with ${ra_MB}MB + set_read_ahead $ra_MB + + echo Reading the test file $file with read-ahead enabled + time_ra_ON=$(do_and_time "dd 
if=$file of=/dev/null bs=1M count=$size") + + echo read-ahead disabled time read $time_ra_OFF + echo read-ahead enabled time read $time_ra_ON + + set_read_ahead $old_READAHEAD + rm -f $file + + [ $time_ra_ON -lt $time_ra_OFF ] || + error "read-ahead enabled time read (${time_ra_ON}s) is more than + read-ahead disabled time read (${time_ra_OFF}s) filesize ${size}M" +} +run_test 101d "file read with and without read-ahead enabled =================" + export SETUP_TEST102=no setup_test102() { [ "$SETUP_TEST102" = "yes" ] && return @@ -3964,10 +4135,10 @@ test_102a() { rm -f $testfile touch $testfile - [ "$UID" != 0 ] && skip "must run as root" && return - [ -z "`lctl get_param -n mdc.*-mdc-*.connect_flags | grep xattr`" ] && skip "must have user_xattr" && return + [ "$UID" != 0 ] && skip_env "must run as root" && return + [ -z "`lctl get_param -n mdc.*-mdc-*.connect_flags | grep xattr`" ] && skip_env "must have user_xattr" && return - [ -z "$(which setfattr 2>/dev/null)" ] && skip "could not find setfattr" && return + [ -z "$(which setfattr 2>/dev/null)" ] && skip_env "could not find setfattr" && return echo "set/get xattr..." setfattr -n trusted.name1 -v value1 $testfile || error @@ -4010,7 +4181,7 @@ run_test 102a "user xattr test ==================================" test_102b() { # b10930: get/set/list trusted.lov xattr echo "get/set/list trusted.lov xattr ..." 
- [ "$OSTCOUNT" -lt "2" ] && skip "skipping 2-stripe test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping 2-stripe test" && return local testfile=$DIR/$tfile $SETSTRIPE -s 65536 -i 1 -c 2 $testfile || error "setstripe failed" getfattr -d -m "^trusted" $testfile 2> /dev/null | \ @@ -4019,9 +4190,9 @@ test_102b() { local testfile2=${testfile}2 local value=`getfattr -n trusted.lov $testfile 2> /dev/null | \ grep "trusted.lov" |sed -e 's/[^=]\+=//'` - + $MCREATE $testfile2 - setfattr -n trusted.lov -v $value $testfile2 + setfattr -n trusted.lov -v $value $testfile2 local tmp_file=${testfile}3 $GETSTRIPE -v $testfile2 > $tmp_file local stripe_size=`grep "size" $tmp_file| awk '{print $2}'` @@ -4035,7 +4206,7 @@ run_test 102b "getfattr/setfattr for trusted.lov EAs ============" test_102c() { # b10930: get/set/list lustre.lov xattr echo "get/set/list lustre.lov xattr ..." - [ "$OSTCOUNT" -lt "2" ] && skip "skipping 2-stripe test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping 2-stripe test" && return mkdir -p $DIR/$tdir chown $RUNAS_ID $DIR/$tdir local testfile=$DIR/$tdir/$tfile @@ -4046,9 +4217,9 @@ test_102c() { local testfile2=${testfile}2 local value=`getfattr -n lustre.lov $testfile 2> /dev/null | \ grep "lustre.lov" |sed -e 's/[^=]\+=//' ` - + $RUNAS $MCREATE $testfile2 - $RUNAS setfattr -n lustre.lov -v $value $testfile2 + $RUNAS setfattr -n lustre.lov -v $value $testfile2 local tmp_file=${testfile}3 $RUNAS $GETSTRIPE -v $testfile2 > $tmp_file local stripe_size=`grep "size" $tmp_file| awk '{print $2}'` @@ -4117,8 +4288,8 @@ find_lustre_tar() { test_102d() { # b10930: tar test for trusted.lov xattr TAR=$(find_lustre_tar) - [ -z "$TAR" ] && skip "lustre-aware tar is not installed" && return - [ "$OSTCOUNT" -lt "2" ] && skip "skipping N-stripe test" && return + [ -z "$TAR" ] && skip_env "lustre-aware tar is not installed" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping N-stripe test" && return setup_test102 mkdir -p $DIR/d102d $TAR xf 
$TMP/f102.tar -C $DIR/d102d --xattrs @@ -4130,8 +4301,8 @@ run_test 102d "tar restore stripe info from tarfile,not keep osts ===========" test_102f() { # b10930: tar test for trusted.lov xattr TAR=$(find_lustre_tar) - [ -z "$TAR" ] && skip "lustre-aware tar is not installed" && return - [ "$OSTCOUNT" -lt "2" ] && skip "skipping N-stripe test" && return + [ -z "$TAR" ] && skip_env "lustre-aware tar is not installed" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping N-stripe test" && return setup_test102 mkdir -p $DIR/d102f cd $DIR @@ -4145,7 +4316,7 @@ test_102h() { # bug 15777 [ -z $(lctl get_param -n mdc.*.connect_flags | grep xattr) ] && skip "must have user_xattr" && return [ -z "$(which setfattr 2>/dev/null)" ] && - skip "could not find setfattr" && return + skip_env "could not find setfattr" && return XBIG=trusted.big XSIZE=1024 @@ -4197,8 +4368,8 @@ run_test 102i "lgetxattr test on symbolic link ============" test_102j() { TAR=$(find_lustre_tar) - [ -z "$TAR" ] && skip "lustre-aware tar is not installed" && return - [ "$OSTCOUNT" -lt "2" ] && skip "skipping N-stripe test" && return + [ -z "$TAR" ] && skip_env "lustre-aware tar is not installed" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping N-stripe test" && return setup_test102 "$RUNAS" mkdir -p $DIR/d102j chown $RUNAS_ID $DIR/d102j @@ -4208,6 +4379,28 @@ test_102j() { } run_test 102j "non-root tar restore stripe info from tarfile, not keep osts ===" +test_102k() { + touch $DIR/$tfile + # b22187 just check that does not crash for regular file. 
+ setfattr -n trusted.lov $DIR/$tfile + # b22187 'setfattr -n trusted.lov' should work as remove LOV EA for directories + local test_kdir=$DIR/d102k + mkdir $test_kdir + local default_size=`$GETSTRIPE -s $test_kdir` + local default_count=`$GETSTRIPE -c $test_kdir` + local default_offset=`$GETSTRIPE -o $test_kdir` + $SETSTRIPE -s 65536 -i 1 -c 2 $test_kdir || error 'dir setstripe failed' + setfattr -n trusted.lov $test_kdir + local stripe_size=`$GETSTRIPE -s $test_kdir` + local stripe_count=`$GETSTRIPE -c $test_kdir` + local stripe_offset=`$GETSTRIPE -o $test_kdir` + [ $stripe_size -eq $default_size ] || error "stripe size $stripe_size != $default_size" + [ $stripe_count -eq $default_count ] || error "stripe count $stripe_count != $default_count" + [ $stripe_offset -eq $default_offset ] || error "stripe offset $stripe_offset != $default_offset" + rm -rf $DIR/$tfile $test_kdir +} +run_test 102k "setfattr without parameter of value shouldn't cause a crash" + cleanup_test102 run_acl_subtest() @@ -4217,9 +4410,9 @@ run_acl_subtest() } test_103 () { - [ "$UID" != 0 ] && skip "must run as root" && return + [ "$UID" != 0 ] && skip_env "must run as root" && return [ -z "$(lctl get_param -n mdc.*-mdc-*.connect_flags | grep acl)" ] && skip "must have acl enabled" && return - [ -z "$(which setfacl 2>/dev/null)" ] && skip "could not find setfacl" && return + [ -z "$(which setfacl 2>/dev/null)" ] && skip_env "could not find setfacl" && return $GSS && skip "could not run under gss" && return declare -a identity_old @@ -4235,19 +4428,19 @@ test_103 () { echo "performing cp ..." run_acl_subtest cp || error echo "performing getfacl-noacl..." - run_acl_subtest getfacl-noacl || error + run_acl_subtest getfacl-noacl || error "getfacl-noacl test failed" echo "performing misc..." - run_acl_subtest misc || error + run_acl_subtest misc || error "misc test failed" echo "performing permissions..." 
- run_acl_subtest permissions || error + run_acl_subtest permissions || error "permissions failed" echo "performing setfacl..." - run_acl_subtest setfacl || error + run_acl_subtest setfacl || error "setfacl test failed" # inheritance test got from HP echo "performing inheritance..." - cp $LUSTRE/tests/acl/make-tree . || error - chmod +x make-tree || error - run_acl_subtest inheritance || error + cp $LUSTRE/tests/acl/make-tree . || error "cannot copy make-tree" + chmod +x make-tree || error "chmod +x failed" + run_acl_subtest inheritance || error "inheritance test failed" rm -f make-tree cd $SAVE_PWD @@ -4261,7 +4454,7 @@ test_103 () { } run_test 103 "acl test =========================================" -test_104() { +test_104a() { touch $DIR/$tfile lfs df || error "lfs df failed" lfs df -ih || error "lfs df -ih failed" @@ -4269,7 +4462,7 @@ test_104() { lfs df -i $DIR || error "lfs df -i $DIR failed" lfs df $DIR/$tfile || error "lfs df $DIR/$tfile failed" lfs df -ih $DIR/$tfile || error "lfs df -ih $DIR/$tfile failed" - + OSC=`lctl get_param -n devices | awk '/-osc-/ {print $4}' | head -n 1` lctl --device %$OSC deactivate lfs df || error "lfs df with deactivated OSC failed" @@ -4277,7 +4470,18 @@ test_104() { lfs df || error "lfs df with reactivated OSC failed" rm -f $DIR/$tfile } -run_test 104 "lfs df [-ih] [path] test =========================" +run_test 104a "lfs df [-ih] [path] test =========================" + +test_104b() { + [ $RUNAS_ID -eq $UID ] && skip_env "RUNAS_ID = UID = $UID -- skipping" && return + chmod 666 /dev/obd + denied_cnt=$((`$RUNAS $LFS check servers 2>&1 | grep "Permission denied" | wc -l`)) + if [ $denied_cnt -ne 0 ]; + then + error "lfs check servers test failed" + fi +} +run_test 104b "$RUNAS lfs check servers test ====================" test_105a() { # doesn't work on 2.4 kernels @@ -4426,11 +4630,10 @@ free_min_max () { } test_116() { - [ "$OSTCOUNT" -lt "2" ] && skip "$OSTCOUNT < 2 OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env 
"$OSTCOUNT < 2 OSTs" && return echo -n "Free space priority " lctl get_param -n lov.*-clilov-*.qos_prio_free - DELAY=$(lctl get_param -n lov.*-clilov-*.qos_maxage | head -1 | awk '{print $1}') declare -a AVAIL free_min_max [ $MINV -gt 960000 ] && skip "too much free space in OST$MINI, skip" &&\ @@ -4451,7 +4654,7 @@ test_116() { done FILL=$(($MINV / 4)) sync - sleep $DELAY + sleep_maxage free_min_max DIFF=$(($MAXV - $MINV)) @@ -4480,7 +4683,7 @@ test_116() { done echo "wrote $i 200k files" sync - sleep $DELAY + sleep_maxage echo "Note: free space may not be updated, so measurements might be off" free_min_max @@ -4547,7 +4750,7 @@ reset_async() { test_118a() #bug 11710 { reset_async - + multiop $DIR/$tfile oO_CREAT:O_RDWR:O_SYNC:w4096c DIRTY=$(lctl get_param -n llite.*.dump_page_cache | grep -c dirty) WRITEBACK=$(lctl get_param -n llite.*.dump_page_cache | grep -c writeback) @@ -4591,7 +4794,7 @@ test_118b() # until a subsequent RPC completes successfully without error. multiop $DIR/$tfile Ow4096yc rm -f $DIR/$tfile - + return 0 } run_test 118b "Reclaim dirty pages on fatal error ==========" @@ -4633,7 +4836,7 @@ test_118c() if [[ $DIRTY -ne 0 || $WRITEBACK -ne 0 ]]; then error "Dirty pages not flushed to disk, dirty=$DIRTY, writeback=$WRITEBACK" fi - + rm -f $DIR/$tfile echo "Dirty pages flushed via fsync on EROFS" return 0 @@ -4649,7 +4852,7 @@ test_118d() #define OBD_FAIL_OST_BRW_PAUSE_BULK set_nodes_failloc "$(osts_nodes)" 0x214 # multiop should block due to fsync until pages are written - multiop $DIR/$tfile oO_CREAT:O_RDWR:O_SYNC:w4096c & + multiop $DIR/$tfile oO_CREAT:O_RDWR:O_SYNC:w4096c & MULTIPID=$! sleep 1 @@ -4691,7 +4894,7 @@ test_118f() { if [[ $RC -eq 0 ]]; then error "Must return error due to dropped pages, rc=$RC" fi - + lctl set_param fail_loc=0x0 LOCKED=$(lctl get_param -n llite.*.dump_page_cache | grep -c locked) @@ -4723,7 +4926,7 @@ test_118g() { # simulate local -ENOMEM multiop $DIR/$tfile oO_CREAT:O_RDWR:O_SYNC:w4096c RC=$? 
- + lctl set_param fail_loc=0 if [[ $RC -eq 0 ]]; then error "Must return error due to dropped pages, rc=$RC" @@ -4736,7 +4939,7 @@ test_118g() { if [[ $LOCKED -ne 0 ]]; then error "Locked pages remain in cache, locked=$LOCKED" fi - + if [[ $DIRTY -ne 0 || $WRITEBACK -ne 0 ]]; then error "Dirty pages not flushed to disk, dirty=$DIRTY, writeback=$WRITEBACK" fi @@ -4759,7 +4962,7 @@ test_118h() { # Should simulate ENOMEM error which is recoverable and should be handled by timeout multiop $DIR/$tfile oO_CREAT:O_RDWR:O_SYNC:w4096c RC=$? - + set_nodes_failloc "$(osts_nodes)" 0 if [[ $RC -eq 0 ]]; then error "Must return error due to dropped pages, rc=$RC" @@ -4772,7 +4975,7 @@ test_118h() { if [[ $LOCKED -ne 0 ]]; then error "Locked pages remain in cache, locked=$LOCKED" fi - + if [[ $DIRTY -ne 0 || $WRITEBACK -ne 0 ]]; then error "Dirty pages not flushed to disk, dirty=$DIRTY, writeback=$WRITEBACK" fi @@ -4791,13 +4994,13 @@ test_118i() { #define OBD_FAIL_OST_BRW_WRITE_BULK 0x20e set_nodes_failloc "$(osts_nodes)" 0x20e - + # Should simulate ENOMEM error which is recoverable and should be handled by timeout multiop $DIR/$tfile oO_CREAT:O_RDWR:O_SYNC:w4096c & PID=$! sleep 5 set_nodes_failloc "$(osts_nodes)" 0 - + wait $PID RC=$? 
if [[ $RC -ne 0 ]]; then @@ -4810,7 +5013,7 @@ test_118i() { if [[ $LOCKED -ne 0 ]]; then error "Locked pages remain in cache, locked=$LOCKED" fi - + if [[ $DIRTY -ne 0 || $WRITEBACK -ne 0 ]]; then error "Dirty pages not flushed to disk, dirty=$DIRTY, writeback=$WRITEBACK" fi @@ -4844,7 +5047,7 @@ test_118j() { if [[ $LOCKED -ne 0 ]]; then error "Locked pages remain in cache, locked=$LOCKED" fi - + # in recoverable error on OST we want resend and stay until it finished if [[ $DIRTY -ne 0 || $WRITEBACK -ne 0 ]]; then error "Dirty pages not flushed to disk, dirty=$DIRTY, writeback=$WRITEBACK" @@ -4898,7 +5101,7 @@ run_test 119a "Short directIO read must return actual read amount" test_119b() # bug 11737 { - [ "$OSTCOUNT" -lt "2" ] && skip "skipping 2-stripe test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping 2-stripe test" && return $SETSTRIPE -c 2 $DIR/$tfile || error "setstripe failed" dd if=/dev/zero of=$DIR/$tfile bs=1M count=1 seek=1 || error "dd failed" @@ -5126,11 +5329,11 @@ run_test 120g "Early Lock Cancel: performance test" test_121() { #bug #10589 rm -rf $DIR/$tfile - writes=$(LANG=C dd if=/dev/zero of=$DIR/$tfile count=1 2>&1 | awk -F '+' '/out/ {print $1}') + writes=$(LANG=C dd if=/dev/zero of=$DIR/$tfile count=1 2>&1 | awk -F '+' '/out$/ {print $1}') #define OBD_FAIL_LDLM_CANCEL_RACE 0x310 lctl set_param fail_loc=0x310 cancel_lru_locks osc > /dev/null - reads=$(LANG=C dd if=$DIR/$tfile of=/dev/null 2>&1 | awk -F '+' '/in/ {print $1}') + reads=$(LANG=C dd if=$DIR/$tfile of=/dev/null 2>&1 | awk -F '+' '/in$/ {print $1}') lctl set_param fail_loc=0 [ "$reads" -eq "$writes" ] || error "read" $reads "blocks, must be" $writes } @@ -5139,8 +5342,8 @@ run_test 121 "read cancel race =========" test_123a() { # was test 123, statahead(bug 11401) SLOWOK=0 if [ -z "$(grep "processor.*: 1" /proc/cpuinfo)" ]; then - log "testing on UP system. Performance may be not as good as expected." - SLOWOK=1 + log "testing on UP system. 
Performance may be not as good as expected." + SLOWOK=1 fi rm -rf $DIR/$tdir @@ -5172,48 +5375,32 @@ test_123a() { # was test 123, statahead(bug 11401) etime=`date +%s` delta_sa=$((etime - stime)) log "ls $i files with statahead: $delta_sa sec" - lctl get_param -n llite.*.statahead_stats + lctl get_param -n llite.*.statahead_stats ewrong=`lctl get_param -n llite.*.statahead_stats | grep "statahead wrong:" | awk '{print $3}'` - if [ $swrong -lt $ewrong ]; then - log "statahead was stopped, maybe too many locks held!" - fi - - [ $delta -eq 0 ] && continue + [ $swrong -lt $ewrong ] && log "statahead was stopped, maybe too many locks held!" + [ $delta -eq 0 -o $delta_sa -eq 0 ] && continue if [ $((delta_sa * 100)) -gt $((delta * 105)) -a $delta_sa -gt $((delta + 2)) ]; then + max=`lctl get_param -n llite.*.statahead_max | head -n 1` + lctl set_param -n llite.*.statahead_max 0 + lctl get_param llite.*.statahead_max + cancel_lru_locks mdc + cancel_lru_locks osc + stime=`date +%s` + time ls -l $DIR/$tdir | wc -l + etime=`date +%s` + delta=$((etime - stime)) + log "ls $i files again without statahead: $delta sec" + lctl set_param llite.*.statahead_max=$max + if [ $((delta_sa * 100)) -gt $((delta * 105)) -a $delta_sa -gt $((delta + 2)) ]; then if [ $SLOWOK -eq 0 ]; then error "ls $i files is slower with statahead!" 
- - max=`lctl get_param -n llite.*.statahead_max | head -n 1` - lctl set_param -n llite.*.statahead_max 0 - lctl get_param llite.*.statahead_max - cancel_lru_locks mdc - cancel_lru_locks osc - $LCTL clear - stime=`date +%s` - time ls -l $DIR/$tdir | wc -l - etime=`date +%s` - $LCTL dk $TMP/lustre_${TESTSUITE}_${TESTNAME}_${i}_disable.$(etime) - delta=$((etime - stime)) - log "ls $i files without statahead: $delta sec, dump to $TMP/lustre_${TESTSUITE}_${TESTNAME}_${i}_disable.$(etime)" - lctl set_param llite.*.statahead_max=$max - - lctl get_param -n llite.*.statahead_max | grep '[0-9]' - cancel_lru_locks mdc - cancel_lru_locks osc - $LCTL clear - stime=`date +%s` - time ls -l $DIR/$tdir | wc -l - etime=`date +%s` - $LCTL dk $TMP/lustre_${TESTSUITE}_${TESTNAME}_${i}_enable.$(etime) - delta_sa=$((etime - stime)) - log "ls $i files with statahead: $delta_sa sec, dump to $TMP/lustre_${TESTSUITE}_${TESTNAME}_${i}_enable.$(etime)" - lctl get_param -n llite.*.statahead_stats else log "ls $i files is slower with statahead!" fi break + fi fi [ $delta -gt 20 ] && break @@ -5236,7 +5423,7 @@ run_test 123a "verify statahead work" test_123b () { # statahead(bug 15027) mkdir -p $DIR/$tdir createmany -o $DIR/$tdir/$tfile-%d 1000 - + cancel_lru_locks mdc cancel_lru_locks osc @@ -5304,7 +5491,7 @@ test_124a() { log "LVF=$LVF" local OLD_LVF=`lctl get_param -n $NSDIR.pool.lock_volume_factor` lctl set_param -n $NSDIR.pool.lock_volume_factor $LVF - + # Let's make sure that we really have some margin. Client checks # cached locks every 10 sec. 
SLEEP=$((SLEEP+20)) @@ -5426,7 +5613,7 @@ run_test 125 "don't return EPROTO when a dir has a non-default striping and ACLs test_126() { # bug 12829/13455 [ -z "$(lctl get_param -n llite.*.client_type | grep local)" ] && skip "must run as local client" && return - [ "$UID" != 0 ] && echo "skipping $TESTNAME (must run as root)" && return + [ "$UID" != 0 ] && skip_env "skipping $TESTNAME (must run as root)" && return $GSS && skip "must run as gss disabled" && return $RUNAS -u 0 -g 1 touch $DIR/$tfile || error "touch failed" @@ -5449,7 +5636,7 @@ test_127() { # bug 15521 echo "got $COUNT $NAME" [ ! $MIN ] && error "Missing min value for $NAME proc entry" eval $NAME=$COUNT || error "Wrong proc format" - + case $NAME in read_bytes|write_bytes) [ $MIN -lt 4096 ] && error "min is too small: $MIN" @@ -5583,7 +5770,7 @@ test_130a() { run_test 130a "FIEMAP (1-stripe file)" test_130b() { - [ "$OSTCOUNT" -lt "2" ] && skip "skipping FIEMAP on 2-stripe file test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping FIEMAP on 2-stripe file test" && return filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && return @@ -5632,7 +5819,7 @@ test_130b() { run_test 130b "FIEMAP (2-stripe file)" test_130c() { - [ "$OSTCOUNT" -lt "2" ] && skip "skipping FIEMAP on 2-stripe file with hole test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping FIEMAP on 2-stripe file with hole test" && return filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && return @@ -5687,7 +5874,7 @@ test_130c() { run_test 130c "FIEMAP (2-stripe file with hole)" test_130d() { - [ "$OSTCOUNT" -lt "3" ] && skip "skipping FIEMAP on N-stripe file test" && return + [ "$OSTCOUNT" -lt "3" ] && skip_env "skipping FIEMAP on N-stripe file test" && return filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && 
return @@ -5736,7 +5923,7 @@ test_130d() { run_test 130d "FIEMAP (N-stripe file)" test_130e() { - [ "$OSTCOUNT" -lt "2" ] && skip "skipping continuation FIEMAP test" && return + [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping continuation FIEMAP test" && return filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && return @@ -5744,16 +5931,16 @@ test_130e() { trap cleanup_130 EXIT RETURN local fm_file=$DIR/$tfile - lfs setstripe -s 65536 -c 2 $fm_file || error "setstripe failed on $fm_file" + lfs setstripe -s 131072 -c 2 $fm_file || error "setstripe failed on $fm_file" NUM_BLKS=512 - EXPECTED_LEN=$(( (NUM_BLKS / 2) * 4 )) + EXPECTED_LEN=$(( (NUM_BLKS / 2) * 64 )) for ((i = 0; i < $NUM_BLKS; i++)) do - dd if=/dev/zero of=$fm_file count=1 bs=4096 seek=$((2*$i)) conv=notrunc > /dev/null 2>&1 + dd if=/dev/zero of=$fm_file count=1 bs=64k seek=$((2*$i)) conv=notrunc > /dev/null 2>&1 done filefrag -ves $fm_file || error "filefrag $fm_file failed" - filefrag_op=`filefrag -ve $fm_file | grep -A 750 "ext:" | grep -v "ext:" | grep -v "found"` + filefrag_op=`filefrag -ve $fm_file | grep -A 12000 "ext:" | grep -v "ext:" | grep -v "found"` last_lun=`echo $filefrag_op | cut -d: -f5` @@ -5832,12 +6019,80 @@ test_131e() { } run_test 131e "test read hitting hole" +get_ost_param() { + local token=$1 + local gl_sum=0 + for node in $(osts_nodes); do + gl=$(do_node $node "$LCTL get_param -n ost.OSS.ost.stats" | awk '/'$token'/ {print $2}' | head -n 1) + [ x$gl = x"" ] && gl=0 + gl_sum=$((gl_sum + gl)) + done + echo $gl +} + +som_mode_switch() { + local som=$1 + local gl1=$2 + local gl2=$3 + + if [ x$som = x"enabled" ]; then + [ $((gl2 - gl1)) -gt 0 ] && error "no glimpse RPC is expected" + do_facet mgs "$LCTL conf_param $FSNAME.mdt.som=disabled" + else + [ $((gl2 - gl1)) -gt 0 ] || error "some glimpse RPC is expected" + do_facet mgs "$LCTL conf_param $FSNAME.mdt.som=enabled" + fi + + # do remount to make new mount-conf 
parameters actual + echo remounting... + sync + stopall + setupall +} + +test_132() { #1028, SOM + local num=$(get_mds_dir $DIR) + local mymds=mds${num} + + dd if=/dev/zero of=$DIR/$tfile count=1 2>/dev/null + cancel_lru_locks osc + + som1=$(do_facet $mymds "$LCTL get_param mdt.*.som" | awk -F= ' {print $2}' | head -n 1) + + gl1=$(get_ost_param "ldlm_glimpse_enqueue") + stat $DIR/$tfile >/dev/null + gl2=$(get_ost_param "ldlm_glimpse_enqueue") + echo "====> SOM is "$som1", "$((gl2 - gl1))" glimpse RPC occured" + rm $DIR/$tfile + som_mode_switch $som1 $gl1 $gl2 + + dd if=/dev/zero of=$DIR/$tfile count=1 2>/dev/null + cancel_lru_locks osc + + som2=$(do_facet $mymds "$LCTL get_param mdt.*.som" | awk -F= ' {print $2}' | head -n 1) + if [ $som1 == $som2 ]; then + error "som is still "$som2 + if [ x$som2 = x"enabled" ]; then + som2="disabled" + else + som2="enabled" + fi + fi + + gl1=$(get_ost_param "ldlm_glimpse_enqueue") + stat $DIR/$tfile >/dev/null + gl2=$(get_ost_param "ldlm_glimpse_enqueue") + echo "SOM is "$som2", "$((gl2 - gl1))" glimpse RPC occured" + som_mode_switch $som2 $gl1 $gl2 +} +run_test 132 "som avoids glimpse rpc" + test_140() { #bug-17379 mkdir -p $DIR/$tdir || error "Creating dir $DIR/$tdir" cd $DIR/$tdir || error "Changing to $DIR/$tdir" cp /usr/bin/stat . 
|| error "Copying stat to $DIR/$tdir" - # VFS limits max symlink depth to 5(4KSTACK) or 8 + # VFS limits max symlink depth to 5(4KSTACK) or 7(8KSTACK) or 8 local i=0 while i=`expr $i + 1`; do mkdir -p $i || error "Creating dir $i" @@ -5858,7 +6113,7 @@ test_140() { #bug-17379 done i=`expr $i - 1` echo "The symlink depth = $i" - [ $i -eq 4 -o $i -eq 8 ] || error "Invalid symlink depth" + [ $i -eq 5 -o $i -eq 7 -o $i -eq 8 ] || error "Invalid symlink depth" } run_test 140 "Check reasonable stack depth (shouldn't LBUG) ====" @@ -5870,6 +6125,7 @@ test_150() { cancel_lru_locks osc cmp $TF $DIR/$tfile || error "$TMP/$tfile $DIR/$tfile differ" remount_client $MOUNT + df -P $MOUNT cmp $TF $DIR/$tfile || error "$TF $DIR/$tfile differ (remount)" $TRUNCATE $TF 6000 @@ -5892,77 +6148,86 @@ test_150() { } run_test 150 "truncate/append tests" -function roc_access() { - ACCNUM=`$LCTL get_param -n obdfilter.*.stats | \ - grep 'cache_access'| awk '{print $2}' | \ - awk '{sum=sum+$3} END{print sum}'` - echo $ACCNUM +function roc_hit() { + local list=$(comma_list $(osts_nodes)) + + ACCNUM=$(do_nodes $list $LCTL get_param -n obdfilter.*.stats | \ + awk '/'cache_hit'/ {sum+=$2} END {print sum}') + echo $ACCNUM } -function roc_hit() { - ACCNUM=`$LCTL get_param -n obdfilter.*.stats | \ - grep 'cache_hit'|awk '{print $2}' | \ - awk '{sum=sum+$1} END{print sum}'` - echo $ACCNUM +function set_cache() { + local on=1 + + if [ "$2" == "off" ]; then + on=0; + fi + local list=$(comma_list $(osts_nodes)) + do_nodes $list lctl set_param obdfilter.*.${1}_cache_enable $on + + cancel_lru_locks osc } test_151() { - local CPAGES=3 + remote_ost_nodsh && skip "remote OST with nodsh" && return - # check whether obdfilter is cache capable at all - if ! 
$LCTL get_param -n obdfilter.*.read_cache_enable; then - echo "not cache-capable obdfilter" - return 0 - fi + local CPAGES=3 + local list=$(comma_list $(osts_nodes)) - # check cache is enabled on all obdfilters - if $LCTL get_param -n obdfilter.*.read_cache_enable | grep 0 >&/dev/null; then - echo "oss cache is disabled" - return 0 - fi + # check whether obdfilter is cache capable at all + if ! do_nodes $list $LCTL get_param -n obdfilter.*.read_cache_enable > /dev/null; then + echo "not cache-capable obdfilter" + return 0 + fi - $LCTL set_param -n obdfilter.*.writethrough_cache_enable 1 + # check cache is enabled on all obdfilters + if do_nodes $list $LCTL get_param -n obdfilter.*.read_cache_enable | grep 0 >&/dev/null; then + echo "oss cache is disabled" + return 0 + fi - # pages should be in the case right after write - dd if=/dev/urandom of=$DIR/$tfile bs=4k count=$CPAGES || error "dd failed" - local BEFORE=`roc_hit` - cancel_lru_locks osc - cat $DIR/$tfile >/dev/null - local AFTER=`roc_hit` - if ! let "AFTER - BEFORE == CPAGES"; then - error "NOT IN CACHE: before: $BEFORE, after: $AFTER" - fi + do_nodes $list $LCTL set_param -n obdfilter.*.writethrough_cache_enable 1 - # the following read invalidates the cache - cancel_lru_locks osc - $LCTL set_param -n obdfilter.*.read_cache_enable 0 - cat $DIR/$tfile >/dev/null + # pages should be in the case right after write + dd if=/dev/urandom of=$DIR/$tfile bs=4k count=$CPAGES || error "dd failed" + local BEFORE=`roc_hit` + cancel_lru_locks osc + cat $DIR/$tfile >/dev/null + local AFTER=`roc_hit` + if ! 
let "AFTER - BEFORE == CPAGES"; then + error "NOT IN CACHE: before: $BEFORE, after: $AFTER" + fi - # now data shouldn't be found in the cache - BEFORE=`roc_hit` - cancel_lru_locks osc - cat $DIR/$tfile >/dev/null - AFTER=`roc_hit` - if let "AFTER - BEFORE != 0"; then - error "IN CACHE: before: $BEFORE, after: $AFTER" - fi + # the following read invalidates the cache + cancel_lru_locks osc + do_nodes $list $LCTL set_param -n obdfilter.*.read_cache_enable 0 + cat $DIR/$tfile >/dev/null - $LCTL set_param -n obdfilter.*.read_cache_enable 1 - rm -f $DIR/$tfile + # now data shouldn't be found in the cache + BEFORE=`roc_hit` + cancel_lru_locks osc + cat $DIR/$tfile >/dev/null + AFTER=`roc_hit` + if let "AFTER - BEFORE != 0"; then + error "IN CACHE: before: $BEFORE, after: $AFTER" + fi + + do_nodes $list $LCTL set_param -n obdfilter.*.read_cache_enable 1 + rm -f $DIR/$tfile } run_test 151 "test cache on oss and controls ===============================" test_152() { local TF="$TMP/$tfile" - # simulate ENOMEM during write -#define OBD_FAIL_OST_NOMEM 0x226 + # simulate ENOMEM during write +#define OBD_FAIL_OST_NOMEM 0x226 lctl set_param fail_loc=0x80000226 dd if=/dev/urandom of=$TF bs=6096 count=1 || error "dd failed" cp $TF $DIR/$tfile sync || error "sync failed" lctl set_param fail_loc=0 - + # discard client's cache cancel_lru_locks osc @@ -5971,7 +6236,7 @@ test_152() { cmp $TF $DIR/$tfile || error "cmp failed" lctl set_param fail_loc=0 - rm -f $TF + rm -f $TF } run_test 152 "test read/write with enomem ============================" @@ -5994,6 +6259,210 @@ test_154() { } run_test 154 "Opening a file by FID" +test_155_load() { + local temp=$TMP/$tfile + local file=$DIR/$tfile + local list=$(comma_list $(osts_nodes)) + local big=$(do_nodes $list grep "cache" /proc/cpuinfo | \ + awk '{sum+=$4} END{print sum}') + + log big is $big K + + dd if=/dev/urandom of=$temp bs=6096 count=1 || \ + error "dd of=$temp bs=6096 count=1 failed" + cp $temp $file + cancel_lru_locks osc + cmp 
$temp $file || error "$temp $file differ" + + $TRUNCATE $temp 6000 + $TRUNCATE $file 6000 + cmp $temp $file || error "$temp $file differ (truncate1)" + + echo "12345" >>$temp + echo "12345" >>$file + cmp $temp $file || error "$temp $file differ (append1)" + + echo "12345" >>$temp + echo "12345" >>$file + cmp $temp $file || error "$temp $file differ (append2)" + + dd if=/dev/urandom of=$temp bs=$((big*2)) count=1k || \ + error "dd of=$temp bs=$((big*2)) count=1k failed" + cp $temp $file + ls -lh $temp $file + cancel_lru_locks osc + cmp $temp $file || error "$temp $file differ" + + rm -f $temp + true +} + +test_155a() { + set_cache read on + set_cache writethrough on + test_155_load +} +run_test 155a "Verification of correctness: read cache:on write_cache:on" + +test_155b() { + set_cache read on + set_cache writethrough off + test_155_load +} +run_test 155b "Verification of correctness: read cache:on write_cache:off" + +test_155c() { + set_cache read off + set_cache writethrough on + test_155_load +} +run_test 155c "Verification of correctness: read cache:off write_cache:on" + +test_155d() { + set_cache read off + set_cache writethrough off + test_155_load +} +run_test 155d "Verification of correctness: read cache:off write_cache:off " + +test_156() { + local CPAGES=3 + local BEFORE + local AFTER + local file="$DIR/$tfile" + + log "Turn on read and write cache" + set_cache read on + set_cache writethrough on + + log "Write data and read it back." + log "Read should be satisfied from the cache." + dd if=/dev/urandom of=$file bs=4k count=$CPAGES || error "dd failed" + BEFORE=`roc_hit` + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! let "AFTER - BEFORE == CPAGES"; then + error "NOT IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + log "Read again; it should be satisfied from the cache." + BEFORE=$AFTER + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! 
let "AFTER - BEFORE == CPAGES"; then + error "NOT IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + + log "Turn off the read cache and turn on the write cache" + set_cache read off + set_cache writethrough on + + log "Read again; it should be satisfied from the cache." + BEFORE=`roc_hit` + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! let "AFTER - BEFORE == CPAGES"; then + error "NOT IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + log "Read again; it should not be satisfied from the cache." + BEFORE=$AFTER + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! let "AFTER - BEFORE == 0"; then + error "IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + log "Write data and read it back." + log "Read should be satisfied from the cache." + dd if=/dev/urandom of=$file bs=4k count=$CPAGES || error "dd failed" + BEFORE=`roc_hit` + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! let "AFTER - BEFORE == CPAGES"; then + error "NOT IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + log "Read again; it should not be satisfied from the cache." + BEFORE=$AFTER + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! let "AFTER - BEFORE == 0"; then + error "IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + + log "Turn off read and write cache" + set_cache read off + set_cache writethrough off + + log "Write data and read it back" + log "It should not be satisfied from the cache." + rm -f $file + dd if=/dev/urandom of=$file bs=4k count=$CPAGES || error "dd failed" + cancel_lru_locks osc + BEFORE=`roc_hit` + cat $file >/dev/null + AFTER=`roc_hit` + if ! 
let "AFTER - BEFORE == 0"; then + error_ignore 20762 "IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + + log "Turn on the read cache and turn off the write cache" + set_cache read on + set_cache writethrough off + + log "Write data and read it back" + log "It should not be satisfied from the cache." + rm -f $file + dd if=/dev/urandom of=$file bs=4k count=$CPAGES || error "dd failed" + BEFORE=`roc_hit` + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! let "AFTER - BEFORE == 0"; then + error_ignore 20762 "IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + log "Read again; it should be satisfied from the cache." + BEFORE=`roc_hit` + cancel_lru_locks osc + cat $file >/dev/null + AFTER=`roc_hit` + if ! let "AFTER - BEFORE == CPAGES"; then + error "NOT IN CACHE: before: $BEFORE, after: $AFTER" + else + log "cache hits:: before: $BEFORE, after: $AFTER" + fi + + rm -f $file +} +run_test 156 "Verification of tunables ============================" + #Changelogs err17935 () { if [ $MDSCOUNT -gt 1 ]; then @@ -6030,20 +6499,20 @@ test_160() { # verify contents echo "verifying target fid" fidc=$($LFS changelog $MDT0 | grep timestamp | grep "CREAT" | \ - tail -1 | awk '{print $5}') + tail -1 | awk '{print $6}') fidf=$($LFS path2fid $DIR/$tdir/pics/zach/timestamp) [ "$fidc" == "t=$fidf" ] || \ err17935 "fid in changelog $fidc != file fid $fidf" echo "verifying parent fid" fidc=$($LFS changelog $MDT0 | grep timestamp | grep "CREAT" | \ - tail -1 | awk '{print $6}') + tail -1 | awk '{print $7}') fidf=$($LFS path2fid $DIR/$tdir/pics/zach) [ "$fidc" == "p=$fidf" ] || \ - err17935 "pfid in changelog $fidc != dir fid $fidf" + err17935 "pfid in changelog $fidc != dir fid $fidf" USER_REC1=$(do_facet $SINGLEMDS lctl get_param -n \ mdd.$MDT0.changelog_users | grep $USER | awk '{print $2}') - $LFS changelog_clear $MDT0 $USER $(($USER_REC1 + 5)) + $LFS 
changelog_clear $MDT0 $USER $(($USER_REC1 + 5)) USER_REC2=$(do_facet $SINGLEMDS lctl get_param -n \ mdd.$MDT0.changelog_users | grep $USER | awk '{print $2}') echo "verifying user clear: $(( $USER_REC1 + 5 )) == $USER_REC2" @@ -6079,9 +6548,6 @@ test_160() { run_test 160 "changelog sanity" test_161() { - # need local MDT for fid2path - remote_mds && skip "remote MDS" && return - mkdir -p $DIR/$tdir cp /etc/hosts $DIR/$tdir/$tfile mkdir $DIR/$tdir/foo1 @@ -6091,8 +6557,8 @@ test_161() { ln $DIR/$tdir/$tfile $DIR/$tdir/foo1/luna ln $DIR/$tdir/$tfile $DIR/$tdir/foo2/thor local FID=$($LFS path2fid $DIR/$tdir/$tfile | tr -d '[') - if [ "$($LFS fid2path ${mds1_svc} $FID | wc -l)" != "5" ]; then - $LFS fid2path ${mds1_svc} $FID + if [ "$($LFS fid2path $DIR $FID | wc -l)" != "5" ]; then + $LFS fid2path $DIR $FID err17935 "bad link ea" fi # middle @@ -6103,9 +6569,9 @@ test_161() { rm $DIR/$tdir/$tfile # rename mv $DIR/$tdir/foo1/sofia $DIR/$tdir/foo2/maggie - if [ "$($LFS fid2path ${mds1_svc} --link 1 $FID)" != "/$tdir/foo2/maggie" ] + if [ "$($LFS fid2path $DIR --link 1 $FID)" != "/$tdir/foo2/maggie" ] then - $LFS fid2path ${mds1_svc} $FID + $LFS fid2path $DIR $FID err17935 "bad link rename" fi rm $DIR/$tdir/foo2/maggie @@ -6114,11 +6580,11 @@ test_161() { local longname=filename_avg_len_is_thirty_two_ createmany -l$DIR/$tdir/foo1/luna $DIR/$tdir/foo2/$longname 1000 || \ error "failed to hardlink many files" - links=$($LFS fid2path ${mds1_svc} $FID | wc -l) + links=$($LFS fid2path $DIR $FID | wc -l) echo -n "${links}/1000 links in link EA" [ ${links} -gt 60 ] || err17935 "expected at least 60 links in link EA" unlinkmany $DIR/$tdir/foo2/$longname 1000 || \ - error "failed to unlink many hardlinks" + error "failed to unlink many hardlinks" } run_test 161 "link ea sanity" @@ -6141,9 +6607,6 @@ check_path() { } test_162() { - # need local MDT for fid2path - remote_mds && skip "remote MDS" && return - # Make changes to filesystem mkdir -p $DIR/$tdir/d2 touch 
$DIR/$tdir/d2/$tfile @@ -6151,25 +6614,50 @@ test_162() { touch $DIR/$tdir/d2/x2 mkdir -p $DIR/$tdir/d2/a/b/c mkdir -p $DIR/$tdir/d2/p/q/r + # regular file FID=$($LFS path2fid $DIR/$tdir/d2/$tfile | tr -d '[') - check_path "/$tdir/d2/$tfile" ${mds1_svc} $FID --link 0 + check_path "/$tdir/d2/$tfile" $DIR $FID --link 0 + + # softlink + ln -s $DIR/$tdir/d2/$tfile $DIR/$tdir/d2/p/q/r/slink + FID=$($LFS path2fid $DIR/$tdir/d2/p/q/r/slink | tr -d '[') + check_path "/$tdir/d2/p/q/r/slink" $DIR $FID --link 0 + + # hardlink ln $DIR/$tdir/d2/$tfile $DIR/$tdir/d2/p/q/r/hlink mv $DIR/$tdir/d2/$tfile $DIR/$tdir/d2/a/b/c/new_file FID=$($LFS path2fid $DIR/$tdir/d2/a/b/c/new_file | tr -d '[') - check_path "/$tdir/d2/a/b/c/new_file" ${mds1_svc} $FID --link 1 - check_path "/$tdir/d2/p/q/r/hlink" ${mds1_svc} $FID --link 0 - # check that there are 2 links - ${LFS} fid2path ${mds1_svc} $FID | wc -l | grep -q 2 || \ - err17935 "expected 2 links" + # fid2path dir/fsname should both work + check_path "/$tdir/d2/a/b/c/new_file" $FSNAME $FID --link 1 + check_path "/$tdir/d2/p/q/r/hlink" $DIR $FID --link 0 + # hardlink count: check that there are 2 links + # Doesnt work with CMD yet: 17935 + ${LFS} fid2path $DIR $FID | wc -l | grep -q 2 || \ + err17935 "expected 2 links" + + # hardlink indexing: remove the first link rm $DIR/$tdir/d2/p/q/r/hlink - check_path "/$tdir/d2/a/b/c/new_file" ${mds1_svc} $FID --link 0 - # Doesnt work with CMD yet: 17935 - return 0 + check_path "/$tdir/d2/a/b/c/new_file" $DIR $FID --link 0 + + return 0 } run_test 162 "path lookup sanity" -test_154() { +test_163() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return + copytool --test $FSNAME || { skip "copytool not runnable: $?" && return; } + copytool $FSNAME & + sleep 1 + local uuid=$($LCTL get_param -n mdc.${FSNAME}-MDT0000-mdc-*.uuid) + # this proc file is temporary and linux-only + do_facet mds lctl set_param mdt.${FSNAME}-MDT0000.mdccomm=$uuid ||\ + error "kernel->userspace send failed" + kill -INT $! 
+} +run_test 163 "kernel <-> userspace comms" + +test_169() { # do directio so as not to populate the page cache log "creating a 10 Mb file" multiop $DIR/$tfile oO_CREAT:O_DIRECT:O_RDWR:w$((10*1048576))c || error "multiop failed while creating a file" @@ -6184,7 +6672,7 @@ test_154() { log "removing the temporary file" rm -rf $DIR/$tfile || error "tmp file removal failed" } -run_test 154 "parallel read and truncate should not deadlock ===" +run_test 169 "parallel read and truncate should not deadlock" test_170() { $LCTL clear # bug 18514 @@ -6207,36 +6695,116 @@ test_170() { $LCTL df $TMP/${tfile}_log_good > $TMP/${tfile}_log_good.out 2>&1 local good_line2=$(tail -n 1 $TMP/${tfile}_log_good.out | awk '{print $5}') - [ "$bad_line" ] && [ "$good_line1" ] && [ "$good_line2" ] || + [ "$bad_line" ] && [ "$good_line1" ] && [ "$good_line2" ] || error "bad_line good_line1 good_line2 are empty" - + + cat $TMP/${tfile}_log_good >> $TMP/${tfile}_logs_corrupt + cat $TMP/${tfile}_log_bad >> $TMP/${tfile}_logs_corrupt cat $TMP/${tfile}_log_good >> $TMP/${tfile}_logs_corrupt - cat $TMP/${tfile}_log_bad >> $TMP/${tfile}_logs_corrupt - cat $TMP/${tfile}_log_good >> $TMP/${tfile}_logs_corrupt $LCTL df $TMP/${tfile}_logs_corrupt > $TMP/${tfile}_log_bad.out 2>&1 local bad_line_new=$(tail -n 1 $TMP/${tfile}_log_bad.out | awk '{print $9}') local good_line_new=$(tail -n 1 $TMP/${tfile}_log_bad.out | awk '{print $5}') - [ "$bad_line_new" ] && [ "$good_line_new" ] || + [ "$bad_line_new" ] && [ "$good_line_new" ] || error "bad_line_new good_line_new are empty" - + local expected_good=$((good_line1 + good_line2*2)) rm -f $TMP/${tfile}* if [ $bad_line -ne $bad_line_new ]; then error "expected $bad_line bad lines, but got $bad_line_new" - return 1 + return 1 fi if [ $expected_good -ne $good_line_new ]; then error "expected $expected_good good lines, but got $good_line_new" - return 2 + return 2 fi true } run_test 170 "test lctl df to handle corrupted log =====================" +test_171() { # 
bug20592 +#define OBD_FAIL_PTLRPC_DUMP_LOG 0x50e + $LCTL set_param fail_loc=0x50e + $LCTL set_param fail_val=3000 + multiop_bg_pause $DIR/$tfile Os || true + # cause log dump + sleep 3 + if dmesg | grep "recursive fault"; then + error "caught a recursive fault" + fi + $LCTL set_param fail_loc=0 + true +} +run_test 171 "test libcfs_debug_dumplog_thread stuck in do_exit() ======" + +# it would be good to share it with obdfilter-survey/libecho code +setup_obdecho_osc () { + local rc=0 + local ost_nid=$1 + local obdfilter_name=$2 + [ $rc -eq 0 ] && { $LCTL attach osc ${obdfilter_name}_osc \ + ${obdfilter_name}_osc_UUID || rc=2; } + [ $rc -eq 0 ] && { $LCTL --device ${obdfilter_name}_osc setup \ + ${obdfilter_name}_UUID $ost_nid || rc=3; } + return $rc +} + +cleaup_obdecho_osc () { + local obdfilter_name=$1 + $LCTL --device ${obdfilter_name}_osc cleanup >/dev/null + $LCTL --device ${obdfilter_name}_osc detach >/dev/null + return 0 +} + +obdecho_create_test() { + local OBD=$1 + local node=$2 + local rc=0 + do_facet $node "$LCTL attach echo_client ec ec_uuid" || rc=1 + [ $rc -eq 0 ] && { do_facet $node "$LCTL --device ec setup $OBD" || \ + rc=2; } + [ $rc -eq 0 ] && { do_facet $node "$LCTL --device ec create 1" || \ + rc=3; } + [ $rc -eq 0 ] && { do_facet $node "$LCTL --device ec test_brw 0 w 1" ||\ + rc=4; } + [ $rc -eq 0 -o $rc -gt 2 ] && { do_facet $node "$LCTL --device ec " \ + "cleanup" || rc=5; } + [ $rc -eq 0 -o $rc -gt 1 ] && { do_facet $node "$LCTL --device ec " \ + "detach" || rc=6; } + return $rc +} + +test_180() { + local rc=0 + local rmmod_local=0 + local rmmod_remote=0 + + lsmod | grep -q obdecho || \ + { load_module obdecho/obdecho && rmmod_local=1; } + OBD=$($LCTL dl | grep -v mdt | grep osc | awk '{print $4;exit}') + HOST=$($LCTL dl -t | grep -v mdt | grep osc | awk '{print $7;exit}') + OBD=`echo $OBD | sed 's/-osc-.*$//'` + [ "x$OBD" != "x" ] && { setup_obdecho_osc $HOST $OBD || rc=1; } || rc=1 + [ $rc -eq 0 ] && { obdecho_create_test ${OBD}_osc client 
|| rc=2; } + [ "x$OBD" != "x" ] && cleaup_obdecho_osc $OBD + [ $rmmod_local -eq 1 ] && rmmod obdecho + [ $rc -eq 0 ] || return $rc + + do_facet ost "lsmod | grep -q obdecho || " \ + "{ insmod ${LUSTRE}/obdecho/obdecho.ko || " \ + "modprobe obdecho; }" && rmmod_remote=1 + OBD=$(do_facet ost $LCTL dl | awk '/obdfilter/ {print $4;exit}') + [ "x$OBD" != "x" ] && { obdecho_create_test $OBD ost || rc=3; } + [ $rmmod_remote -eq 1 ] && do_facet ost "rmmod obdecho" + [ $rc -eq 0 ] || return $rc + + true +} +run_test 180 "test obdecho ============================================" + # OST pools tests POOL=${POOL:-cea1} TGT_COUNT=$OSTCOUNT @@ -6266,20 +6834,27 @@ check_file_in_pool() return 0 } +trap "cleanup_pools $FSNAME" EXIT + test_200a() { remote_mgs_nodsh && skip "remote MGS with nodsh" && return - do_facet mgs $LCTL pool_new $FSNAME.$POOL - # get param should return err until pool is created - wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL 2>/dev/null || echo foo" "" || error "Pool creation of $POOL failed" + create_pool $FSNAME.$POOL || return $? 
+ [ $($LFS pool_list $FSNAME | grep -c $POOL) -eq 1 ] || + error "$POOL not in lfs pool_list" } run_test 200a "Create new pool ==========================================" test_200b() { remote_mgs_nodsh && skip "remote MGS with nodsh" && return - TGT=$(for i in `seq $TGTPOOL_FIRST $TGTPOOL_STEP $TGTPOOL_MAX`; do printf "$FSNAME-OST%04x_UUID " $i; done) + TGT=$(for i in $TGTPOOL_LIST; do printf "$FSNAME-OST%04x_UUID " $i; done) do_facet mgs $LCTL pool_add $FSNAME.$POOL \ $FSNAME-OST[$TGTPOOL_FIRST-$TGTPOOL_MAX/$TGTPOOL_STEP] - wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL | sort -u | tr '\n' ' ' " "$TGT" || error "Add to pool failed" + wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL | sort -u | tr '\n' ' ' " "$TGT" || + error "Add to pool failed" + local lfscount=$($LFS pool_list $FSNAME.$POOL | grep -c "\-OST") + local addcount=$((($TGTPOOL_MAX - $TGTPOOL_FIRST) / $TGTPOOL_STEP + 1)) + [ $lfscount -eq $addcount ] || + error "lfs pool_list bad ost count $lfscount != $addcount" } run_test 200b "Add targets to a pool ====================================" @@ -6293,8 +6868,8 @@ run_test 200c "Set pool on a directory =================================" test_200d() { remote_mgs_nodsh && skip "remote MGS with nodsh" && return - res=$($GETSTRIPE $POOL_DIR | grep pool: | cut -f8 -d " ") - [ "$res" = $POOL ] || error "Pool on $POOL_DIR is not $POOL" + res=$($GETSTRIPE --pool $POOL_DIR | awk '/^pool:/ {print $2}') + [ "$res" = $POOL ] || error "Pool on $POOL_DIR is $res, not $POOL" } run_test 200d "Check pool on a directory ===============================" @@ -6335,33 +6910,60 @@ run_test 200f "Create files in a pool ===================================" test_200g() { remote_mgs_nodsh && skip "remote MGS with nodsh" && return + TGT=$($LCTL get_param -n lov.$FSNAME-clilov-*.pools.$POOL | tr '\n' ' ') + res=$($LFS df --pool $FSNAME.$POOL | awk '{print $1}' | grep "$FSNAME-OST" | tr '\n' ' ') + [ "$res" = "$TGT" ] || error "Pools OSTs '$TGT' 
is not '$res' that lfs df reports" +} +run_test 200g "lfs df a pool ============================================" + +test_201a() { + remote_mgs_nodsh && skip "remote MGS with nodsh" && return TGT=$($LCTL get_param -n lov.$FSNAME-*.pools.$POOL | head -1) do_facet mgs $LCTL pool_remove $FSNAME.$POOL $TGT - wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL | grep $TGT" "" || error "$TGT not removed from $FSNAME.$POOL" + wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL | grep $TGT" "" || + error "$TGT not removed from $FSNAME.$POOL" } -run_test 200g "Remove a target from a pool =============================" +run_test 201a "Remove a target from a pool =============================" -test_200h() { +test_201b() { remote_mgs_nodsh && skip "remote MGS with nodsh" && return for TGT in $($LCTL get_param -n lov.$FSNAME-*.pools.$POOL | sort -u) do do_facet mgs $LCTL pool_remove $FSNAME.$POOL $TGT done - wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL" ""\ - || error "Pool $FSNAME.$POOL cannot be drained" - # striping on an empty pool should fall back to "pool of everything" - $SETSTRIPE -p $POOL ${POOL_FILE}/$tfile || error "failed to create file with empty pool" + wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL" "" || + error "Pool $FSNAME.$POOL cannot be drained" + # striping on an empty/nonexistant pool should fall back to "pool of everything" + touch ${POOL_DIR}/$tfile || error "failed to use fallback striping for empty pool" + # setstripe on an empty pool should fail + $SETSTRIPE -p $POOL ${POOL_FILE}/$tfile 2>/dev/null && \ + error "expected failure when creating file with empty pool" + return 0 } -run_test 200h "Remove all targets from a pool ==========================" +run_test 201b "Remove all targets from a pool ==========================" -test_200i() { +test_201c() { remote_mgs_nodsh && skip "remote MGS with nodsh" && return do_facet mgs $LCTL pool_destroy $FSNAME.$POOL + + sleep 2 + # 
striping on an empty/nonexistant pool should fall back to "pool of everything" + touch ${POOL_DIR}/$tfile || error "failed to use fallback striping for missing pool" + # setstripe on an empty pool should fail + $SETSTRIPE -p $POOL ${POOL_FILE}/$tfile 2>/dev/null && \ + error "expected failure when creating file with missing pool" + # get param should return err once pool is gone - wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL 2>/dev/null || echo foo" "foo" && return 0 + if wait_update $HOSTNAME "lctl get_param -n lov.$FSNAME-*.pools.$POOL 2>/dev/null || + echo foo" "foo"; then + remove_pool_from_list $FSNAME.$POOL + return 0 + fi error "Pool $FSNAME.$POOL is not destroyed" } -run_test 200i "Remove a pool ============================================" +run_test 201c "Remove a pool ============================================" + +cleanup_pools $FSNAME test_212() { size=`date +%s` @@ -6383,6 +6985,184 @@ test_213() { } run_test 213 "OSC lock completion and cancel race don't crash - bug 18829" +test_214() { # for bug 20133 + mkdir -p $DIR/d214p/d214c + for (( i=0; i < 340; i++ )) ; do + touch $DIR/d214p/d214c/a$i + done + + ls -l $DIR/d214p || error "ls -l $DIR/d214p failed" + mv $DIR/d214p/d214c $DIR/ || error "mv $DIR/d214p/d214c $DIR/ failed" + ls $DIR/d214c || error "ls $DIR/d214c failed" + rm -rf $DIR/d214* || error "rm -rf $DIR/d214* failed" +} +run_test 214 "hash-indexed directory test - bug 20133" + +# having "abc" as 1st arg, creates $TMP/lnet_abc.out and $TMP/lnet_abc.sys +create_lnet_proc_files() { + cat /proc/sys/lnet/$1 >$TMP/lnet_$1.out || error "cannot read /proc/sys/lnet/$1" + sysctl lnet.$1 >$TMP/lnet_$1.sys_tmp || error "cannot read lnet.$1" + + sed "s/^lnet.$1\ =\ //g" "$TMP/lnet_$1.sys_tmp" >$TMP/lnet_$1.sys + rm -f "$TMP/lnet_$1.sys_tmp" +} + +# counterpart of create_lnet_proc_files +remove_lnet_proc_files() { + rm -f $TMP/lnet_$1.out $TMP/lnet_$1.sys +} + +# uses 1st arg as trailing part of filename, 2nd arg as description for 
# Validate a snapshot file that must consist of exactly one line.
#
# Arguments:
#   $1 - trailing part of the file name ($TMP/lnet_$1 is examined)
#   $2 - description used in failure reports
#   $3 - extended regexp the line has to match
# Globals: TMP (read)
check_lnet_proc_stats() {
	local file="$TMP/lnet_$1"
	local l

	l=$(wc -l <"$file")
	# error is called from a brace group rather than a subshell, so that
	# whatever it does to the shell (variables, exit) reaches the caller,
	# and it is reported even if dumping the file fails
	[ "$l" -eq 1 ] || { cat "$file"; error "$2 is not of 1 line: $l"; }

	grep -E "$3" "$file" || { cat "$file"; error "$2 misformatted"; }
}

# Validate a snapshot file made of one or two header lines and a body.
#
# Arguments:
#   $1 - trailing part of the file name ($TMP/lnet_$1 is examined)
#   $2 - description used in failure reports
#   $3 - extended regexp every body line has to match
#   $4 - extended regexp for the 1st line
#   $5 - optional extended regexp for the 2nd line (lnet.routes case)
# Globals: TMP (read)
check_lnet_proc_entry() {
	local file="$TMP/lnet_$1"
	local blp=2	# blp stands for 'position of 1st line of body'
	local l

	[ -z "$5" ] || blp=3	# lnet.routes case

	l=$(wc -l <"$file")
	# subtracting one from $blp because the body can be empty
	[ "$l" -ge $((blp - 1)) ] ||
		{ cat "$file"; error "$2 is too short: $l"; }

	sed -n '1p' "$file" | grep -qE "$4" ||
		{ cat "$file"; error "1st line of $2 misformatted"; }

	if [ -n "$5" ]; then
		sed -n '2p' "$file" | grep -qE "$5" ||
			{ cat "$file"; error "2nd line of $2 misformatted"; }
	fi

	# bail out if any unexpected line happened: grep -v succeeds (and
	# prints the offending lines) only when some body line does not match.
	# Testing the pipeline directly keeps its non-zero "all lines fine"
	# status from ever being treated as a failure under set -e.
	if sed -n "${blp},\$p" "$file" | grep -Ev "$3"; then
		error "$2 misformatted"
	fi
}

# Bugs 18102, 21079, 21517: /proc/sys/lnet exists and has proper content.
#
# For each of stats, routes, routers, peers, buffers and nis the entry is
# read both from /proc/sys/lnet and through sysctl, and both copies are
# matched against the expected header/body layout.  Finally both interfaces
# are checked for accepting a write to lnet stats.
test_215() { # for bugs 18102, 21079, 21517
	local N='(0|[1-9][0-9]*)'	# non-negative numeric
	local P='[1-9][0-9]*'		# positive numeric
	local I='(0|-?[1-9][0-9]*)'	# any numeric (0 | >0 | <0)
	local NET='[a-z][a-z0-9]*'	# LNET net like o2ib2
	local ADDR='[0-9.]+'		# LNET addr like 10.0.0.1
	local NID="$ADDR@$NET"		# LNET nid like 10.0.0.1@o2ib2

	local L1	# regexp for 1st line
	local L2	# regexp for 2nd line (optional)
	local BR	# regexp for the rest (body)

	# /proc/sys/lnet/stats should look as 11 space-separated non-negative numerics
	BR="^$N $N $N $N $N $N $N $N $N $N $N$"
	create_lnet_proc_files "stats"
	check_lnet_proc_stats "stats.out" "/proc/sys/lnet/stats" "$BR"
	check_lnet_proc_stats "stats.sys" "lnet.stats" "$BR"
	remove_lnet_proc_files "stats"

	# /proc/sys/lnet/routes should look like this:
	# Routing disabled/enabled
	# net hops state router
	# where net is a string like tcp0, hops >= 0, state is up/down,
	# router is a string like 192.168.1.1@tcp2
	L1="^Routing (disabled|enabled)$"
	L2="^net +hops +state +router$"
	BR="^$NET +$N +(up|down) +$NID$"
	create_lnet_proc_files "routes"
	check_lnet_proc_entry "routes.out" "/proc/sys/lnet/routes" "$BR" "$L1" "$L2"
	check_lnet_proc_entry "routes.sys" "lnet.routes" "$BR" "$L1" "$L2"
	remove_lnet_proc_files "routes"

	# /proc/sys/lnet/routers should look like this:
	# ref rtr_ref alive_cnt state last_ping ping_sent deadline down_ni router
	# where ref > 0, rtr_ref > 0, alive_cnt >= 0, state is up/down,
	# last_ping >= 0, ping_sent is boolean (0/1), deadline and down_ni are
	# numeric (0 or >0 or <0), router is a string like 192.168.1.1@tcp2
	L1="^ref +rtr_ref +alive_cnt +state +last_ping +ping_sent +deadline +down_ni +router$"
	BR="^$P +$P +$N +(up|down) +$N +(0|1) +$I +$I +$NID$"
	create_lnet_proc_files "routers"
	check_lnet_proc_entry "routers.out" "/proc/sys/lnet/routers" "$BR" "$L1"
	check_lnet_proc_entry "routers.sys" "lnet.routers" "$BR" "$L1"
	remove_lnet_proc_files "routers"

	# /proc/sys/lnet/peers should look like this:
	# nid refs state max rtr min tx min queue
	# where nid is a string like 192.168.1.1@tcp2, refs > 0,
	# state is up/down/NA, max >= 0. rtr, min, tx, min are
	# numeric (0 or >0 or <0), queue >= 0.
	L1="^nid +refs +state +max +rtr +min +tx +min +queue$"
	BR="^$NID +$P +(up|down|NA) +$N +$I +$I +$I +$I +$N$"
	create_lnet_proc_files "peers"
	check_lnet_proc_entry "peers.out" "/proc/sys/lnet/peers" "$BR" "$L1"
	check_lnet_proc_entry "peers.sys" "lnet.peers" "$BR" "$L1"
	remove_lnet_proc_files "peers"

	# /proc/sys/lnet/buffers should look like this:
	# pages count credits min
	# where pages >=0, count >=0, credits and min are numeric (0 or >0 or <0)
	L1="^pages +count +credits +min$"
	BR="^ +$N +$N +$I +$I$"
	create_lnet_proc_files "buffers"
	check_lnet_proc_entry "buffers.out" "/proc/sys/lnet/buffers" "$BR" "$L1"
	check_lnet_proc_entry "buffers.sys" "lnet.buffers" "$BR" "$L1"
	remove_lnet_proc_files "buffers"

	# /proc/sys/lnet/nis should look like this:
	# nid status alive refs peer rtr max tx min
	# where nid is a string like 192.168.1.1@tcp2, status is up/down,
	# alive is numeric (0 or >0 or <0), refs > 0, peer >= 0,
	# rtr >= 0, max >=0, tx and min are numeric (0 or >0 or <0).
	L1="^nid +status +alive +refs +peer +rtr +max +tx +min$"
	BR="^$NID +(up|down) +$I +$P +$N +$N +$N +$I +$I$"
	create_lnet_proc_files "nis"
	check_lnet_proc_entry "nis.out" "/proc/sys/lnet/nis" "$BR" "$L1"
	check_lnet_proc_entry "nis.sys" "lnet.nis" "$BR" "$L1"
	remove_lnet_proc_files "nis"

	# can we successfully write to /proc/sys/lnet/stats?
	echo "0" >/proc/sys/lnet/stats || error "cannot write to /proc/sys/lnet/stats"
	sysctl -w lnet.stats=0 || error "cannot write to lnet.stats"
}
run_test 215 "/proc/sys/lnet exists and has proper content - bugs 18102, 21079, 21517"

# Bug 20317: check lockless direct write works and updates file size and kms
# correctly.
#
# The contention/lockless tunables of the client and of every node listed by
# osts_nodes are saved to a parameter file, switched to aggressive lockless
# i/o for a direct write, switched to "lockless disabled" for a truncating
# dd, and restored from the parameter file at the end.  A failed step is
# remembered and reported only after the tunables have been restored, so a
# failure does not leave the modified settings behind.
#
# Globals: TMP, TESTNAME, HOSTNAME, DIR, tfile, DIRECTIO, CHECKSTAT (read)
test_216() { # bug 20317
	local node
	local p="$TMP/sanityN-$TESTNAME.parameters"
	local failure=""	# first failed step, reported after cleanup

	save_lustre_params "$HOSTNAME" "osc.*.contention_seconds" >"$p"
	for node in $(osts_nodes); do
		save_lustre_params "$node" "ldlm.namespaces.filter-*.max_nolock_bytes" >>"$p"
		save_lustre_params "$node" "ldlm.namespaces.filter-*.contended_locks" >>"$p"
		save_lustre_params "$node" "ldlm.namespaces.filter-*.contention_seconds" >>"$p"
	done
	clear_osc_stats

	# aggressive lockless i/o settings
	for node in $(osts_nodes); do
		do_node "$node" 'lctl set_param -n ldlm.namespaces.filter-*.max_nolock_bytes 2000000; lctl set_param -n ldlm.namespaces.filter-*.contended_locks 0; lctl set_param -n ldlm.namespaces.filter-*.contention_seconds 60'
	done
	# the pattern is quoted so that lctl, not the local shell, expands it
	lctl set_param -n "osc.*.contention_seconds" 60

	# $DIRECTIO and $CHECKSTAT stay unquoted: they may carry options.
	# The expected size 40960 equals 10 * 4096, matching the arguments
	# passed to the direct write.
	$DIRECTIO write "$DIR/$tfile" 0 10 4096 ||
		failure="direct write to $DIR/$tfile failed"
	$CHECKSTAT -s 40960 "$DIR/$tfile" ||
		failure=${failure:-"$DIR/$tfile size is not 40960 after direct write"}

	# disable lockless i/o
	for node in $(osts_nodes); do
		do_node "$node" 'lctl set_param -n ldlm.namespaces.filter-*.max_nolock_bytes 0; lctl set_param -n ldlm.namespaces.filter-*.contended_locks 32; lctl set_param -n ldlm.namespaces.filter-*.contention_seconds 0'
	done
	lctl set_param -n "osc.*.contention_seconds" 0
	clear_osc_stats

	dd if=/dev/zero of="$DIR/$tfile" count=0 ||
		failure=${failure:-"dd truncation of $DIR/$tfile failed"}
	$CHECKSTAT -s 0 "$DIR/$tfile" ||
		failure=${failure:-"$DIR/$tfile size is not 0 after truncation"}

	restore_lustre_params <"$p"
	rm -f "$p"
	rm "$DIR/$tfile" ||
		failure=${failure:-"cannot remove $DIR/$tfile"}

	[ -z "$failure" ] || error "$failure"
}
run_test 216 "check lockless direct write works and updates file size and kms correctly"

#
# tests that do cleanup/setup should be run at the end
#