X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Ftests%2Fsanity.sh;h=16546255fe167635e7d7482735fe49626eb5848e;hp=f9371d6d73e3fa54cc79f4451da8de228f3b8c2e;hb=e240fb5099af8e62c532d314317095800ebb6864;hpb=bcb95d6b82f4208998201cc12f63fc1074c3003c diff --git a/lustre/tests/sanity.sh b/lustre/tests/sanity.sh index f9371d6..1654625 100755 --- a/lustre/tests/sanity.sh +++ b/lustre/tests/sanity.sh @@ -8,13 +8,13 @@ set -e ONLY=${ONLY:-"$*"} -# bug number for skipped test: 13297 2108 9789 3637 9789 3561 12622 5188 -ALWAYS_EXCEPT=" 42a 42b 42c 42d 45 51d 68b $SANITY_EXCEPT" +# bug number for skipped test: 13297 2108 9789 3637 9789 3561 5188 +ALWAYS_EXCEPT=" 42a 42b 42c 42d 45 68b $SANITY_EXCEPT" # UPDATE THE COMMENT ABOVE WITH BUG NUMBERS WHEN CHANGING ALWAYS_EXCEPT! # with LOD/OSP landing -# bug number for skipped tests: LU-2036 -ALWAYS_EXCEPT=" 76 $ALWAYS_EXCEPT" +# bug number for skipped tests: LU-2036 LU-8139 +ALWAYS_EXCEPT=" 76 101g $ALWAYS_EXCEPT" is_sles11() # LU-4341 { @@ -75,12 +75,14 @@ init_test_env $@ . 
${CONFIG:=$LUSTRE/tests/cfg/${NAME}.sh} init_logging -[ "$SLOW" = "no" ] && EXCEPT_SLOW="24o 24D 27m 64b 68 71 77f 78 115 124b 300o" +# 5 12 (min)" +[ "$SLOW" = "no" ] && EXCEPT_SLOW="24D 27m 64b 68 71 115 300o" if [ $(facet_fstype $SINGLEMDS) = "zfs" ]; then - # bug number for skipped test: LU-4536 LU-1957 LU-2805 - ALWAYS_EXCEPT="$ALWAYS_EXCEPT 65ic 180 184c" - [ "$SLOW" = "no" ] && EXCEPT_SLOW="$EXCEPT_SLOW 51b 51ba" + # bug number for skipped test: LU-4536 LU-1957 + ALWAYS_EXCEPT="$ALWAYS_EXCEPT 65ic 180" + # 13 (min)" + [ "$SLOW" = "no" ] && EXCEPT_SLOW="$EXCEPT_SLOW 51b" fi FAIL_ON_ERROR=false @@ -105,7 +107,6 @@ check_swap_layouts_support() } check_and_setup_lustre - DIR=${DIR:-$MOUNT} assert_DIR @@ -263,6 +264,21 @@ test_6g() { test_mkdir $DIR/$tdir/d/subdir || error "mkdir $tdir/d/subdir failed" $CHECKSTAT -g \#$RUNAS_GID $DIR/$tdir/d/subdir || error "$tdir/d/subdir should be GID $RUNAS_GID" + if [[ $MDSCOUNT -gt 1 ]]; then + # check remote dir sgid inherite + $LFS mkdir -i 0 $DIR/$tdir.local || + error "mkdir $tdir.local failed" + chmod g+s $DIR/$tdir.local || + error "chmod $tdir.local failed" + chgrp $RUNAS_GID $DIR/$tdir.local || + error "chgrp $tdir.local failed" + $LFS mkdir -i 1 $DIR/$tdir.local/$tdir.remote || + error "mkdir $tdir.remote failed" + $CHECKSTAT -g \#$RUNAS_GID $DIR/$tdir.local/$tdir.remote || + error "$tdir.remote should be owned by $UID.$RUNAS_ID" + $CHECKSTAT -p 02755 $DIR/$tdir.local/$tdir.remote || + error "$tdir.remote should be mode 02755" + fi } run_test 6g "Is new dir in sgid dir inheriting group?" 
@@ -1016,7 +1032,9 @@ test_24u() { # bug12192 run_test 24u "create stripe file" page_size() { - getconf PAGE_SIZE + local size + size=$(getconf PAGE_SIZE 2>/dev/null) + echo -n ${size:-4096} } simple_cleanup_common() { @@ -1647,7 +1665,7 @@ test_27u() { # bug 4900 createmany -o $DIR/$tdir/t- 1000 do_nodes $list $LCTL set_param fail_loc=0 - TLOG=$DIR/$tfile.getstripe + TLOG=$TMP/$tfile.getstripe $GETSTRIPE $DIR/$tdir > $TLOG OBJS=$(awk -vobj=0 '($1 == 0) { obj += 1 } END { print obj; }' $TLOG) unlinkmany $DIR/$tdir/t- 1000 @@ -2020,6 +2038,8 @@ run_test 27C "check full striping across all OSTs" test_27D() { [ $OSTCOUNT -lt 2 ] && skip "needs >= 2 OSTs" && return + [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return local POOL=${POOL:-testpool} local first_ost=0 local last_ost=$(($OSTCOUNT - 1)) @@ -2030,8 +2050,13 @@ test_27D() { test_mkdir -p $DIR/$tdir pool_add $POOL || error "pool_add failed" pool_add_targets $POOL $ost_range || error "pool_add_targets failed" - llapi_layout_test -d$DIR/$tdir -p$POOL -o$OSTCOUNT || + + local skip27D + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.7.64) ] && + skip27D = "-s 29" + llapi_layout_test -d$DIR/$tdir -p$POOL -o$OSTCOUNT $skip27D || error "llapi_layout_test failed" + cleanup_pools || error "cleanup_pools failed" } run_test 27D "validate llapi_layout API" @@ -2040,6 +2065,8 @@ run_test 27D "validate llapi_layout API" # accessing a widely striped file. 
test_27E() { [ $OSTCOUNT -lt 2 ] && skip "needs >= 2 OSTs" && return + [ $(lustre_version_code client) -lt $(version_code 2.5.57) ] && + skip "client does not have LU-3338 fix" && return # 72 bytes is the minimum space required to store striping # information for a file striped across one OST: @@ -2065,6 +2092,46 @@ test_27E() { } run_test 27E "check that default extended attribute size properly increases" +test_27F() { # LU-5346/LU-7975 + + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + + [[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.8.51) ]] && + skip "Need MDS version at least 2.8.51" && return + + test_mkdir -p $DIR/$tdir + rm -f $DIR/$tdir/f0 + $SETSTRIPE -c 2 $DIR/$tdir + + # stop all OSTs to reproduce situation for LU-7975 ticket + for num in $(seq $OSTCOUNT); do + stop ost$num + done + + # open/create f0 with O_LOV_DELAY_CREATE + # truncate f0 to a non-0 size + # close + multiop $DIR/$tdir/f0 oO_RDWR:O_CREAT:O_LOV_DELAY_CREATE:T1050000c + + $CHECKSTAT -s 1050000 $DIR/$tdir/f0 || error "checkstat failed" + # open/write it again to force delayed layout creation + cat /etc/hosts > $DIR/$tdir/f0 & + catpid=$! 
+ + # restart OSTs + for num in $(seq $OSTCOUNT); do + start ost$num $(ostdevname $num) $OST_MOUNT_OPTS || + error "ost$num failed to start" + done + + wait $catpid || error "cat failed" + + cmp /etc/hosts $DIR/$tdir/f0 || error "cmp failed" + [[ $($GETSTRIPE -c $DIR/$tdir/f0) == 2 ]] || error "wrong stripecount" + +} +run_test 27F "Client resend delayed layout creation with non-zero size" + # createtest also checks that device nodes are created and # then visible correctly (#2091) test_28() { # bug 2091 @@ -2074,8 +2141,9 @@ test_28() { # bug 2091 run_test 28 "create/mknod/mkdir with bad file types ============" test_29() { - [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - cancel_lru_locks mdc + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return 0 + sync; sleep 1; sync # flush out any dirty pages from previous tests + cancel_lru_locks test_mkdir $DIR/d29 touch $DIR/d29/foo log 'first d29' @@ -2085,7 +2153,7 @@ test_29() { for lock_count in $(lctl get_param -n ldlm.namespaces.*mdc*.lock_count); do let LOCKCOUNTORIG=$LOCKCOUNTORIG+$lock_count done - [ $LOCKCOUNTORIG -eq 0 ] && echo "No mdc lock count" && return 1 + [ $LOCKCOUNTORIG -eq 0 ] && error "No mdc lock count" && return 1 declare -i LOCKUNUSEDCOUNTORIG=0 for unused_count in $(lctl get_param -n ldlm.namespaces.*mdc*.lock_unused_count); do @@ -2356,8 +2424,13 @@ test_31p() { run_test 31p "remove of open striped directory" cleanup_test32_mount() { + local rc=0 trap 0 - $UMOUNT $DIR/$tdir/ext2-mountpoint + local loopdev=$(losetup -a | grep $EXT2_DEV | sed -ne 's/:.*$/p') + $UMOUNT $DIR/$tdir/ext2-mountpoint || rc=$? + losetup -d $loopdev || true + rm -rf $DIR/$tdir/ext2-mountpoint + return $rc } test_32a() { @@ -2563,8 +2636,13 @@ test_32p() { run_test 32p "open d32p/symlink->tmp/symlink->lustre-root/$tfile" cleanup_testdir_mount() { + local rc=0 trap 0 - $UMOUNT $DIR/$tdir + local loopdev=$(losetup -a | grep $EXT2_DEV | sed -ne 's/:.*$/p') + $UMOUNT $DIR/$tdir || rc=$? 
+ losetup -d $loopdev || true + rm -rf $DIR/$tdir + return $rc } test_32q() { @@ -2764,6 +2842,7 @@ cleanup_33f() { test_33f() { [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return mkdir $DIR/$tdir chmod go+rwx $DIR/$tdir @@ -2786,6 +2865,15 @@ test_33f() { } run_test 33f "nonroot user can create, access, and remove a striped directory" +test_33g() { + mkdir -p $DIR/$tdir/dir2 + + local err=$($RUNAS mkdir $DIR/$tdir/dir2 2>&1) + echo $err + [[ $err =~ "exists" ]] || error "Not exists error" +} +run_test 33g "nonroot user create already existing root created file" + TEST_34_SIZE=${TEST_34_SIZE:-2000000000000} test_34a() { rm -f $DIR/f34 @@ -3039,7 +3127,7 @@ test_38() { } run_test 38 "open a regular file with O_DIRECTORY should return -ENOTDIR ===" -test_39() { +test_39a() { # was test_39 touch $DIR/$tfile touch $DIR/${tfile}2 # ls -l $DIR/$tfile $DIR/${tfile}2 @@ -3057,7 +3145,7 @@ test_39() { error "O_TRUNC didn't change timestamps" fi } -run_test 39 "mtime changed on create ===========================" +run_test 39a "mtime changed on create ===========================" test_39b() { test_mkdir -p -c1 $DIR/$tdir @@ -3332,29 +3420,27 @@ test_39l() { # test setting directory atime to future touch -a -d @$TEST_39_ATIME $DIR/$tdir local atime=$(stat -c %X $DIR/$tdir) - [ "$atime" = $TEST_39_ATIME ] || \ + [ "$atime" = $TEST_39_ATIME ] || error "atime is not set to future: $atime, $TEST_39_ATIME" # test setting directory atime from future to now - local d1=$(date +%s) - ls $DIR/$tdir - local d2=$(date +%s) + local now=$(date +%s) + touch -a -d @$now $DIR/$tdir - cancel_lru_locks mdc atime=$(stat -c %X $DIR/$tdir) - [ "$atime" -ge "$d1" -a "$atime" -le "$d2" ] || \ - error "atime is not updated from future: $atime, $d1 dir atime + atime_diff - d1=$(date +%s) + local d1=$(date +%s) ls $DIR/$tdir - d2=$(date +%s) + local d2=$(date +%s) cancel_lru_locks mdc atime=$(stat -c %X $DIR/$tdir) - [ "$atime" -ge "$d1" 
-a "$atime" -le "$d2" ] || \ + [ "$atime" -ge "$d1" -a "$atime" -le "$d2" ] || error "atime is not updated : $atime, should be $d2" do_facet $SINGLEMDS lctl set_param -n mdd.*MDT0000*.atime_diff=60 @@ -3364,7 +3450,7 @@ test_39l() { ls $DIR/$tdir cancel_lru_locks mdc atime=$(stat -c %X $DIR/$tdir) - [ "$atime" -ge "$d1" -a "$atime" -le "$d2" ] || \ + [ "$atime" -ge "$d1" -a "$atime" -le "$d2" ] || error "atime is updated to $atime, should remain $d1 /dev/null } -run_test 44 "zero length read from a sparse stripe =============" +run_test 44A "zero length read from a sparse stripe =============" test_44a() { local nstripe=$($LCTL lov_getconfig $DIR | grep default_stripe_count: | @@ -3902,7 +4001,6 @@ test_48b() { # bug 2399 test_mkdir .foo && error "'mkdir .foo' worked after removing cwd" ls . > /dev/null && error "'ls .' worked after removing cwd" ls .. > /dev/null || error "'ls ..' failed after removing cwd" - is_patchless || ( cd . && error "'cd .' worked after removing cwd" ) test_mkdir . && error "'mkdir .' worked after removing cwd" rmdir . && error "'rmdir .' worked after removing cwd" ln -s . foo && error "'ln -s .' worked after removing cwd" @@ -3923,8 +4021,6 @@ test_48c() { # bug 2350 test_mkdir .foo && error "mkdir .foo worked after removing cwd" $TRACE ls . && error "'ls .' worked after removing cwd" $TRACE ls .. || error "'ls ..' failed after removing cwd" - is_patchless || ( $TRACE cd . && - error "'cd .' worked after removing cwd" ) $TRACE test_mkdir . && error "'mkdir .' worked after removing cwd" $TRACE rmdir . && error "'rmdir .' worked after removing cwd" $TRACE ln -s . foo && error "'ln -s .' worked after removing cwd" @@ -3946,13 +4042,10 @@ test_48d() { # bug 2350 test_mkdir .foo && error "mkdir .foo worked after removing parent" $TRACE ls . && error "'ls .' worked after removing parent" $TRACE ls .. && error "'ls ..' worked after removing parent" - is_patchless || ( $TRACE cd . && - error "'cd .' 
worked after recreate parent" ) $TRACE test_mkdir . && error "'mkdir .' worked after removing parent" $TRACE rmdir . && error "'rmdir .' worked after removing parent" $TRACE ln -s . foo && error "'ln -s .' worked after removing parent" - is_patchless || ( $TRACE cd .. && - error "'cd ..' worked after removing parent" || true ) + true } run_test 48d "Access removed parent subdir (should return errors)" @@ -3976,6 +4069,7 @@ run_test 48e "Access to recreated parent subdir (should return errors)" test_49() { # LU-1030 [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_ost_nodsh && skip "remote OST with nodsh" && return # get ost1 size - lustre-OST0000 ost1_size=$(do_facet ost1 $LFS df | grep ${ost1_svc} | awk '{ print $4 }') @@ -4027,87 +4121,75 @@ test_51a() { # was test_51 } run_test 51a "special situations: split htree with empty entry ==" -export NUMTEST=70000 +cleanup_print_lfs_df () { + trap 0 + $LFS df + $LFS df -i +} + test_51b() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - local BASE=$DIR/d${base}.${TESTSUITE} + local dir=$DIR/$tdir + + local nrdirs=$((65536 + 100)) # cleanup the directory - rm -fr $BASE + rm -fr $dir - test_mkdir -p -c1 $BASE + test_mkdir -p -c1 $dir $LFS df $LFS df -i - local mdtidx=$(printf "%04x" $($LFS getstripe -M $BASE)) + local mdtidx=$(printf "%04x" $($LFS getstripe -M $dir)) local numfree=$(lctl get_param -n mdc.$FSNAME-MDT$mdtidx*.filesfree) - [[ $numfree -lt 21000 ]] && + [[ $numfree -lt $nrdirs ]] && skip "not enough free inodes ($numfree) on MDT$mdtidx" && return - [[ $numfree -lt $NUMTEST ]] && NUMTEST=$(($numfree - 50)) && - echo "reduced count to $NUMTEST due to inodes on MDT$mdtidx" - # need to check free space for the directories as well local blkfree=$(lctl get_param -n mdc.$FSNAME-MDT$mdtidx*.kbytesavail) - numfree=$((blkfree / 4)) - [[ $numfree -lt $NUMTEST ]] && NUMTEST=$((numfree - 50)) && - echo "reduced count to $NUMTEST due to blocks on MDT$mdtidx" - - createmany -d $BASE/d 
$NUMTEST && echo $NUMTEST > $BASE/fnum || - { - $LFS df - $LFS df -i - echo "failed" > $BASE/fnum - error "failed to create $NUMTEST subdirs in MDT$mdtidx:$BASE" - } -} -run_test 51b "exceed 64k subdirectory nlink limit" + numfree=$(( blkfree / $(fs_inode_ksize) )) + [[ $numfree -lt $nrdirs ]] && skip "not enough blocks ($numfree)" && + return -test_51ba() { # LU-993 - local BASE=$DIR/d${base}.${TESTSUITE} - # unlink all but 100 subdirectories, then check it still works - local LEFT=100 - [ -f $BASE/fnum ] && local NUMPREV=$(cat $BASE/fnum) && rm $BASE/fnum + trap cleanup_print_lfsdf EXIT + + # create files + createmany -d $dir/d $nrdirs || + error "failed to create $nrdirs subdirs in MDT$mdtidx:$dir" + + # really created : + nrdirs=$(ls -U $dir | wc -l) - [ "$NUMPREV" != "failed" ] && NUMTEST=$NUMPREV - local DELETE=$((NUMTEST - LEFT)) + # unlink all but 100 subdirectories, then check it still works + local left=100 + local delete=$((nrdirs - left)) - # continue on to run this test even if 51b didn't finish, - # just to delete the many subdirectories created. - [ ! -d "${BASE}/d1" ] && skip "test_51b() not run" && return 0 + $LFS df + $LFS df -i # for ldiskfs the nlink count should be 1, but this is OSD specific # and so this is listed for informational purposes only - echo "nlink before: $(stat -c %h $BASE), created before: $NUMTEST" - unlinkmany -d $BASE/d $DELETE - RC=$? 
+ echo "nlink before: $(stat -c %h $dir), created before: $nrdirs" + unlinkmany -d $dir/d $delete || + error "unlink of first $delete subdirs failed" - if [ $RC -ne 0 ]; then - if [ "$NUMPREV" == "failed" ]; then - skip "previous setup failed" - return 0 - else - error "unlink of first $DELETE subdirs failed" - return $RC - fi - fi + echo "nlink between: $(stat -c %h $dir)" + local found=$(ls -U $dir | wc -l) + [ $found -ne $left ] && + error "can't find subdirs: found only $found, expected $left" - echo "nlink between: $(stat -c %h $BASE)" - # trim the first line of ls output - local FOUND=$(($(ls -l ${BASE} | wc -l) - 1)) - [ $FOUND -ne $LEFT ] && - error "can't find subdirs: found only $FOUND/$LEFT" - - unlinkmany -d $BASE/d $DELETE $LEFT || - error "unlink of second $LEFT subdirs failed" + unlinkmany -d $dir/d $delete $left || + error "unlink of second $left subdirs failed" # regardless of whether the backing filesystem tracks nlink accurately # or not, the nlink count shouldn't be more than "." and ".." 
here - local AFTER=$(stat -c %h $BASE) - [[ $AFTER -gt 2 ]] && error "nlink after: $AFTER > 2" || - echo "nlink after: $AFTER" + local after=$(stat -c %h $dir) + [[ $after -gt 2 ]] && error "nlink after: $after > 2" || + echo "nlink after: $after" + + cleanup_print_lfs_df } -run_test 51ba "verify nlink for many subdirectory cleanup" +run_test 51b "exceed 64k subdirectory nlink limit on create, verify unlink" test_51d() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return @@ -4115,11 +4197,11 @@ test_51d() { skip_env "skipping test with few OSTs" && return test_mkdir -p $DIR/$tdir createmany -o $DIR/$tdir/t- 1000 - $GETSTRIPE $DIR/$tdir > $TMP/files + $GETSTRIPE $DIR/$tdir > $TMP/$tfile for N in $(seq 0 $((OSTCOUNT - 1))); do OBJS[$N]=$(awk -vobjs=0 '($1 == '$N') { objs += 1 } \ - END { printf("%0.0f", objs) }' $TMP/files) - OBJS0[$N]=$(grep -A 1 idx $TMP/files | awk -vobjs=0 \ + END { printf("%0.0f", objs) }' $TMP/$tfile) + OBJS0[$N]=$(grep -A 1 idx $TMP/$tfile | awk -vobjs=0 \ '($1 == '$N') { objs += 1 } \ END { printf("%0.0f", objs) }') log "OST$N has ${OBJS[$N]} objects, ${OBJS0[$N]} are index 0" @@ -4143,8 +4225,9 @@ test_51d() { " (${OBJS0[$N]} < ${OBJS0[$NLAST]}" NLAST=$N done + rm -f $TMP/$tfile } -run_test 51d "check object distribution ====================" +run_test 51d "check object distribution" test_51e() { if [ "$(facet_fstype $SINGLEMDS)" != ldiskfs ]; then @@ -4178,10 +4261,10 @@ test_52a() { lsattr $DIR/$tdir/foo | egrep -q "^-+a[-e]+ $DIR/$tdir/foo" || error "lsattr" chattr -a $DIR/$tdir/foo || error "chattr -a failed" - cp -r $DIR/$tdir /tmp/ - rm -fr $DIR/$tdir || error "cleanup rm failed" + cp -r $DIR/$tdir $TMP/ + rm -fr $DIR/$tdir $TMP/$tdir || error "cleanup rm failed" } -run_test 52a "append-only flag test (should return errors) =====" +run_test 52a "append-only flag test (should return errors)" test_52b() { [ -f $DIR/$tdir/foo ] && chattr -i $DIR/$tdir/foo @@ -4302,6 +4385,7 @@ find_loop_dev() { } cleanup_54c() { + local rc=0 
loopdev="$DIR/loop54c" trap 0 @@ -4376,30 +4460,47 @@ test_56a() { # was test_56 error "$GETSTRIPE $DIR/$tdir: found $FILENUM, not $NUMFILES" echo "$GETSTRIPE --recursive passed." - # test lfs getstripe with file instead of dir + # test lfs getstripe with file instead of dir FILENUM=$($GETSTRIPE $DIR/$tdir/file1 | grep -c obdidx) [[ $FILENUM -eq 1 ]] || error "$GETSTRIPE $DIR/$tdir/file1: found $FILENUM, not 1" echo "$GETSTRIPE file1 passed." - #test lfs getstripe with --verbose + #test lfs getstripe with --verbose [[ $($GETSTRIPE --verbose $DIR/$tdir | grep -c lmm_magic) -eq $NUMFILES ]] || error "$GETSTRIPE --verbose $DIR/$tdir: want $NUMFILES" [[ $($GETSTRIPE $DIR/$tdir | grep -c lmm_magic) -eq 0 ]] || - rror "$GETSTRIPE $DIR/$tdir: showed lmm_magic" + error "$GETSTRIPE $DIR/$tdir: showed lmm_magic" + + #test lfs getstripe with -v prints lmm_fid + [[ $($GETSTRIPE -v $DIR/$tdir | grep -c lmm_fid) -eq $NUMFILES ]] || + error "$GETSTRIPE -v $DIR/$tdir: want $NUMFILES lmm_fid: lines" + [[ $($GETSTRIPE $DIR/$tdir | grep -c lmm_fid) -eq 0 ]] || + error "$GETSTRIPE $DIR/$tdir: showed lmm_fid" echo "$GETSTRIPE --verbose passed." - #test lfs getstripe with --obd - $GETSTRIPE --obd wrong_uuid $DIR/$tdir 2>&1 | + #check for FID information + local fid1=$($GETSTRIPE --fid $DIR/$tdir/file1) + local fid2=$($GETSTRIPE --verbose $DIR/$tdir/file1 | + awk '/lmm_fid: / { print $2 }') + local fid3=$($LFS path2fid $DIR/$tdir/file1) + [ "$fid1" != "$fid2" ] && + error "getstripe --fid $fid1 != getstripe --verbose $fid2" + [ "$fid1" != "$fid3" ] && + error "getstripe --fid $fid1 != lfs path2fid $fid3" + echo "$GETSTRIPE --fid passed." 
+ + #test lfs getstripe with --obd + $GETSTRIPE --obd wrong_uuid $DIR/$tdir 2>&1 | grep -q "unknown obduuid" || error "$GETSTRIPE --obd wrong_uuid should return error message" [[ $OSTCOUNT -lt 2 ]] && - skip_env "skipping other $GETSTRIPE --obd test" && return + skip_env "skipping other $GETSTRIPE --obd test" && return - OSTIDX=1 - OBDUUID=$(ostuuid_from_index $OSTIDX) + OSTIDX=1 + OBDUUID=$(ostuuid_from_index $OSTIDX) FILENUM=$($GETSTRIPE -ir $DIR/$tdir | grep "^$OSTIDX\$" | wc -l) FOUND=$($GETSTRIPE -r --obd $OBDUUID $DIR/$tdir | grep obdidx | wc -l) [[ $FOUND -eq $FILENUM ]] || @@ -4412,6 +4513,26 @@ test_56a() { # was test_56 } run_test 56a "check $GETSTRIPE" +test_56b() { + test_mkdir $DIR/$tdir + NUMDIRS=3 + for i in $(seq 1 $NUMDIRS); do + test_mkdir $DIR/$tdir/dir$i + done + + # test lfs getdirstripe default mode is non-recursion, which is + # different from lfs getstripe + dircnt=$($LFS getdirstripe $DIR/$tdir | grep -c lmv_stripe_count) + [[ $dircnt -eq 1 ]] || + error "$LFS getdirstripe: found $dircnt, not 1" + dircnt=$($LFS getdirstripe --recursive $DIR/$tdir | + grep -c lmv_stripe_count) + [[ $dircnt -eq $((NUMDIRS + 1)) ]] || + error "$LFS getdirstripe --recursive: found $dircnt, \ + not $((NUMDIRS + 1))" +} +run_test 56b "check $LFS getdirstripe" + NUMFILES=3 NUMDIRS=3 setup_56() { @@ -4725,7 +4846,7 @@ run_test 56s "check lfs find -stripe-count works" test_56t() { # LU-611 TDIR=$DIR/${tdir}t - setup_56 $NUMFILES $NUMDIRS "-s 512k" + setup_56 $NUMFILES $NUMDIRS "--stripe-size 512k" $SETSTRIPE -S 256k $TDIR/$tfile.{0,1,2,3} @@ -4960,6 +5081,29 @@ test_56x() { } run_test 56x "lfs migration support" +test_56xa() { + check_swap_layouts_support && return 0 + [[ $OSTCOUNT -lt 2 ]] && + skip_env "need 2 OST, skipping test" && return + + local dir0=$DIR/$tdir/$testnum + test_mkdir -p $dir0 || error "creating dir $dir0" + + local ref1=/etc/passwd + local file1=$dir0/file1 + + $SETSTRIPE -c 2 $file1 + cp $ref1 $file1 + $LFS migrate --block -c 1 $file1 || error 
"migrate failed rc = $?" + local stripe=$($GETSTRIPE -c $file1) + [[ $stripe == 1 ]] || error "stripe of $file1 is $stripe != 1" + cmp $file1 $ref1 || error "content mismatch $file1 differs from $ref1" + + # clean up + rm -f $file1 +} +run_test 56xa "lfs migration --block support" + test_56y() { [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.4.53) ] && skip "No HSM $(lustre_build_version $SINGLEMDS) MDS < 2.4.53" && @@ -5273,6 +5417,7 @@ run_test 60d "test printk console message masking" test_60e() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return touch $DIR/$tfile #define OBD_FAIL_MDS_LLOG_CREATE_FAILED2 0x15b do_facet mds1 lctl set_param fail_loc=0x15b @@ -5505,34 +5650,59 @@ test_65k() { # bug11679 [[ $OSTCOUNT -lt 2 ]] && skip_env "too few OSTs" && return remote_mds_nodsh && skip "remote MDS with nodsh" && return - echo "Check OST status: " - local MDS_OSCS=`do_facet $SINGLEMDS lctl dl | - awk '/[oO][sS][cC].*md[ts]/ { print $4 }'` + local disable_precreate=true + [ $(lustre_version_code $SINGLEMDS) -le $(version_code 2.8.54) ] && + disable_precreate=false - for OSC in $MDS_OSCS; do - echo $OSC "is activate" - do_facet $SINGLEMDS lctl --device %$OSC activate - done + echo "Check OST status: " + local MDS_OSCS=$(do_facet $SINGLEMDS lctl dl | + awk '/[oO][sS][cC].*md[ts]/ { print $4 }') - mkdir -p $DIR/$tdir - for INACTIVE_OSC in $MDS_OSCS; do - echo "Deactivate: " $INACTIVE_OSC - do_facet $SINGLEMDS lctl --device %$INACTIVE_OSC deactivate - for STRIPE_OSC in $MDS_OSCS; do - OST=`osc_to_ost $STRIPE_OSC` - IDX=`do_facet $SINGLEMDS lctl get_param -n lov.*md*.target_obd | - awk -F: /$OST/'{ print $1 }' | head -n 1` - - [ -f $DIR/$tdir/$IDX ] && continue - echo "$SETSTRIPE -i $IDX -c 1 $DIR/$tdir/$IDX" - $SETSTRIPE -i $IDX -c 1 $DIR/$tdir/$IDX - RC=$? - [ $RC -ne 0 ] && error "setstripe should have succeeded" - done - rm -f $DIR/$tdir/* - echo $INACTIVE_OSC "is Activate." 
- do_facet $SINGLEMDS lctl --device %$INACTIVE_OSC activate - done + for OSC in $MDS_OSCS; do + echo $OSC "is active" + do_facet $SINGLEMDS lctl --device %$OSC activate + done + + for INACTIVE_OSC in $MDS_OSCS; do + local ost=$(osc_to_ost $INACTIVE_OSC) + local ostnum=$(do_facet $SINGLEMDS lctl get_param -n \ + lov.*md*.target_obd | + awk -F: /$ost/'{ print $1 }' | head -n 1) + + mkdir -p $DIR/$tdir + $SETSTRIPE -i $ostnum -c 1 $DIR/$tdir + createmany -o $DIR/$tdir/$tfile.$ostnum. 1000 + + echo "Deactivate: " $INACTIVE_OSC + do_facet $SINGLEMDS lctl --device %$INACTIVE_OSC deactivate + + local count=$(do_facet $SINGLEMDS "lctl get_param -n \ + osp.$ost*MDT0000.create_count") + local max_count=$(do_facet $SINGLEMDS "lctl get_param -n \ + osp.$ost*MDT0000.max_create_count") + $disable_precreate && + do_facet $SINGLEMDS "lctl set_param -n \ + osp.$ost*MDT0000.max_create_count=0" + + for idx in $(seq 0 $((OSTCOUNT - 1))); do + [ -f $DIR/$tdir/$idx ] && continue + echo "$SETSTRIPE -i $idx -c 1 $DIR/$tdir/$idx" + $SETSTRIPE -i $idx -c 1 $DIR/$tdir/$idx || + error "setstripe $idx should succeed" + rm -f $DIR/$tdir/$idx || error "rm $idx failed" + done + unlinkmany $DIR/$tdir/$tfile.$ostnum. 
1000 + rmdir $DIR/$tdir + + do_facet $SINGLEMDS "lctl set_param -n \ + osp.$ost*MDT0000.max_create_count=$max_count" + do_facet $SINGLEMDS "lctl set_param -n \ + osp.$ost*MDT0000.create_count=$count" + do_facet $SINGLEMDS lctl --device %$INACTIVE_OSC activate + echo $INACTIVE_OSC "is Activate" + + wait_osc_import_state mds ost$ostnum FULL + done } run_test 65k "validate manual striping works properly with deactivated OSCs" @@ -5544,6 +5714,12 @@ test_65l() { # bug 12836 } run_test 65l "lfs find on -1 stripe dir ========================" +test_65m() { + $RUNAS $SETSTRIPE -c 2 $MOUNT && error "setstripe should fail" + true +} +run_test 65m "normal user can't set filesystem default stripe" + # bug 2543 - update blocks count on client test_66() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return @@ -5570,10 +5746,6 @@ cleanup_68() { rm -f $LLOOP unset LLOOP fi - if [ ! -z "$LLITELOOPLOAD" ]; then - rmmod llite_lloop - unset LLITELOOPLOAD - fi rm -f $DIR/f68* } @@ -5585,74 +5757,6 @@ swap_used() { swapon -s | awk '($1 == "'$1'") { print $4 }' } -# test case for lloop driver, basic function -test_68a() { - [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - [ "$UID" != 0 ] && skip_env "must run as root" && return - llite_lloop_enabled || \ - { skip_env "llite_lloop module disabled" && return; } - - trap cleanup_68 EXIT - - if ! 
module_loaded llite_lloop; then - if load_module llite/llite_lloop; then - LLITELOOPLOAD=yes - else - skip_env "can't find module llite_lloop" - return - fi - fi - - LLOOP=$TMP/lloop.`date +%s`.`date +%N` - dd if=/dev/zero of=$DIR/f68a bs=4k count=1024 - $LCTL blockdev_attach $DIR/f68a $LLOOP || error "attach failed" - - directio rdwr $LLOOP 0 1024 4096 || error "direct write failed" - directio rdwr $LLOOP 0 1025 4096 && error "direct write should fail" - - cleanup_68 -} -run_test 68a "lloop driver - basic test ========================" - -# excercise swapping to lustre by adding a high priority swapfile entry -# and then consuming memory until it is used. -test_68b() { # was test_68 - [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - [ "$UID" != 0 ] && skip_env "must run as root" && return - lctl get_param -n devices | grep -q obdfilter && \ - skip "local OST" && return - - grep -q llite_lloop /proc/modules - [ $? -ne 0 ] && skip "can't find module llite_lloop" && return - - [ -z "`$LCTL list_nids | grep -v tcp`" ] && \ - skip "can't reliably test swap with TCP" && return - - MEMTOTAL=`meminfo MemTotal` - NR_BLOCKS=$((MEMTOTAL>>8)) - [[ $NR_BLOCKS -le 2048 ]] && NR_BLOCKS=2048 - - LLOOP=$TMP/lloop.`date +%s`.`date +%N` - dd if=/dev/zero of=$DIR/f68b bs=64k seek=$NR_BLOCKS count=1 - mkswap $DIR/f68b - - $LCTL blockdev_attach $DIR/f68b $LLOOP || error "attach failed" - - trap cleanup_68 EXIT - - swapon -p 32767 $LLOOP || error "swapon $LLOOP failed" - - echo "before: `swapon -s | grep $LLOOP`" - $MEMHOG $MEMTOTAL || error "error allocating $MEMTOTAL kB" - echo "after: `swapon -s | grep $LLOOP`" - SWAPUSED=`swap_used $LLOOP` - - cleanup_68 - - [ $SWAPUSED -eq 0 ] && echo "no swap used???" 
|| true -} -run_test 68b "support swapping to Lustre ========================" - # bug5265, obdfilter oa2dentry return -ENOENT # #define OBD_FAIL_SRV_ENOENT 0x217 test_69() { @@ -5829,8 +5933,8 @@ set_inode_slab_tunables() { test_76() { # Now for bug 20433, added originally in bug 1443 [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - local SLAB_SETTINGS=`get_inode_slab_tunables` - local CPUS=`getconf _NPROCESSORS_ONLN` + local SLAB_SETTINGS=$(get_inode_slab_tunables) + local CPUS=$(getconf _NPROCESSORS_ONLN 2>/dev/null) # we cannot set limit below 1 which means 1 inode in each # per-cpu cache is still allowed set_inode_slab_tunables "1 1 0" @@ -5847,7 +5951,7 @@ test_76() { # Now for bug 20433, added originally in bug 1443 AFTER_INODES=$(num_inodes) echo "after inodes: $AFTER_INODES" local wait=0 - while [[ $((AFTER_INODES-1*CPUS)) -gt $BEFORE_INODES ]]; do + while [[ $((AFTER_INODES-1*${CPUS:-1})) -gt $BEFORE_INODES ]]; do sleep 2 AFTER_INODES=$(num_inodes) wait=$((wait+2)) @@ -6033,6 +6137,11 @@ run_test 77j "client only supporting ADLER32" rm -f $F77_TMP unset F77_TMP +cleanup_test_78() { + trap 0 + rm -f $DIR/$tfile +} + test_78() { # bug 10901 [ $PARALLEL == "yes" ] && skip "skip parallel run" && return remote_ost || { skip_env "local OST" && return; } @@ -6062,6 +6171,8 @@ test_78() { # bug 10901 [[ $SMALLESTOST -lt 10240 ]] && skip "too small OSTSIZE, useless to run large O_DIRECT test" && return 0 + trap cleanup_test_78 EXIT + [[ $F78SIZE -gt $((SMALLESTOST * $OSTCOUNT / 1024 - 80)) ]] && F78SIZE=$((SMALLESTOST * $OSTCOUNT / 1024 - 80)) @@ -6074,7 +6185,7 @@ test_78() { # bug 10901 $DIRECTIO rdwr $DIR/$tfile 0 $FSIZE 1048576||error "rdwr failed" done - rm -f $DIR/$tfile + cleanup_test_78 } run_test 78 "handle large O_DIRECT writes correctly ============" @@ -6553,41 +6664,95 @@ test_101e() { } run_test 101e "check read-ahead for small read(1k) for small files(500k)" -cleanup_test101f() { - trap 0 - $LCTL set_param -n 
llite.*.max_read_ahead_whole_mb $MAX_WHOLE_MB - rm -rf $DIR/$tfile 2>/dev/null +test_101f() { + which iozone || { skip "no iozone installed" && return; } + + local old_debug=$($LCTL get_param debug) + old_debug=${old_debug#*=} + $LCTL set_param debug="reada mmap" + + # create a test file + iozone -i 0 -+n -r 1m -s 128m -w -f $DIR/$tfile > /dev/null 2>&1 + + echo Cancel LRU locks on lustre client to flush the client cache + cancel_lru_locks osc + + echo Reset readahead stats + $LCTL set_param -n llite.*.read_ahead_stats 0 + + echo mmap read the file with small block size + iozone -i 1 -u 1 -l 1 -+n -r 32k -s 128m -B -f $DIR/$tfile \ + > /dev/null 2>&1 + + echo checking missing pages + $LCTL get_param llite.*.read_ahead_stats + local miss=$($LCTL get_param -n llite.*.read_ahead_stats | + get_named_value 'misses' | cut -d" " -f1 | calc_total) + + $LCTL set_param debug="$old_debug" + [ $miss -lt 3 ] || error "misses too much pages ('$miss')!" + rm -f $DIR/$tfile } +run_test 101f "check mmap read performance" -test_101f() { - [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - local file=$DIR/$tfile - local nreads=1000 +test_101g() { + local rpcs + local osts=$(get_facets OST) + local list=$(comma_list $(osts_nodes)) + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" - MAX_WHOLE_MB=$($LCTL get_param -n llite.*.max_read_ahead_whole_mb) - $LCTL set_param -n llite.*.max_read_ahead_whole_mb 2 - dd if=/dev/zero of=${file} bs=2097152 count=1 2>/dev/null - trap cleanup_test101f EXIT + save_lustre_params $osts "obdfilter.*.brw_size" > $p - echo Cancel LRU locks on lustre client to flush the client cache - cancel_lru_locks osc + $LFS setstripe -c 1 $DIR/$tfile + + if [ $(lustre_version_code ost1) -ge $(version_code 2.8.52) ]; then + set_osd_param $list '' brw_size 16M + + echo "remount client to enable large RPC size" + remount_client $MOUNT || error "remount_client failed" + + for mp in $($LCTL get_param -n osc.*.max_pages_per_rpc); do + [ "$mp" -eq 4096 ] || + error 
"max_pages_per_rpc not correctly set" + done + + $LCTL set_param -n osc.*.rpc_stats=0 + + # 10*16 MiB should be enough for the test + dd if=/dev/zero of=$DIR/$tfile bs=16M count=10 + cancel_lru_locks osc + dd of=/dev/null if=$DIR/$tfile bs=16M count=10 + + # calculate 16 MiB RPCs + rpcs=$($LCTL get_param 'osc.*.rpc_stats' | + sed -n '/pages per rpc/,/^$/p' | + awk 'BEGIN { sum = 0 }; /4096:/ { sum += $2 }; + END { print sum }') + echo $rpcs RPCs + [ "$rpcs" -eq 10 ] || error "not all RPCs are 16 MiB BRW rpcs" + fi + + echo "set RPC size to 4MB" + + $LCTL set_param -n osc.*.max_pages_per_rpc=4M osc.*.rpc_stats=0 + dd if=/dev/zero of=$DIR/$tfile bs=4M count=25 + cancel_lru_locks osc + dd of=/dev/null if=$DIR/$tfile bs=4M count=25 - echo Reset readahead stats - $LCTL set_param -n llite.*.read_ahead_stats 0 - # Random read in a 2M file, because max_read_ahead_whole_mb = 2M, - # readahead should read in 2M file on second read, so only miss - # 2 pages. - echo Random 4K reads on 2M file for 1000 times - $READS -f $file -s 2097152 -b 4096 -n $nreads + # calculate 4 MiB RPCs + rpcs=$($LCTL get_param 'osc.*.rpc_stats' | + sed -n '/pages per rpc/,/^$/p' | + awk 'BEGIN { sum = 0 }; /1024:/ { sum += $2 }; + END { print sum }') + echo $rpcs RPCs + [ "$rpcs" -eq 25 ] || error "not all RPCs are 4 MiB BRW rpcs" - echo checking missing pages - local miss=$($LCTL get_param -n llite.*.read_ahead_stats | - get_named_value 'misses' | cut -d" " -f1 | calc_total) + restore_lustre_params < $p + remount_client $MOUNT || error "remount_client failed" - [ $miss -lt 3 ] || error "misses too much pages!" 
- cleanup_test101f + rm -f $p $DIR/$tfile } -run_test 101f "check read-ahead for max_read_ahead_whole_mb" +run_test 101g "Big bulk(4/16 MiB) readahead" setup_test102() { test_mkdir -p $DIR/$tdir @@ -6958,29 +7123,31 @@ getxattr() { # getxattr path name } test_102n() { # LU-4101 mdt: protect internal xattrs - local file0=$DIR/$tfile.0 - local file1=$DIR/$tfile.1 - local xattr0=$TMP/$tfile.0 - local xattr1=$TMP/$tfile.1 - local name - local value - [ -z "$(which setfattr 2>/dev/null)" ] && skip "could not find setfattr" && return - if [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.5.50) ] then skip "MDT < 2.5.50 allows setxattr on internal trusted xattrs" return fi + local file0=$DIR/$tfile.0 + local file1=$DIR/$tfile.1 + local xattr0=$TMP/$tfile.0 + local xattr1=$TMP/$tfile.1 + local namelist="lov lma lmv link fid version som hsm" + local name + local value + rm -rf $file0 $file1 $xattr0 $xattr1 touch $file0 $file1 # Get 'before' xattrs of $file1. getfattr --absolute-names --dump --match=- $file1 > $xattr0 - for name in lov lma lmv link fid version som hsm lfsck_namespace; do + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.8.53) ] && + namelist+=" lfsck_namespace" + for name in $namelist; do # Try to copy xattr from $file0 to $file1. value=$(getxattr $file0 trusted.$name 2> /dev/null) @@ -7104,6 +7271,7 @@ test_103a() { [ -z "$(which setfacl 2>/dev/null)" ] && skip_env "could not find setfacl" && return $GSS && skip "could not run under gss" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return gpasswd -a daemon bin # LU-5641 do_facet $SINGLEMDS gpasswd -a daemon bin # LU-5641 @@ -7116,7 +7284,8 @@ test_103a() { SAVE_UMASK=$(umask) umask 0022 - cd $DIR + mkdir -p $DIR/$tdir + cd $DIR/$tdir echo "performing cp ..." run_acl_subtest cp || error "run_acl_subtest cp failed" @@ -7126,6 +7295,15 @@ test_103a() { run_acl_subtest misc || error "misc test failed" echo "performing permissions..." 
run_acl_subtest permissions || error "permissions failed" + # LU-1482 mdd: Setting xattr are properly checked with and without ACLs + if [ $(lustre_version_code $SINGLEMDS) -gt $(version_code 2.8.55) -o \ + \( $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.6) -a \ + $(lustre_version_code $SINGLEMDS) -ge $(version_code 2.5.29) \) ] + then + echo "performing permissions xattr..." + run_acl_subtest permissions_xattr || + error "permissions_xattr failed" + fi echo "performing setfacl..." run_acl_subtest setfacl || error "setfacl test failed" @@ -7164,6 +7342,7 @@ test_103a() { run_test 103a "acl test =========================================" test_103b() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return local noacl=false local MDT_DEV=$(mdsdevname ${SINGLEMDS//mds/}) local mountopts=$MDS_MOUNT_OPTS @@ -7498,9 +7677,10 @@ test_116a() { # was previously test_116() echo "Wrote ${DIFF}KB to smaller OST $MINI1" DIFF2=$(($MAXV1 - ${AVAIL[$MAXI1]})) echo "Wrote ${DIFF2}KB to larger OST $MAXI1" - FILL=$(($DIFF2 * 100 / $DIFF - 100)) - [ $DIFF -gt 0 ] && + if [[ $DIFF -gt 0 ]]; then + FILL=$(($DIFF2 * 100 / $DIFF - 100)) echo "Wrote ${FILL}% more data to larger OST $MAXI1" + fi # Figure out which files were written where UUID=$(lctl get_param -n lov.${FSNAME}-clilov-*.target_obd | @@ -7513,9 +7693,10 @@ test_116a() { # was previously test_116() echo $UUID MAXC=$($GETSTRIPE --ost $UUID $DIR/$tdir | grep $DIR | wc -l) echo "$MAXC files created on larger OST $MAXI1" - FILL=$(($MAXC * 100 / $MINC - 100)) - [[ $MINC -gt 0 ]] && + if [[ $MINC -gt 0 ]]; then + FILL=$(($MAXC * 100 / $MINC - 100)) echo "Wrote ${FILL}% more files to larger OST $MAXI1" + fi [[ $MAXC -gt $MINC ]] || error_ignore LU-9 "stripe QOS didn't balance free space" simple_cleanup_common @@ -8021,6 +8202,7 @@ run_test 119d "The DIO path should try to send a new rpc once one is completed" test_120a() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote 
MDS with nodsh" && return test_mkdir -p $DIR/$tdir [ -z "`lctl get_param -n mdc.*.connect_flags | grep early_lock_cancel`" ] && \ skip "no early lock cancel on server" && return 0 @@ -8052,6 +8234,7 @@ run_test 120a "Early Lock Cancel: mkdir test" test_120b() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return test_mkdir $DIR/$tdir [ -z "$(lctl get_param -n mdc.*.connect_flags | grep early_lock_cancel)" ] && \ skip "no early lock cancel on server" && return 0 @@ -8079,6 +8262,7 @@ run_test 120b "Early Lock Cancel: create test" test_120c() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return test_mkdir -c1 $DIR/$tdir [ -z "$(lctl get_param -n mdc.*.connect_flags | grep early_lock_cancel)" ] && \ skip "no early lock cancel on server" && return 0 @@ -8109,6 +8293,7 @@ run_test 120c "Early Lock Cancel: link test" test_120d() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return test_mkdir -p -c1 $DIR/$tdir [ -z "$(lctl get_param -n mdc.*.connect_flags | grep early_lock_cancel)" ] && \ skip "no early lock cancel on server" && return 0 @@ -8137,18 +8322,24 @@ run_test 120d "Early Lock Cancel: setattr test" test_120e() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - test_mkdir -p -c1 $DIR/$tdir - [ -z "`lctl get_param -n mdc.*.connect_flags | grep early_lock_cancel`" ] && \ - skip "no early lock cancel on server" && return 0 - lru_resize_disable mdc - lru_resize_disable osc - dd if=/dev/zero of=$DIR/$tdir/f1 count=1 - cancel_lru_locks mdc - cancel_lru_locks osc - dd if=$DIR/$tdir/f1 of=/dev/null - stat $DIR/$tdir $DIR/$tdir/f1 > /dev/null + ! 
$($LCTL get_param -n mdc.*.connect_flags | grep -q early_lock_can) && + skip "no early lock cancel on server" && return 0 + remote_mds_nodsh && skip "remote MDS with nodsh" && return + local dlmtrace_set=false + + test_mkdir -p -c1 $DIR/$tdir + lru_resize_disable mdc + lru_resize_disable osc + ! $LCTL get_param debug | grep -q dlmtrace && + $LCTL set_param debug=+dlmtrace && dlmtrace_set=true + dd if=/dev/zero of=$DIR/$tdir/f1 count=1 + cancel_lru_locks mdc + cancel_lru_locks osc + dd if=$DIR/$tdir/f1 of=/dev/null + stat $DIR/$tdir $DIR/$tdir/f1 > /dev/null # XXX client can not do early lock cancel of OST lock # during unlink (LU-4206), so cancel osc lock now. + sleep 2 cancel_lru_locks osc can1=$(do_facet $SINGLEMDS \ "$LCTL get_param -n ldlm.services.ldlm_canceld.stats" | @@ -8162,8 +8353,11 @@ test_120e() { awk '/ldlm_cancel/ {print $2}') blk2=$($LCTL get_param -n ldlm.services.ldlm_cbd.stats | awk '/ldlm_bl_callback/ {print $2}') - [ $can1 -eq $can2 ] || error $((can2-can1)) "cancel RPC occured." - [ $blk1 -eq $blk2 ] || error $((blk2-blk1)) "blocking RPC occured." + [ $can1 -ne $can2 ] && error "$((can2 - can1)) cancel RPC occured" && + $LCTL dk $TMP/cancel.debug.txt + [ $blk1 -ne $blk2 ] && error "$((blk2 - blk1)) blocking RPC occured" && + $LCTL dk $TMP/blocking.debug.txt + $dlmtrace_set && $LCTL set_param debug=-dlmtrace lru_resize_enable mdc lru_resize_enable osc } @@ -8173,6 +8367,7 @@ test_120f() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [ -z "`lctl get_param -n mdc.*.connect_flags | grep early_lock_cancel`" ] && \ skip "no early lock cancel on server" && return 0 + remote_mds_nodsh && skip "remote MDS with nodsh" && return test_mkdir -p -c1 $DIR/$tdir lru_resize_disable mdc lru_resize_disable osc @@ -8187,6 +8382,7 @@ test_120f() { stat $DIR/$tdir/d1 $DIR/$tdir/d2 $DIR/$tdir/d1/f1 $DIR/$tdir/d2/f2 > /dev/null # XXX client can not do early lock cancel of OST lock # during rename (LU-4206), so cancel osc lock now. 
+ sleep 2 cancel_lru_locks osc can1=$(do_facet $SINGLEMDS \ "$LCTL get_param -n ldlm.services.ldlm_canceld.stats" | @@ -8211,6 +8407,7 @@ test_120g() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [ -z "`lctl get_param -n mdc.*.connect_flags | grep early_lock_cancel`" ] && \ skip "no early lock cancel on server" && return 0 + remote_mds_nodsh && skip "remote MDS with nodsh" && return lru_resize_disable mdc lru_resize_disable osc count=10000 @@ -8480,11 +8677,18 @@ test_124b() { NR=$(($(default_lru_size)*20)) if [[ $NR -gt $LIMIT ]]; then - log "Limit lock number by $LIMIT locks" - NR=$LIMIT - fi - lru_resize_disable mdc - test_mkdir -p $DIR/$tdir/disable_lru_resize || + log "Limit lock number by $LIMIT locks" + NR=$LIMIT + fi + + IFree=$(mdsrate_inodes_available) + if [ $IFree -lt $NR ]; then + log "Limit lock number by $IFree inodes" + NR=$IFree + fi + + lru_resize_disable mdc + test_mkdir -p $DIR/$tdir/disable_lru_resize || error "failed to create $DIR/$tdir/disable_lru_resize" createmany -o $DIR/$tdir/disable_lru_resize/f $NR @@ -8668,11 +8872,13 @@ test_127b() { # bug LU-333 esac done < $TMP/${tfile}.tmp - #check that we actually got some stats - [ "$read_bytes" ] || error "Missing read_bytes stats" - [ "$write_bytes" ] || error "Missing write_bytes stats" - [ "$read_bytes" != 0 ] || error "no read done" - [ "$write_bytes" != 0 ] || error "no write done" + #check that we actually got some stats + [ "$read_bytes" ] || error "Missing read_bytes stats" + [ "$write_bytes" ] || error "Missing write_bytes stats" + [ "$read_bytes" != 0 ] || error "no read done" + [ "$write_bytes" != 0 ] || error "no write done" + + rm -f $TMP/${tfile}.tmp } run_test 127b "verify the llite client stats are sane" @@ -8684,8 +8890,9 @@ test_128() { # bug 15212 EOF result=$(grep error $TMP/$tfile.log) - rm -f $DIR/$tfile - [ -z "$result" ] || error "consecutive find's under interactive lfs failed" + rm -f $DIR/$tfile $TMP/$tfile.log + [ -z "$result" ] || + error 
"consecutive find's under interactive lfs failed" } run_test 128 "interactive lfs for 2 consecutive find's" @@ -8724,12 +8931,12 @@ test_129() { return fi remote_mds_nodsh && skip "remote MDS with nodsh" && return - ENOSPC=28 - EFBIG=27 - has_warning=0 + local ENOSPC=28 + local EFBIG=27 + local has_warning=0 rm -rf $DIR/$tdir - test_mkdir -p $DIR/$tdir + mkdir -p $DIR/$tdir # block size of mds1 local MDT_DEV=$(mdsdevname ${SINGLEMDS//mds/}) @@ -8738,9 +8945,6 @@ test_129() { set_dir_limits $MAX $MAX local I=$(stat -c%s "$DIR/$tdir") local J=0 - local STRIPE_COUNT=1 - [[ $MDSCOUNT -ge 2 ]] && STRIPE_COUNT=$($LFS getdirstripe -c $DIR/$tdir) - MAX=$((MAX*STRIPE_COUNT)) while [[ $I -le $MAX ]]; do $MULTIOP $DIR/$tdir/$J Oc rc=$? @@ -8754,13 +8958,14 @@ test_129() { if [ $rc -eq $EFBIG -o $rc -eq $ENOSPC ]; then set_dir_limits 0 0 echo "return code $rc received as expected" - multiop $DIR/$tdir/$J Oc || - error_exit "multiop failed w/o dir size limit" + + createmany -o $DIR/$tdir/$J_file_ 1000 || + error_exit "create failed w/o dir size limit" check_mds_dmesg '"has reached"' || error_exit "has reached message should be output" - [ $has_warning ] || + [ $has_warning -eq 0 ] && error_exit "warning message should be output" I=$(stat -c%s "$DIR/$tdir") @@ -8812,8 +9017,8 @@ test_130a() { skip "ORI-366/LU-1941: FIEMAP unimplemented on ZFS" && return [ $RC != 0 ] && error "filefrag $fm_file failed" - filefrag_op=$(filefrag -ve $fm_file | grep -A 100 "ext:" | - grep -v "ext:" | grep -v "found") + filefrag_op=$(filefrag -ve $fm_file | + sed -n '/ext:/,/found/{/ext:/d; /found/d; p}') lun=$($GETSTRIPE -i $fm_file) start_blk=`echo $filefrag_op | cut -d: -f2 | cut -d. 
-f1` @@ -8845,10 +9050,7 @@ run_test 130a "FIEMAP (1-stripe file)" test_130b() { [ "$OSTCOUNT" -lt "2" ] && - skip_env "skipping FIEMAP on 2-stripe file test" && return - - [ "$OSTCOUNT" -ge "10" ] && - skip_env "skipping FIEMAP with >= 10 OSTs" && return + skip_env "skipping FIEMAP on $OSTCOUNT-stripe file" && return local filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") [ -n "$filefrag_op" ] && skip_env "filefrag does not support FIEMAP" && @@ -8857,30 +9059,34 @@ test_130b() { trap cleanup_130 EXIT RETURN local fm_file=$DIR/$tfile - $SETSTRIPE -S 65536 -c 2 $fm_file || error "setstripe on $fm_file" + $SETSTRIPE -S 65536 -c $OSTCOUNT $fm_file || + error "setstripe on $fm_file" [ "$(facet_fstype ost$(($($GETSTRIPE -i $fm_file) + 1)))" = "zfs" ] && skip "ORI-366/LU-1941: FIEMAP unimplemented on ZFS" && return - dd if=/dev/zero of=$fm_file bs=1M count=2 || + dd if=/dev/zero of=$fm_file bs=1M count=$OSTCOUNT || error "dd failed on $fm_file" filefrag -ves $fm_file || error "filefrag $fm_file failed" - filefrag_op=$(filefrag -ve $fm_file | grep -A 100 "ext:" | - grep -v "ext:" | grep -v "found") + filefrag_op=$(filefrag -ve $fm_file | + sed -n '/ext:/,/found/{/ext:/d; /found/d; p}') - last_lun=$(echo $filefrag_op | cut -d: -f5) + last_lun=$(echo $filefrag_op | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') IFS=$'\n' tot_len=0 num_luns=1 for line in $filefrag_op do - frag_lun=`echo $line | cut -d: -f5` - ext_len=`echo $line | cut -d: -f4` + frag_lun=$(echo $line | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') + ext_len=$(echo $line | cut -d: -f4) if (( $frag_lun != $last_lun )); then if (( tot_len != 1024 )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned len $tot_len for OST $last_lun instead of 256" + error "FIEMAP on $fm_file failed; returned " \ + "len $tot_len for OST $last_lun instead of 1024" return else (( num_luns += 1 )) @@ -8890,25 +9096,23 @@ test_130b() { (( tot_len += ext_len )) last_lun=$frag_lun done - 
if (( num_luns != 2 || tot_len != 1024 )); then + if (( num_luns != $OSTCOUNT || tot_len != 1024 )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned wrong number of luns or wrong len for OST $last_lun" + error "FIEMAP on $fm_file failed; returned wrong number of " \ + "luns or wrong len for OST $last_lun" return fi cleanup_130 - echo "FIEMAP on 2-stripe file succeeded" + echo "FIEMAP on $OSTCOUNT-stripe file succeeded" } -run_test 130b "FIEMAP (2-stripe file)" +run_test 130b "FIEMAP ($OSTCOUNT-stripe file)" test_130c() { [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping FIEMAP on 2-stripe file" && return - [ "$OSTCOUNT" -ge "10" ] && - skip_env "skipping FIEMAP with >= 10 OSTs" && return - filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && return @@ -8920,30 +9124,36 @@ test_130c() { [ "$(facet_fstype ost$(($($GETSTRIPE -i $fm_file) + 1)))" = "zfs" ] && skip "ORI-366/LU-1941: FIEMAP unimplemented on ZFS" && return - dd if=/dev/zero of=$fm_file seek=1 bs=1M count=1 || error "dd failed on $fm_file" + dd if=/dev/zero of=$fm_file seek=1 bs=1M count=1 || + error "dd failed on $fm_file" filefrag -ves $fm_file || error "filefrag $fm_file failed" - filefrag_op=`filefrag -ve $fm_file | grep -A 100 "ext:" | grep -v "ext:" | grep -v "found"` + filefrag_op=$(filefrag -ve $fm_file | + sed -n '/ext:/,/found/{/ext:/d; /found/d; p}') - last_lun=`echo $filefrag_op | cut -d: -f5` + last_lun=$(echo $filefrag_op | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') IFS=$'\n' tot_len=0 num_luns=1 for line in $filefrag_op do - frag_lun=`echo $line | cut -d: -f5` - ext_len=`echo $line | cut -d: -f4` + frag_lun=$(echo $line | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') + ext_len=$(echo $line | cut -d: -f4) if (( $frag_lun != $last_lun )); then logical=`echo $line | cut -d: -f2 | cut -d. 
-f1` if (( logical != 512 )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned logical start for lun $logical instead of 512" + error "FIEMAP on $fm_file failed; returned " \ + "logical start for lun $logical instead of 512" return fi if (( tot_len != 512 )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned len $tot_len for OST $last_lun instead of 1024" + error "FIEMAP on $fm_file failed; returned " \ + "len $tot_len for OST $last_lun instead of 1024" return else (( num_luns += 1 )) @@ -8955,7 +9165,8 @@ test_130c() { done if (( num_luns != 2 || tot_len != 512 )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned wrong number of luns or wrong len for OST $last_lun" + error "FIEMAP on $fm_file failed; returned wrong number of " \ + "luns or wrong len for OST $last_lun" return fi @@ -8966,18 +9177,18 @@ test_130c() { run_test 130c "FIEMAP (2-stripe file with hole)" test_130d() { - [ "$OSTCOUNT" -lt "3" ] && skip_env "skipping FIEMAP on N-stripe file test" && return - - [ "$OSTCOUNT" -ge "10" ] && - skip_env "skipping FIEMAP with >= 10 OSTs" && return + [ "$OSTCOUNT" -lt "3" ] && + skip_env "skipping FIEMAP on N-stripe file test" && return filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") - [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && return + [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && + return trap cleanup_130 EXIT RETURN local fm_file=$DIR/$tfile - $SETSTRIPE -S 65536 -c $OSTCOUNT $fm_file||error "setstripe on $fm_file" + $SETSTRIPE -S 65536 -c $OSTCOUNT $fm_file || + error "setstripe on $fm_file" [ "$(facet_fstype ost$(($($GETSTRIPE -i $fm_file) + 1)))" = "zfs" ] && skip "ORI-366/LU-1941: FIEMAP unimplemented on ZFS" && return @@ -8986,22 +9197,25 @@ test_130d() { error "dd failed on $fm_file" filefrag -ves $fm_file || error "filefrag $fm_file failed" - filefrag_op=`filefrag -ve $fm_file | grep -A 100 "ext:" | - grep -v "ext:" | grep -v "found"` + filefrag_op=$(filefrag -ve 
$fm_file | + sed -n '/ext:/,/found/{/ext:/d; /found/d; p}') - last_lun=`echo $filefrag_op | cut -d: -f5` + last_lun=$(echo $filefrag_op | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') IFS=$'\n' tot_len=0 num_luns=1 for line in $filefrag_op do - frag_lun=`echo $line | cut -d: -f5` - ext_len=`echo $line | cut -d: -f4` + frag_lun=$(echo $line | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') + ext_len=$(echo $line | cut -d: -f4) if (( $frag_lun != $last_lun )); then if (( tot_len != 1024 )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned len $tot_len for OST $last_lun instead of 1024" + error "FIEMAP on $fm_file failed; returned " \ + "len $tot_len for OST $last_lun instead of 1024" return else (( num_luns += 1 )) @@ -9013,7 +9227,8 @@ test_130d() { done if (( num_luns != actual_stripecnt || tot_len != 1024 )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned wrong number of luns or wrong len for OST $last_lun" + error "FIEMAP on $fm_file failed; returned wrong number of " \ + "luns or wrong len for OST $last_lun" return fi @@ -9024,10 +9239,8 @@ test_130d() { run_test 130d "FIEMAP (N-stripe file)" test_130e() { - [ "$OSTCOUNT" -lt "2" ] && skip_env "skipping continuation FIEMAP test" && return - - [ "$OSTCOUNT" -ge "10" ] && - skip_env "skipping FIEMAP with >= 10 OSTs" && return + [ "$OSTCOUNT" -lt "2" ] && + skip_env "skipping continuation FIEMAP test" && return filefrag_op=$(filefrag -e 2>&1 | grep "invalid option") [ -n "$filefrag_op" ] && skip "filefrag does not support FIEMAP" && return @@ -9047,21 +9260,26 @@ test_130e() { done filefrag -ves $fm_file || error "filefrag $fm_file failed" - filefrag_op=`filefrag -ve $fm_file | grep -A 12000 "ext:" | grep -v "ext:" | grep -v "found"` + filefrag_op=$(filefrag -ve $fm_file | + sed -n '/ext:/,/found/{/ext:/d; /found/d; p}') - last_lun=`echo $filefrag_op | cut -d: -f5` + last_lun=$(echo $filefrag_op | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') 
IFS=$'\n' tot_len=0 num_luns=1 for line in $filefrag_op do - frag_lun=`echo $line | cut -d: -f5` - ext_len=`echo $line | cut -d: -f4` + frag_lun=$(echo $line | cut -d: -f5 | + sed -e 's/^[ \t]*/0x/' | sed -e 's/0x0x/0x/') + ext_len=$(echo $line | cut -d: -f4) if (( $frag_lun != $last_lun )); then if (( tot_len != $EXPECTED_LEN )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned len $tot_len for OST $last_lun instead of $EXPECTED_LEN" + error "FIEMAP on $fm_file failed; returned " \ + "len $tot_len for OST $last_lun instead " \ + "of $EXPECTED_LEN" return else (( num_luns += 1 )) @@ -9073,7 +9291,8 @@ test_130e() { done if (( num_luns != 2 || tot_len != $EXPECTED_LEN )); then cleanup_130 - error "FIEMAP on $fm_file failed; returned wrong number of luns or wrong len for OST $last_lun" + error "FIEMAP on $fm_file failed; returned wrong number " \ + "of luns or wrong len for OST $last_lun" return fi @@ -9163,12 +9382,14 @@ test_133a() { # verify mdt stats first. mkdir ${testdir} || error "mkdir failed" check_stats $SINGLEMDS "mkdir" 1 - touch ${testdir}/${tfile} || "touch failed" + touch ${testdir}/${tfile} || error "touch failed" check_stats $SINGLEMDS "open" 1 check_stats $SINGLEMDS "close" 1 - mknod ${testdir}/${tfile}-pipe p || "mknod failed" - check_stats $SINGLEMDS "mknod" 1 - rm -f ${testdir}/${tfile}-pipe || "pipe remove failed" + [ $(lustre_version_code $SINGLEMDS) -ge $(version_code 2.8.54) ] && { + mknod ${testdir}/${tfile}-pipe p || error "mknod failed" + check_stats $SINGLEMDS "mknod" 2 + } + rm -f ${testdir}/${tfile}-pipe || error "pipe remove failed" check_stats $SINGLEMDS "unlink" 1 rm -f ${testdir}/${tfile} || error "file remove failed" check_stats $SINGLEMDS "unlink" 2 @@ -9197,7 +9418,7 @@ test_133b() { remote_mds_nodsh && skip "remote MDS with nodsh" && return local testdir=$DIR/${tdir}/stats_testdir mkdir -p ${testdir} || error "mkdir failed" - touch ${testdir}/${tfile} || "touch failed" + touch ${testdir}/${tfile} || error "touch 
failed" cancel_lru_locks mdc # clear stats. @@ -9429,7 +9650,8 @@ run_test 133e "Verifying OST {read,write}_bytes nid stats =================" proc_dirs="" for dir in /proc/fs/lustre/ /proc/sys/lnet/ /proc/sys/lustre/ \ - /sys/fs/lustre/ /sys/fs/lnet/ /sys/kernel/debug/lustre/; do + /sys/fs/lustre/ /sys/fs/lnet/ /sys/kernel/debug/lnet/ \ + /sys/kernel/debug/lustre/; do [[ -d $dir ]] && proc_dirs+=" $dir" done @@ -9440,7 +9662,7 @@ test_133f() { find $proc_dirs -exec cat '{}' \; &> /dev/null # Second verifying readability. - $LCTL get_param -R &> /dev/null || error "proc file read failed" + $LCTL get_param -R '*' &> /dev/null || error "proc file read failed" # eventually, this can also be replaced with "lctl get_param -R", # but not until that option is always available on the server @@ -9460,6 +9682,8 @@ test_133f() { run_test 133f "Check for LBUGs/Oopses/unreadable files in /proc" test_133g() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return + remote_ost_nodsh && skip "remote OST with nodsh" && return # Second verifying writability. 
find $proc_dirs \ -type f \ @@ -9493,6 +9717,7 @@ test_133g() { run_test 133g "Check for Oopses on bad io area writes/reads in /proc" test_134a() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return [[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.7.54) ]] && skip "Need MDS version at least 2.7.54" && return @@ -9501,7 +9726,7 @@ test_134a() { local nsdir="ldlm.namespaces.*-MDT0000-mdc-*" local unused=$($LCTL get_param -n $nsdir.lock_unused_count) - [ $unused -eq 0 ] || "$unused locks are not cleared" + [ $unused -eq 0 ] || error "$unused locks are not cleared" local nr=1000 createmany -o $DIR/$tdir/f $nr || @@ -9528,6 +9753,7 @@ test_134a() { run_test 134a "Server reclaims locks when reaching lock_reclaim_threshold" test_134b() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return [[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.7.54) ]] && skip "Need MDS version at least 2.7.54" && return @@ -9569,9 +9795,9 @@ run_test 134b "Server rejects lock request when reaching lock_limit_mb" test_140() { #bug-17379 [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - test_mkdir -p $DIR/$tdir || error "Creating dir $DIR/$tdir" - cd $DIR/$tdir || error "Changing to $DIR/$tdir" - cp /usr/bin/stat . || error "Copying stat to $DIR/$tdir" + test_mkdir -p $DIR/$tdir || error "Creating dir $DIR/$tdir" + cd $DIR/$tdir || error "Changing to $DIR/$tdir" + cp $(which stat) . 
|| error "Copying stat to $DIR/$tdir" # VFS limits max symlink depth to 5(4KSTACK) or 7(8KSTACK) or 8 # For kernel > 3.5, bellow only tests consecutive symlink (MAX 40) @@ -9919,25 +10145,49 @@ test_154A() { [[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.4.1) ]] && skip "Need MDS version at least 2.4.1" && return - touch $DIR/$tfile - local FID=$($LFS path2fid $DIR/$tfile) - [ -z "$FID" ] && error "path2fid unable to get $DIR/$tfile FID" + local tf=$DIR/$tfile + touch $tf - # check that we get the same pathname back - local FOUND=$($LFS fid2path $MOUNT "$FID") - [ -z "$FOUND" ] && error "fid2path unable to get $FID path" - [ "$FOUND" != "$DIR/$tfile" ] && - error "fid2path(path2fid($DIR/$tfile)) = $FOUND != $DIR/$tfile" + local fid=$($LFS path2fid $tf) + [ -z "$fid" ] && error "path2fid unable to get $tf FID" - rm -rf $DIR/$tfile + # check that we get the same pathname back + local found=$($LFS fid2path $MOUNT "$fid") + [ -z "$found" ] && error "fid2path unable to get '$fid' path" + [ "$found" == "$tf" ] || + error "fid2path($fid=path2fid($tf)) = $found != $tf" } run_test 154A "lfs path2fid and fid2path basic checks" +test_154B() { + [[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.4.1) ]] && + skip "Need MDS version at least 2.4.1" && return + + mkdir -p $DIR/$tdir || error "mkdir $tdir failed" + touch $DIR/$tdir/$tfile || error "touch $DIR/$tdir/$tfile failed" + local linkea=$($LL_DECODE_LINKEA $DIR/$tdir/$tfile | grep 'pfid') + [ -z "$linkea" ] && error "decode linkea $DIR/$tdir/$tfile failed" + + local name=$(echo $linkea | awk '/pfid/ {print $5}' | sed -e "s/'//g") + local PFID=$(echo $linkea | awk '/pfid/ {print $3}' | sed -e "s/,//g") + + # check that we get the same pathname + echo "PFID: $PFID, name: $name" + local FOUND=$($LFS fid2path $MOUNT "$PFID") + [ -z "$FOUND" ] && error "fid2path unable to get $PFID path" + [ "$FOUND/$name" != "$DIR/$tdir/$tfile" ] && + error "ll_decode_linkea has $FOUND/$name != $DIR/$tdir/$tfile" + + rm -rf 
$DIR/$tdir || error "Can not delete directory $DIR/$tdir" +} +run_test 154B "verify the ll_decode_linkea tool" + test_154a() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [[ $(lustre_version_code $SINGLEMDS) -ge $(version_code 2.2.51) ]] || { skip "Need MDS version at least 2.2.51"; return 0; } [ -z "$(which setfacl)" ] && skip "must have setfacl tool" && return + [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return cp /etc/hosts $DIR/$tfile @@ -9964,6 +10214,7 @@ test_154b() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [[ $(lustre_version_code $SINGLEMDS) -ge $(version_code 2.2.51) ]] || { skip "Need MDS version at least 2.2.51"; return 0; } + [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return @@ -10016,6 +10267,7 @@ test_154c() { run_test 154c "lfs path2fid and fid2path multiple arguments" test_154d() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return [[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.5.53) ]] && skip "Need MDS version at least 2.5.53" && return @@ -10060,6 +10312,7 @@ test_154e() run_test 154e ".lustre is not returned by readdir" test_154f() { + [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return # create parent directory on a single MDT to avoid cross-MDT hardlinks test_mkdir -p -c1 $DIR/$tdir/d # test dirs inherit from its stripe @@ -10132,6 +10385,7 @@ test_154f() { rm -f $DIR/f restore_lustre_params < $save + rm -f $save } run_test 154f "get parent fids by reading link ea" @@ -10139,6 +10393,7 @@ test_154g() { [[ $(lustre_version_code $SINGLEMDS) -ge $(version_code 2.6.92) ]] || { skip "Need MDS version at least 2.6.92"; return 0; } + [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return mkdir -p $DIR/$tdir llapi_fid_test -d $DIR/$tdir @@ -10201,67 +10456,114 @@ test_155_big_load() { true } +save_writethrough() { + local facets=$(get_facets OST) + + save_lustre_params $facets 
"obdfilter.*.writethrough_cache_enable" > $1 + save_lustre_params $facets "osd-*.*.writethrough_cache_enable" >> $1 +} + test_155a() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read on set_cache writethrough on test_155_small_load + restore_lustre_params < $p + rm -f $p } run_test 155a "Verify small file correctness: read cache:on write_cache:on" test_155b() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read on set_cache writethrough off test_155_small_load + restore_lustre_params < $p + rm -f $p } run_test 155b "Verify small file correctness: read cache:on write_cache:off" test_155c() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read off set_cache writethrough on test_155_small_load + restore_lustre_params < $p + rm -f $p } run_test 155c "Verify small file correctness: read cache:off write_cache:on" test_155d() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read off set_cache writethrough off test_155_small_load + restore_lustre_params < $p + rm -f $p } run_test 155d "Verify small file correctness: read cache:off write_cache:off" test_155e() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read on set_cache writethrough on test_155_big_load + restore_lustre_params < $p + rm -f $p } run_test 155e "Verify big file correctness: read cache:on write_cache:on" test_155f() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read on set_cache writethrough off test_155_big_load + 
restore_lustre_params < $p + rm -f $p } run_test 155f "Verify big file correctness: read cache:on write_cache:off" test_155g() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read off set_cache writethrough on test_155_big_load + restore_lustre_params < $p + rm -f $p } run_test 155g "Verify big file correctness: read cache:off write_cache:on" test_155h() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache read off set_cache writethrough off test_155_big_load + restore_lustre_params < $p + rm -f $p } run_test 155h "Verify big file correctness: read cache:off write_cache:off" @@ -10272,12 +10574,14 @@ test_156() { local BEFORE local AFTER local file="$DIR/$tfile" + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" [ "$(facet_fstype ost1)" = "zfs" -a \ $(lustre_version_code ost1 -lt $(version_code 2.6.93)) ] && skip "LU-1956/LU-2261: stats not implemented on OSD ZFS" && return + save_writethrough $p roc_hit_init log "Turn on read and write cache" @@ -10406,10 +10710,18 @@ test_156() { fi rm -f $file + restore_lustre_params < $p + rm -f $p } run_test 156 "Verification of tunables" #Changelogs +cleanup_changelog () { + trap 0 + echo "Deregistering changelog client $CL_USER" + do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister $CL_USER +} + err17935 () { if [[ $MDSCOUNT -gt 1 ]]; then error_ignore bz17935 $* @@ -10450,10 +10762,12 @@ test_160a() { local CL_USERS="mdd.$MDT0.changelog_users" local GET_CL_USERS="do_facet $SINGLEMDS $LCTL get_param -n $CL_USERS" - USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_register -n) - echo "Registered as changelog user $USER" - $GET_CL_USERS | grep -q $USER || - error "User $USER not found in changelog_users" + CL_USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 \ + changelog_register -n) + echo "Registered as changelog user 
$CL_USER" + trap cleanup_changelog EXIT + $GET_CL_USERS | grep -q $CL_USER || + error "User $CL_USER not found in changelog_users" # change something test_mkdir -p $DIR/$tdir/pics/2008/zachy @@ -10497,9 +10811,9 @@ test_160a() { [ "$fidc" == "$fidf" ] || err17935 "pfid in changelog $fidc != dir fid $fidf" - USER_REC1=$($GET_CL_USERS | awk "\$1 == \"$USER\" {print \$2}") - $LFS changelog_clear $MDT0 $USER $(($USER_REC1 + 5)) - USER_REC2=$($GET_CL_USERS | awk "\$1 == \"$USER\" {print \$2}") + USER_REC1=$($GET_CL_USERS | awk "\$1 == \"$CL_USER\" {print \$2}") + $LFS changelog_clear $MDT0 $CL_USER $(($USER_REC1 + 5)) + USER_REC2=$($GET_CL_USERS | awk "\$1 == \"$CL_USER\" {print \$2}") echo "verifying user clear: $(( $USER_REC1 + 5 )) == $USER_REC2" [ $USER_REC2 == $(($USER_REC1 + 5)) ] || err17935 "user index expected $(($USER_REC1 + 5)) is $USER_REC2" @@ -10514,7 +10828,7 @@ test_160a() { # LU-3446 changelog index reset on MDT restart local MDT_DEV=$(mdsdevname ${SINGLEMDS//mds/}) CUR_REC1=$($GET_CL_USERS | head -n1 | cut -f3 -d' ') - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 stop $SINGLEMDS || error "Fail to stop MDT." start $SINGLEMDS $MDT_DEV $MDS_MOUNT_OPTS || error "Fail to start MDT." 
CUR_REC2=$($GET_CL_USERS | head -n1 | cut -f3 -d' ') @@ -10523,19 +10837,19 @@ test_160a() { err17935 "current index should be $CUR_REC1 is $CUR_REC2" echo "verifying user deregister" - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister $USER - $GET_CL_USERS | grep -q $USER && - error "User $USER still in changelog_users" + cleanup_changelog + $GET_CL_USERS | grep -q $CL_USER && + error "User $CL_USER still in changelog_users" USERS=$(( $($GET_CL_USERS | wc -l) - 2 )) - if [ $USERS -eq 0 ]; then + if [ $USERS -eq 0 ]; then LAST_REC1=$($GET_CL_USERS | head -n1 | cut -f3 -d' ') touch $DIR/$tdir/chloe LAST_REC2=$($GET_CL_USERS | head -n1 | cut -f3 -d' ') echo "verify changelogs are off: $LAST_REC1 == $LAST_REC2" [ $LAST_REC1 == $LAST_REC2 ] || error "changelogs not off" else - echo "$USERS other changelog users; can't verify off" + echo "$USERS other changelog users; can't verify off" fi } run_test 160a "changelog sanity" @@ -10548,10 +10862,12 @@ test_160b() { # LU-3587 local CL_USERS="mdd.$MDT0.changelog_users" local GET_CL_USERS="do_facet $SINGLEMDS $LCTL get_param -n $CL_USERS" - USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_register -n) - echo "Registered as changelog user $USER" - $GET_CL_USERS | grep -q $USER || - error "User $USER not found in changelog_users" + CL_USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 \ + changelog_register -n) + echo "Registered as changelog user $CL_USER" + trap cleanup_changelog EXIT + $GET_CL_USERS | grep -q $CL_USER || + error "User $CL_USER not found in changelog_users" local LONGNAME1=$(str_repeat a 255) local LONGNAME2=$(str_repeat b 255) @@ -10563,11 +10879,8 @@ test_160b() { # LU-3587 mv $LONGNAME1 $LONGNAME2 $LFS changelog $MDT0 | grep RENME - - echo "deregistering $USER" - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister $USER - rm -f $LONGNAME2 + cleanup_changelog } run_test 160b "Verify that very long rename doesn't crash in changelog" @@ -10584,8 +10897,9 @@ test_160c() { [
$PARALLEL == "yes" ] && skip "skip parallel run" && return # Registration step - local USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 \ + CL_USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 \ changelog_register -n) + trap cleanup_changelog EXIT rm -rf $DIR/$tdir mkdir -p $DIR/$tdir @@ -10597,11 +10911,10 @@ test_160c() { $LFS changelog $MDT0 TRUNCS=$($LFS changelog $MDT0 | tail -5 | grep -c "TRUNC") [ $TRUNCS -eq 1 ] || err17935 "TRUNC changelog mask count $TRUNCS != 1" - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 # Deregistration step - echo "deregistering $USER" - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister $USER + cleanup_changelog } run_test 160c "verify that changelog log catch the truncate event" @@ -10617,21 +10930,22 @@ test_160d() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return # Registration step - local USER=$(do_facet mds1 $LCTL --device $MDT0 \ + CL_USER=$(do_facet mds1 $LCTL --device $MDT0 \ changelog_register -n) + trap cleanup_changelog EXIT mkdir -p $DIR/$tdir/migrate_dir - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 $LFS migrate -m 1 $DIR/$tdir/migrate_dir || error "migrate fails" $LFS changelog $MDT0 MIGRATES=$($LFS changelog $MDT0 | tail -5 | grep -c "MIGRT") - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 [ $MIGRATES -eq 1 ] || error "MIGRATE changelog mask count $MIGRATES != 1" # Deregistration step - do_facet mds1 $LCTL --device $MDT0 changelog_deregister $USER + cleanup_changelog } run_test 160d "verify that changelog log catch the migrate event" @@ -10680,8 +10994,7 @@ run_test 161a "link ea sanity" test_161b() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - [ $MDSCOUNT -lt 2 ] && - skip "skipping remote directory test" && return + [ $MDSCOUNT -lt 2 ] && skip "skipping remote directory test" && return local MDTIDX=1 local remote_dir=$DIR/$tdir/remote_dir @@ -10739,8 +11052,10 @@ test_161c() { # define 
CLF_RENAME_LAST 0x0001 # rename overwrite a target having nlink = 1 (changelog flag 0x1) - local USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 \ + CL_USER=$(do_facet $SINGLEMDS $LCTL --device $MDT0 \ changelog_register -n) + + trap cleanup_changelog EXIT rm -rf $DIR/$tdir mkdir -p $DIR/$tdir touch $DIR/$tdir/foo_161c @@ -10749,10 +11064,8 @@ test_161c() { $LFS changelog $MDT0 | grep RENME local flags=$($LFS changelog $MDT0 | grep RENME | tail -1 | \ cut -f5 -d' ') - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 if [ x$flags != "x0x1" ]; then - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister \ - $USER error "flag $flags is not 0x1" fi echo "rename overwrite a target having nlink = 1," \ @@ -10765,10 +11078,8 @@ test_161c() { mv -f $DIR/$tdir/foo_161c $DIR/$tdir/bar_161c $LFS changelog $MDT0 | grep RENME flags=$($LFS changelog $MDT0 | grep RENME | tail -1 | cut -f5 -d' ') - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 if [ x$flags != "x0x0" ]; then - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister \ - $USER error "flag $flags is not 0x0" fi echo "rename overwrite a target having nlink > 1," \ @@ -10779,10 +11090,8 @@ test_161c() { mv -f $DIR/$tdir/foo_161c $DIR/$tdir/foo2_161c $LFS changelog $MDT0 | grep RENME flags=$($LFS changelog $MDT0 | grep RENME | tail -1 | cut -f5 -d' ') - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 if [ x$flags != "x0x0" ]; then - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister \ - $USER error "flag $flags is not 0x0" fi echo "rename doesn't overwrite a target," \ @@ -10793,10 +11102,8 @@ test_161c() { rm -f $DIR/$tdir/foo2_161c $LFS changelog $MDT0 | grep UNLNK flags=$($LFS changelog $MDT0 | grep UNLNK | tail -1 | cut -f5 -d' ') - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 if [ x$flags != "x0x1" ]; then - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister \ - $USER 
error "flag $flags is not 0x1" fi echo "unlink a file having nlink = 1," \ @@ -10807,15 +11114,13 @@ test_161c() { rm -f $DIR/$tdir/foobar_161c $LFS changelog $MDT0 | grep UNLNK flags=$($LFS changelog $MDT0 | grep UNLNK | tail -1 | cut -f5 -d' ') - $LFS changelog_clear $MDT0 $USER 0 + $LFS changelog_clear $MDT0 $CL_USER 0 if [ x$flags != "x0x0" ]; then - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister \ - $USER error "flag $flags is not 0x0" fi echo "unlink a file having nlink > 1," \ "changelog record has flags of $flags" - do_facet $SINGLEMDS $LCTL --device $MDT0 changelog_deregister $USER + cleanup_changelog } run_test 161c "check CL_RENME[UNLINK] changelog record flags" @@ -11303,6 +11608,8 @@ test_184b() { run_test 184b "Forbidden layout swap (will generate errors)" test_184c() { + local cmpn_arg=$(cmp -n 2>&1 | grep "invalid option") + [ -n "$cmpn_arg" ] && skip_env "cmp does not support -n" && return check_swap_layouts_support && return 0 local dir0=$DIR/$tdir/$testnum @@ -11427,6 +11734,7 @@ test_185() { # LU-2441 local mtime1=$(stat -c "%Y" $DIR/$tdir) local fid=$($MULTIOP $DIR/$tdir VFw4096c) || error "cannot create/write a volatile file" + [ "$FILESET" == "" ] && $CHECKSTAT -t file $MOUNT/.lustre/fid/$fid 2>/dev/null && error "FID is still valid after close" @@ -11441,8 +11749,10 @@ test_185() { # LU-2441 # is unfortunately eaten by multiop_bg_pause local n=$((${fidv[1]} + 1)) local next_fid="${fidv[0]}:$(printf "0x%x" $n):${fidv[2]}" - $CHECKSTAT -t file $MOUNT/.lustre/fid/$next_fid || - error "FID is missing before close" + if [ "$FILESET" == "" ]; then + $CHECKSTAT -t file $MOUNT/.lustre/fid/$next_fid || + error "FID is missing before close" + fi kill -USR1 $multi_pid # 1 second delay, so if mtime change we will see it sleep 1 @@ -11493,6 +11803,7 @@ run_test 187b "Test data version change on volatile file" test_200() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return remote_mgs_nodsh && skip "remote MGS with nodsh" && return 
+ [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return local POOL=${POOL:-cea1} local POOL_ROOT=${POOL_ROOT:-$DIR/d200.pools} @@ -11731,10 +12042,11 @@ jobstats_set() { } cleanup_205() { + trap 0 do_facet $SINGLEMDS \ $LCTL set_param mdt.*.job_cleanup_interval=$OLD_INTERVAL [ $OLD_JOBENV != $JOBENV ] && jobstats_set $OLD_JOBENV - do_facet $SINGLEMDS lctl --device $MDT0 changelog_deregister $CL_USER + cleanup_changelog } test_205() { # Job stats @@ -11792,6 +12104,7 @@ test_205() { # Job stats cmd="dd if=/dev/zero of=$DIR/$tfile bs=1M count=1 oflag=sync" verify_jobstats "$cmd" "ost1" # read + cancel_lru_locks osc cmd="dd if=$DIR/$tfile of=/dev/null bs=1M count=1 iflag=direct" verify_jobstats "$cmd" "ost1" # truncate @@ -11801,8 +12114,10 @@ test_205() { # Job stats cmd="mv -f $DIR/$tfile $DIR/$tdir.rename" verify_jobstats "$cmd" "$SINGLEMDS" # jobstats expiry - sleep until old stats should be expired - local left=$((interval_new + 2 - (SECONDS - start))) - [ $left -ge 0 ] && echo "sleep $left for expiry" && sleep $((left + 1)) + local left=$((interval_new + 5 - (SECONDS - start))) + [ $left -ge 0 ] && wait_update_facet $SINGLEMDS \ + "lctl get_param *.*.job_stats | grep -c 'job_id.*mkdir'" \ + "0" $left cmd="mkdir $DIR/$tdir.expire" verify_jobstats "$cmd" "$SINGLEMDS" [ $(do_facet $SINGLEMDS lctl get_param *.*.job_stats | @@ -12297,16 +12612,16 @@ run_test 222a "AGL for ls should not trigger CLIO lock failure ================" test_222b () { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return - rm -rf $DIR/$tdir - test_mkdir -p $DIR/$tdir - $SETSTRIPE -c 1 -i 0 $DIR/$tdir - createmany -o $DIR/$tdir/$tfile 10 - cancel_lru_locks mdc - cancel_lru_locks osc - #define OBD_FAIL_LDLM_AGL_DELAY 0x31a - $LCTL set_param fail_loc=0x31a - rm -r $DIR/$tdir || "AGL for rmdir failed" - $LCTL set_param fail_loc=0 + rm -rf $DIR/$tdir + test_mkdir -p $DIR/$tdir + $SETSTRIPE -c 1 -i 0 $DIR/$tdir + createmany -o $DIR/$tdir/$tfile 10 + cancel_lru_locks mdc + 
cancel_lru_locks osc + #define OBD_FAIL_LDLM_AGL_DELAY 0x31a + $LCTL set_param fail_loc=0x31a + rm -r $DIR/$tdir || error "AGL for rmdir failed" + $LCTL set_param fail_loc=0 } run_test 222b "AGL for rmdir should not trigger CLIO lock failure =============" @@ -12350,6 +12665,12 @@ run_test 224b "Don't panic on bulk IO failure" test_224c() { # LU-6441 [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return + + local p="$TMP/$TESTSUITE-$TESTNAME.parameters" + save_writethrough $p + set_cache writethrough on + local pages_per_rpc=$($LCTL get_param \ osc.*.max_pages_per_rpc) local at_max=$($LCTL get_param -n at_max) @@ -12367,10 +12688,11 @@ test_224c() { # LU-6441 error "conf_param timeout=5 failed" #define OBD_FAIL_PTLRPC_CLIENT_BULK_CB3 0x520 - $LCTL set_param fail_loc=0x520 + do_facet ost1 $LCTL set_param fail_loc=0x520 + $LFS setstripe -c 1 -i 0 $DIR/$tfile dd if=/dev/zero of=$DIR/$tfile bs=8MB count=1 sync - $LCTL set_param fail_loc=0 + do_facet ost1 $LCTL set_param fail_loc=0 set_conf_param_and_check client "$test_at" "$param_at" $at_max || error "conf_param at_max=$at_max failed" @@ -12378,6 +12700,8 @@ test_224c() { # LU-6441 $timeout || error "conf_param timeout=$timeout failed" $LCTL set_param -n $pages_per_rpc + restore_lustre_params < $p + rm -f $p } run_test 224c "Don't hang if one of md lost during large bulk RPC" @@ -13031,7 +13355,7 @@ test_230f() { # a should be migrated to MDT1, since no other links on MDT0 $LFS migrate -m 1 $DIR/$tdir/migrate_dir || - error "migrate dir fails" + error "#1 migrate dir fails" mdt_index=$($LFS getstripe -M $DIR/$tdir/migrate_dir) [ $mdt_index == 1 ] || error "migrate_dir is not on MDT1" mdt_index=$($LFS getstripe -M $DIR/$tdir/migrate_dir/a) @@ -13039,12 +13363,12 @@ test_230f() { # a should stay on MDT1, because it is a mulitple link file $LFS migrate -m 0 $DIR/$tdir/migrate_dir || - error "migrate dir fails" + error "#2 migrate dir fails" 
mdt_index=$($LFS getstripe -M $DIR/$tdir/migrate_dir/a) [ $mdt_index == 1 ] || error "a is not on MDT1" $LFS migrate -m 1 $DIR/$tdir/migrate_dir || - error "migrate dir fails" + error "#3 migrate dir fails" a_fid=$($LFS path2fid $DIR/$tdir/migrate_dir/a) ln_fid=$($LFS path2fid $DIR/$tdir/other_dir/ln1) @@ -13055,7 +13379,7 @@ test_230f() { # a should be migrated to MDT0, since no other links on MDT1 $LFS migrate -m 0 $DIR/$tdir/migrate_dir || - error "migrate dir fails" + error "#4 migrate dir fails" mdt_index=$($LFS getstripe -M $DIR/$tdir/migrate_dir/a) [ $mdt_index == 0 ] || error "a is not on MDT0" @@ -13102,6 +13426,20 @@ test_230h() { } run_test 230h "migrate .. and root" +test_230i() { + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return + + mkdir -p $DIR/$tdir/migrate_dir + + $LFS migrate -m 1 $DIR/$tdir/migrate_dir/ || + error "migration fails with a tailing slash" + + $LFS migrate -m 0 $DIR/$tdir/migrate_dir// || + error "migration fails with two tailing slashes" +} +run_test 230i "lfs migrate -m tolerates trailing slashes" + test_231a() { # For simplicity this test assumes that max_pages_per_rpc @@ -13174,6 +13512,7 @@ run_test 232 "failed lock should not block umount" test_233a() { [ $(lustre_version_code $SINGLEMDS) -ge $(version_code 2.3.64) ] || { skip "Need MDS version at least 2.3.64"; return; } + [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return local fid=$($LFS path2fid $MOUNT) stat $MOUNT/.lustre/fid/$fid > /dev/null || @@ -13184,6 +13523,7 @@ run_test 233a "checking that OBF of the FS root succeeds" test_233b() { [ $(lustre_version_code $SINGLEMDS) -ge $(version_code 2.5.90) ] || { skip "Need MDS version at least 2.5.90"; return; } + [ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return local fid=$($LFS path2fid $MOUNT/.lustre) stat $MOUNT/.lustre/fid/$fid > /dev/null || @@ -13321,6 +13661,7 @@ test_239() { run_test 239 "osp_sync test" test_239a() { #LU-5297 
+ remote_mds_nodsh && skip "remote MDS with nodsh" && return touch $DIR/$tfile #define OBD_FAIL_OSP_CHECK_INVALID_REC 0x2100 do_facet $SINGLEMDS $LCTL set_param fail_loc=0x2100 @@ -13330,6 +13671,7 @@ test_239a() { #LU-5297 run_test 239a "process invalid osp sync record correctly" test_239b() { #LU-5297 + remote_mds_nodsh && skip "remote MDS with nodsh" && return touch $DIR/$tfile1 #define OBD_FAIL_OSP_CHECK_ENOMEM 0x2101 do_facet $SINGLEMDS $LCTL set_param fail_loc=0x2101 @@ -13344,6 +13686,7 @@ run_test 239b "process osp sync record with ENOMEM error correctly" test_240() { [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return mkdir -p $DIR/$tdir @@ -13376,7 +13719,7 @@ test_241_dio() { done } -test_241() { +test_241a() { # was test_241 dd if=/dev/zero of=$DIR/$tfile count=1 bs=40960 ls -la $DIR/$tfile cancel_lru_locks osc @@ -13385,7 +13728,7 @@ test_241() { test_241_dio 1000 wait $PID } -run_test 241 "bio vs dio" +run_test 241a "bio vs dio" test_241b() { dd if=/dev/zero of=$DIR/$tfile count=1 bs=40960 @@ -13398,6 +13741,7 @@ test_241b() { run_test 241b "dio vs dio" test_242() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return mkdir -p $DIR/$tdir touch $DIR/$tdir/$tfile @@ -13453,6 +13797,7 @@ test_245() { run_test 245 "check mdc connection flag/data: multiple modify RPCs" test_246() { # LU-7371 + remote_ost_nodsh && skip "remote OST with nodsh" && return [ $(lustre_version_code ost1) -lt $(version_code 2.7.62) ] && skip "Need OST version >= 2.7.62" && return 0 do_facet ost1 $LCTL set_param fail_val=4095 @@ -13465,6 +13810,153 @@ test_246() { # LU-7371 } run_test 246 "Read file of size 4095 should return right length" +test_247a() { + lctl get_param -n mdc.$FSNAME-MDT0000*.import | + grep -q subtree || + { skip "Fileset feature is not supported"; return; } + + local submount=${MOUNT}_$tdir + + mkdir $MOUNT/$tdir + mkdir -p $submount || error "mkdir $submount failed" + 
FILESET="$FILESET/$tdir" mount_client $submount || + error "mount $submount failed" + echo foo > $submount/$tfile || error "write $submount/$tfile failed" + [ $(cat $MOUNT/$tdir/$tfile) = "foo" ] || + error "read $MOUNT/$tdir/$tfile failed" + umount_client $submount || error "umount $submount failed" + rmdir $submount +} +run_test 247a "mount subdir as fileset" + +test_247b() { + lctl get_param -n mdc.$FSNAME-MDT0000*.import | grep -q subtree || + { skip "Fileset feature is not supported"; return; } + + local submount=${MOUNT}_$tdir + + rm -rf $MOUNT/$tdir + mkdir -p $submount || error "mkdir $submount failed" + SKIP_FILESET=1 + FILESET="$FILESET/$tdir" mount_client $submount && + error "mount $submount should fail" + rmdir $submount +} +run_test 247b "mount subdir that dose not exist" + +test_247c() { + lctl get_param -n mdc.$FSNAME-MDT0000*.import | grep -q subtree || + { skip "Fileset feature is not supported"; return; } + + local submount=${MOUNT}_$tdir + + mkdir -p $MOUNT/$tdir/dir1 + mkdir -p $submount || error "mkdir $submount failed" + FILESET="$FILESET/$tdir" mount_client $submount || + error "mount $submount failed" + local fid=$($LFS path2fid $MOUNT/) + $LFS fid2path $submount $fid && error "fid2path should fail" + umount_client $submount || error "umount $submount failed" + rmdir $submount +} +run_test 247c "running fid2path outside root" + +test_247d() { + lctl get_param -n mdc.$FSNAME-MDT0000*.import | grep -q subtree || + { skip "Fileset feature is not supported"; return; } + + local submount=${MOUNT}_$tdir + + mkdir -p $MOUNT/$tdir/dir1 + mkdir -p $submount || error "mkdir $submount failed" + FILESET="$FILESET/$tdir" mount_client $submount || + error "mount $submount failed" + local fid=$($LFS path2fid $submount/dir1) + $LFS fid2path $submount $fid || error "fid2path should succeed" + umount_client $submount || error "umount $submount failed" + rmdir $submount +} +run_test 247d "running fid2path inside root" + +# LU-8037 +test_247e() { + lctl 
get_param -n mdc.$FSNAME-MDT0000*.import | + grep -q subtree || + { skip "Fileset feature is not supported"; return; } + + local submount=${MOUNT}_$tdir + + mkdir $MOUNT/$tdir + mkdir -p $submount || error "mkdir $submount failed" + FILESET="$FILESET/.." mount_client $submount && + error "mount $submount should fail" + rmdir $submount +} +run_test 247e "mount .. as fileset" + +test_248() { + local fast_read_sav=$($LCTL get_param -n llite.*.fast_read 2>/dev/null) + [ -z "$fast_read_sav" ] && skip "no fast read support" && return + + # create a large file for fast read verification + dd if=/dev/zero of=$DIR/$tfile bs=1M count=128 > /dev/null 2>&1 + + # make sure the file is created correctly + $CHECKSTAT -s $((128*1024*1024)) $DIR/$tfile || + { rm -f $DIR/$tfile; skip "file creation error" && return; } + + echo "Test 1: verify that fast read is 4 times faster on cache read" + + # small read with fast read enabled + $LCTL set_param -n llite.*.fast_read=1 + local t_fast=$(dd if=$DIR/$tfile of=/dev/null bs=4k 2>&1 | + awk '/copied/ { print $6 }') + + # small read with fast read disabled + $LCTL set_param -n llite.*.fast_read=0 + local t_slow=$(dd if=$DIR/$tfile of=/dev/null bs=4k 2>&1 | + awk '/copied/ { print $6 }') + + # verify that fast read is 4 times faster for cache read + [ $(bc <<< "4 * $t_fast < $t_slow") -eq 1 ] || + error_not_in_vm "fast read was not 4 times faster: " \ + "$t_fast vs $t_slow" + + echo "Test 2: verify the performance between big and small read" + $LCTL set_param -n llite.*.fast_read=1 + + # 1k non-cache read + cancel_lru_locks osc + local t_1k=$(dd if=$DIR/$tfile of=/dev/null bs=1k 2>&1 | + awk '/copied/ { print $6 }') + + # 1M non-cache read + cancel_lru_locks osc + local t_1m=$(dd if=$DIR/$tfile of=/dev/null bs=1M 2>&1 | + awk '/copied/ { print $6 }') + + # verify that big IO is not 4 times faster than small IO + [ $(bc <<< "4 * $t_1k >= $t_1m") -eq 1 ] || + error_not_in_vm "bigger IO is way too fast: $t_1k vs $t_1m" + + $LCTL set_param -n
llite.*.fast_read=$fast_read_sav + rm -f $DIR/$tfile +} +run_test 248 "fast read verification" + +test_249() { # LU-7890 + rm -f $DIR/$tfile + $SETSTRIPE -c 1 $DIR/$tfile + + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.8.53) ] && + skip "Need at least version 2.8.54" && return + + # Offset 2T == 4k * 512M + dd if=/dev/zero of=$DIR/$tfile bs=4k count=1 seek=512M || + error "dd to 2T offset failed" +} +run_test 249 "Write above 2T file size" + test_250() { [ "$(facet_fstype ost$(($($GETSTRIPE -i $DIR/$tfile) + 1)))" = "zfs" ] \ && skip "no 16TB file size limit on ZFS" && return @@ -13504,6 +13996,8 @@ test_252() { local num local gen + remote_mds_nodsh && skip "remote MDS with nodsh" && return + remote_ost_nodsh && skip "remote OST with nodsh" && return if [ "$(facet_fstype ost1)" != "ldiskfs" -o \ "$(facet_fstype mds1)" != "ldiskfs" ]; then skip "can only run lr_reader on ldiskfs target" @@ -13547,6 +14041,499 @@ test_252() { } run_test 252 "check lr_reader tool" +test_253_fill_ost() { + local size_mb #how many MB should we write to pass watermark + local lwm=$3 #low watermark + local free_10mb #10% of free space + + free_kb=$($LFS df $MOUNT | grep $1 | awk '{ print $4 }') + size_mb=$((free_kb / 1024 - lwm)) + free_10mb=$((free_kb / 10240)) + #If 10% of free space cross low watermark use it + if (( free_10mb > size_mb )); then + size_mb=$free_10mb + else + #At least we need to store 1.1 of difference between + #free space and low watermark + size_mb=$((size_mb + size_mb / 10)) + fi + if (( lwm <= $((free_kb / 1024)) )) || [ !
-f $DIR/$tdir/1 ]; then + dd if=/dev/zero of=$DIR/$tdir/1 bs=1M count=$size_mb \ + oflag=append conv=notrunc + fi + + sleep_maxage + + free_kb=$($LFS df $MOUNT | grep $1 | awk '{ print $4 }') + echo "OST still has $((free_kb / 1024)) mbytes free" +} + +test_253() { + local ostidx=0 + local rc=0 + + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return + remote_mgs_nodsh && skip "remote MGS with nodsh" && return + + local ost_name=$($LFS osts | grep ${ostidx}": " | \ + awk '{print $2}' | sed -e 's/_UUID$//') + # on the mdt's osc + local mdtosc_proc1=$(get_mdtosc_proc_path $SINGLEMDS $ost_name) + do_facet $SINGLEMDS $LCTL get_param -n \ + osp.$mdtosc_proc1.reserved_mb_high || + { skip "remote MDS does not support reserved_mb_high" && + return; } + + rm -rf $DIR/$tdir + wait_mds_ost_sync + wait_delete_completed + mkdir $DIR/$tdir + + local last_wm_h=$(do_facet $SINGLEMDS $LCTL get_param -n \ + osp.$mdtosc_proc1.reserved_mb_high) + local last_wm_l=$(do_facet $SINGLEMDS $LCTL get_param -n \ + osp.$mdtosc_proc1.reserved_mb_low) + echo "prev high watermark $last_wm_h, prev low watermark $last_wm_l" + + do_facet mgs $LCTL pool_new $FSNAME.$TESTNAME || + error "Pool creation failed" + do_facet mgs $LCTL pool_add $FSNAME.$TESTNAME $ost_name || + error "Adding $ost_name to pool failed" + + # Wait for client to see a OST at pool + wait_update $HOSTNAME "$LCTL get_param -n + lov.$FSNAME-*.pools.$TESTNAME | sort -u | + grep $ost_name" "$ost_name""_UUID" $((TIMEOUT/2)) || + error "Client can not see the pool" + $SETSTRIPE $DIR/$tdir -i $ostidx -c 1 -p $FSNAME.$TESTNAME || + error "Setstripe failed" + + dd if=/dev/zero of=$DIR/$tdir/0 bs=1M count=10 + local blocks=$($LFS df $MOUNT | grep $ost_name | awk '{ print $4 }') + echo "OST still has $((blocks/1024)) mbytes free" + + local new_lwm=$((blocks/1024-10)) + do_facet $SINGLEMDS $LCTL set_param \ + osp.$mdtosc_proc1.reserved_mb_high=$((new_lwm+5)) + do_facet 
$SINGLEMDS $LCTL set_param \ + osp.$mdtosc_proc1.reserved_mb_low=$new_lwm + + test_253_fill_ost $ost_name $mdtosc_proc1 $new_lwm + + #First enospc could execute orphan deletion so repeat. + test_253_fill_ost $ost_name $mdtosc_proc1 $new_lwm + + local oa_status=$(do_facet $SINGLEMDS $LCTL get_param -n \ + osp.$mdtosc_proc1.prealloc_status) + echo "prealloc_status $oa_status" + + dd if=/dev/zero of=$DIR/$tdir/2 bs=1M count=1 && + error "File creation should fail" + #object allocation was stopped, but we still able to append files + dd if=/dev/zero of=$DIR/$tdir/1 bs=1M seek=6 count=5 oflag=append || + error "Append failed" + rm -f $DIR/$tdir/1 $DIR/$tdir/0 $DIR/$tdir/r* + + wait_delete_completed + + sleep_maxage + + for i in $(seq 10 12); do + dd if=/dev/zero of=$DIR/$tdir/$i bs=1M count=1 2>/dev/null || + error "File creation failed after rm"; + done + + oa_status=$(do_facet $SINGLEMDS $LCTL get_param -n \ + osp.$mdtosc_proc1.prealloc_status) + echo "prealloc_status $oa_status" + + if (( oa_status != 0 )); then + error "Object allocation still disable after rm" + fi + do_facet $SINGLEMDS $LCTL set_param \ + osp.$mdtosc_proc1.reserved_mb_high=$last_wm_h + do_facet $SINGLEMDS $LCTL set_param \ + osp.$mdtosc_proc1.reserved_mb_low=$last_wm_l + + + do_facet mgs $LCTL pool_remove $FSNAME.$TESTNAME $ost_name || + error "Remove $ost_name from pool failed" + do_facet mgs $LCTL pool_destroy $FSNAME.$TESTNAME || + error "Pool destroy fialed" +} +run_test 253 "Check object allocation limit" + +test_254() { + local cl_user + + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return + do_facet mds1 $LCTL get_param -n mdd.$MDT0.changelog_size || + { skip "MDS does not support changelog_size" && return; } + + cl_user=$(do_facet mds1 $LCTL --device $MDT0 changelog_register -n) + echo "Registered as changelog user $cl_user" + + $LFS changelog_clear $MDT0 $cl_user 0 + + local size1=$(do_facet mds1 \ + $LCTL get_param -n 
mdd.$MDT0.changelog_size) + echo "Changelog size $size1" + + rm -rf $DIR/$tdir + $LFS mkdir -i 0 $DIR/$tdir + # change something + mkdir -p $DIR/$tdir/pics/2008/zachy + touch $DIR/$tdir/pics/2008/zachy/timestamp + cp /etc/hosts $DIR/$tdir/pics/2008/zachy/pic1.jpg + mv $DIR/$tdir/pics/2008/zachy $DIR/$tdir/pics/zach + ln $DIR/$tdir/pics/zach/pic1.jpg $DIR/$tdir/pics/2008/portland.jpg + ln -s $DIR/$tdir/pics/2008/portland.jpg $DIR/$tdir/pics/desktop.jpg + rm $DIR/$tdir/pics/desktop.jpg + + local size2=$(do_facet mds1 \ + $LCTL get_param -n mdd.$MDT0.changelog_size) + echo "Changelog size after work $size2" + + do_facet mds1 $LCTL --device $MDT0 changelog_deregister $cl_user + + if (( size2 <= size1 )); then + error "Changelog size after work should be greater than original" + fi + return 0 +} +run_test 254 "Check changelog size" + +ladvise_no_type() +{ + local type=$1 + local file=$2 + + lfs ladvise -a invalid $file 2>&1 | grep "Valid types" | + awk -F: '{print $2}' | grep $type > /dev/null + if [ $? -ne 0 ]; then + return 0 + fi + return 1 +} + +ladvise_no_ioctl() +{ + local file=$1 + + lfs ladvise -a willread $file > /dev/null 2>&1 + if [ $? -eq 0 ]; then + return 1 + fi + + lfs ladvise -a willread $file 2>&1 | + grep "Inappropriate ioctl for device" > /dev/null + if [ $? 
-eq 0 ]; then + return 0 + fi + return 1 +} + +ladvise_willread_performance() +{ + local repeat=10 + local average_cache=0 + local average_ladvise=0 + + for ((i = 1; i <= $repeat; i++)); do + echo "Iter $i/$repeat: reading without willread hint" + cancel_lru_locks osc + do_nodes $(comma_list $(osts_nodes)) \ + "echo 3 > /proc/sys/vm/drop_caches" + local speed_origin=$($READS -f $DIR/$tfile -s $size \ + -b 4096 -n $((size / 4096)) -t 60 | + sed -e '/^$/d' -e 's#.*s, ##' -e 's#MB/s##') + + echo "Iter $i/$repeat: Reading again without willread hint" + cancel_lru_locks osc + local speed_cache=$($READS -f $DIR/$tfile -s $size \ + -b 4096 -n $((size / 4096)) -t 60 | + sed -e '/^$/d' -e 's#.*s, ##' -e 's#MB/s##') + + echo "Iter $i/$repeat: reading with willread hint" + cancel_lru_locks osc + do_nodes $(comma_list $(osts_nodes)) \ + "echo 3 > /proc/sys/vm/drop_caches" + lfs ladvise -a willread $DIR/$tfile || + error "Ladvise failed" + local speed_ladvise=$($READS -f $DIR/$tfile -s $size \ + -b 4096 -n $((size / 4096)) -t 60 | + sed -e '/^$/d' -e 's#.*s, ##' -e 's#MB/s##') + + local cache_speedup=$(echo "scale=2; \ + ($speed_cache-$speed_origin)/$speed_origin*100" | bc) + cache_speedup=$(echo ${cache_speedup%.*}) + echo "Iter $i/$repeat: cache speedup: $cache_speedup%" + average_cache=$((average_cache + cache_speedup)) + + local ladvise_speedup=$(echo "scale=2; \ + ($speed_ladvise-$speed_origin)/$speed_origin*100" | bc) + ladvise_speedup=$(echo ${ladvise_speedup%.*}) + echo "Iter $i/$repeat: ladvise speedup: $ladvise_speedup%" + average_ladvise=$((average_ladvise + ladvise_speedup)) + done + average_cache=$((average_cache / repeat)) + average_ladvise=$((average_ladvise / repeat)) + + if [ $average_cache -lt 20 ]; then + echo "Speedup with cache is less than 20% ($average_cache%),"\ + "skipping check of speedup with willread:"\ + "$average_ladvise%" + return 0 + fi + + local lowest_speedup=$((average_cache / 2)) + [ $average_ladvise -gt $lowest_speedup ] || + error_not_in_vm 
"Speedup with willread is less than " \ + "$lowest_speedup%, got $average_ladvise%" + echo "Speedup with willread ladvise: $average_ladvise%" + echo "Speedup with cache: $average_cache%" +} + +test_255a() { + lfs setstripe -c -1 -i 0 $DIR/$tfile || error "$tfile failed" + + ladvise_no_type willread $DIR/$tfile && + skip "willread ladvise is not supported" && return + + ladvise_no_ioctl $DIR/$tfile && + skip "ladvise ioctl is not supported" && return + + [ $(lustre_version_code ost1) -lt $(version_code 2.8.54) ] && + skip "lustre < 2.8.54 does not support ladvise " && return + + local size_mb=100 + local size=$((size_mb * 1048576)) + dd if=/dev/zero of=$DIR/$tfile bs=1048576 count=$size_mb || + error "dd to $DIR/$tfile failed" + + lfs ladvise -a willread $DIR/$tfile || + error "Ladvise failed with no range argument" + + lfs ladvise -a willread -s 0 $DIR/$tfile || + error "Ladvise failed with no -l or -e argument" + + lfs ladvise -a willread -e 1 $DIR/$tfile || + error "Ladvise failed with only -e argument" + + lfs ladvise -a willread -l 1 $DIR/$tfile || + error "Ladvise failed with only -l argument" + + lfs ladvise -a willread -s 2 -e 1 $DIR/$tfile && + error "End offset should not be smaller than start offset" + + lfs ladvise -a willread -s 2 -e 2 $DIR/$tfile && + error "End offset should not be equal to start offset" + + lfs ladvise -a willread -s $size -l 1 $DIR/$tfile || + error "Ladvise failed with overflowing -s argument" + + lfs ladvise -a willread -s 1 -e $((size + 1)) $DIR/$tfile || + error "Ladvise failed with overflowing -e argument" + + lfs ladvise -a willread -s 1 -l $size $DIR/$tfile || + error "Ladvise failed with overflowing -l argument" + + lfs ladvise -a willread -l 1 -e 2 $DIR/$tfile && + error "Ladvise succeeded with conflicting -l and -e arguments" + + echo "Synchronous ladvise should wait" + local delay=4 +#define OBD_FAIL_OST_LADVISE_PAUSE 0x237 + do_nodes $(comma_list $(osts_nodes)) \ + $LCTL set_param fail_val=$delay fail_loc=0x237 + + local 
start_ts=$SECONDS + lfs ladvise -a willread $DIR/$tfile || + error "Ladvise failed with no range argument" + local end_ts=$SECONDS + local inteval_ts=$((end_ts - start_ts)) + + if [ $inteval_ts -lt $(($delay - 1)) ]; then + error "Synchronous advice didn't wait reply" + fi + + echo "Asynchronous ladvise shouldn't wait" + local start_ts=$SECONDS + lfs ladvise -a willread -b $DIR/$tfile || + error "Ladvise failed with no range argument" + local end_ts=$SECONDS + local inteval_ts=$((end_ts - start_ts)) + + if [ $inteval_ts -gt $(($delay / 2)) ]; then + error "Asynchronous advice blocked" + fi + + do_nodes $(comma_list $(osts_nodes)) $LCTL set_param fail_loc=0 + ladvise_willread_performance +} +run_test 255a "check 'lfs ladvise -a willread'" + +facet_meminfo() { + local facet=$1 + local info=$2 + + do_facet $facet "cat /proc/meminfo | grep ^${info}:" | awk '{print $2}' +} + +test_255b() { + ladvise_no_type dontneed $DIR/$tfile && + skip "dontneed ladvise is not supported" && return + + ladvise_no_ioctl $DIR/$tfile && + skip "ladvise ioctl is not supported" && return + + [ $(lustre_version_code ost1) -lt $(version_code 2.8.54) ] && + skip "lustre < 2.8.54 does not support ladvise" && return + + [ "$(facet_fstype ost1)" = "zfs" ] && + skip "zfs-osd does not support dontneed advice" && return + + lfs setstripe -c 1 -i 0 $DIR/$tfile + + local size_mb=100 + local size=$((size_mb * 1048576)) + # In order to prevent disturbance of other processes, only check 3/4 + # of the memory usage + local kibibytes=$((size_mb * 1024 * 3 / 4)) + + dd if=/dev/zero of=$DIR/$tfile bs=1048576 count=$size_mb || + error "dd to $DIR/$tfile failed" + + local total=$(facet_meminfo ost1 MemTotal) + echo "Total memory: $total KiB" + + do_facet ost1 "sync && echo 3 > /proc/sys/vm/drop_caches" + local before_read=$(facet_meminfo ost1 Cached) + echo "Cache used before read: $before_read KiB" + + lfs ladvise -a willread $DIR/$tfile || + error "Ladvise willread failed" + local after_read=$(facet_meminfo 
ost1 Cached) + echo "Cache used after read: $after_read KiB" + + lfs ladvise -a dontneed $DIR/$tfile || + error "Ladvise dontneed again failed" + local no_read=$(facet_meminfo ost1 Cached) + echo "Cache used after dontneed ladvise: $no_read KiB" + + if [ $total -lt $((before_read + kibibytes)) ]; then + echo "Memory is too small, abort checking" + return 0 + fi + + if [ $((before_read + kibibytes)) -gt $after_read ]; then + error "Ladvise willread should use more memory" \ + "than $kibibytes KiB" + fi + + if [ $((no_read + kibibytes)) -gt $after_read ]; then + error "Ladvise dontneed should release more memory" \ + "than $kibibytes KiB" + fi +} +run_test 255b "check 'lfs ladvise -a dontneed'" + +test_256() { + local cl_user + local cat_sl + local mdt_dev + + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return + [ "$(facet_fstype mds1)" != "ldiskfs" ] && + skip "non-ldiskfs backend" && return + + mdt_dev=$(mdsdevname 1) + echo $mdt_dev + cl_user=$(do_facet mds1 \ + "$LCTL get_param -n mdd.$MDT0.changelog_users | grep cl") + if [[ -n $cl_user ]]; then + skip "active changelog user" + return + fi + + cl_user=$(do_facet mds1 $LCTL --device $MDT0 changelog_register -n) + echo "Registered as changelog user $cl_user" + + rm -rf $DIR/$tdir + mkdir -p $DIR/$tdir + + $LFS changelog_clear $MDT0 $cl_user 0 + + # change something + touch $DIR/$tdir/{1..10} + + # stop the MDT + stop mds1 || error "Fail to stop MDT." + + # remount the MDT + start mds1 $mdt_dev $MDS_MOUNT_OPTS || error "Fail to start MDT." 
+ + #after mount new plainllog is used + touch $DIR/$tdir/{11..19} + cat_sl=$(do_facet mds1 \ + "$DEBUGFS -R \\\"dump changelog_catalog cat.dmp\\\" $mdt_dev; \ + llog_reader cat.dmp | grep \\\"type=1064553b\\\" | wc -l") + + if (( cat_sl != 2 )); then + do_facet mds1 $LCTL --device $MDT0 changelog_deregister $cl_user + error "Changelog catalog has wrong number of slots $cat_sl" + fi + + $LFS changelog_clear $MDT0 $cl_user 0 + + cat_sl=$(do_facet mds1 \ + "$DEBUGFS -R \\\"dump changelog_catalog cat.dmp\\\" $mdt_dev; \ + llog_reader cat.dmp | grep \\\"type=1064553b\\\" | wc -l") + + do_facet mds1 $LCTL --device $MDT0 changelog_deregister $cl_user + + if (( cat_sl == 2 )); then + error "Empty plain llog was not deleted from changelog catalog" + fi + if (( cat_sl != 1 )); then + error "Active plain llog shouldn\`t be deleted from catalog" + fi +} +run_test 256 "Check llog delete for empty and not full state" + +test_257() { + remote_mds_nodsh && skip "remote MDS with nodsh" && return + [[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.8.55) ]] && + skip "Need MDS version at least 2.8.55" && return + + test_mkdir -p $DIR/$tdir + + setfattr -n trusted.name1 -v value1 $DIR/$tdir || + error "setfattr -n trusted.name1=value1 $DIR/$tdir failed" + stat $DIR/$tdir + +#define OBD_FAIL_MDS_XATTR_REP 0x161 + local mdtidx=$($LFS getstripe -M $DIR/$tdir) + local facet=mds$((mdtidx + 1)) + set_nodes_failloc $(facet_active_host $facet) 0x80000161 + getfattr -n trusted.name1 $DIR/$tdir 2> /dev/null + + stop $facet || error "stop MDS failed" + start $facet $(mdsdevname $((mdtidx + 1))) $MDS_MOUNT_OPTS || + error "start MDS fail" +} +run_test 257 "xattr locks are not lost" + +test_260() { +#define OBD_FAIL_MDC_CLOSE 0x806 + $LCTL set_param fail_loc=0x80000806 + touch $DIR/$tfile + +} +run_test 260 "Check mdc_close fail" cleanup_test_300() { trap 0 @@ -13617,6 +14604,8 @@ test_striped_dir() { } test_300a() { + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.7.0) ] && + 
skip "skipped for lustre < 2.7.0" && return [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return @@ -13626,6 +14615,8 @@ test_300a() { run_test 300a "basic striped dir sanity test" test_300b() { + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.7.0) ] && + skip "skipped for lustre < 2.7.0" && return [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return local i @@ -13656,6 +14647,8 @@ test_300b() { run_test 300b "check ctime/mtime for striped dir" test_300c() { + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.7.0) ] && + skip "skipped for lustre < 2.7.0" && return [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return local file_count @@ -13679,6 +14672,8 @@ test_300c() { run_test 300c "chown && check ls under striped directory" test_300d() { + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.7.0) ] && + skip "skipped for lustre < 2.7.0" && return [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return local stripe_count @@ -14147,6 +15142,7 @@ run_test 300o "unlink big sub stripe(> 65000 subdirs)" test_300p() { [ $PARALLEL == "yes" ] && skip "skip parallel run" && return [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return + remote_mds_nodsh && skip "remote MDS with nodsh" && return mkdir -p $DIR/$tdir @@ -14162,6 +15158,26 @@ test_300p() { } run_test 300p "create striped directory without space" +test_300q() { + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return + + local fd=$(free_fd) + local cmd="exec $fd<$tdir" + cd $DIR + $LFS mkdir -c $MDSCOUNT $tdir || error "create $tdir fails" + eval $cmd + cmd="exec $fd<&-" + trap "eval $cmd" EXIT + cd $tdir || error "cd $tdir fails" + rmdir ../$tdir || error "rmdir $tdir fails" + 
mkdir local_dir && error "create dir succeeds" + $LFS setdirstripe -i1 remote_dir && error "create remote dir succeeds" + eval $cmd + return 0 +} +run_test 300q "create remote directory under orphan directory" + prepare_remote_file() { mkdir $DIR/$tdir/src_dir || error "create remote source failed" @@ -14236,6 +15252,196 @@ test_310c() { } run_test 310c "open-unlink remote file with multiple links" +#LU-4825 +test_311() { + [ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.8.54) ] && + skip "lustre < 2.8.54 does not contain LU-4825 fix" && return + [ $PARALLEL == "yes" ] && skip "skip parallel run" && return + + local old_iused=$($LFS df -i | grep OST0000 | awk '{ print $3 }') + + mkdir -p $DIR/$tdir + $SETSTRIPE -i 0 -c 1 $DIR/$tdir + createmany -o $DIR/$tdir/$tfile. 1000 + + # statfs data is not real time, let's just calculate it + old_iused=$((old_iused + 1000)) + + local count=$(do_facet $SINGLEMDS "lctl get_param -n \ + osp.*OST0000*MDT0000.create_count") + local max_count=$(do_facet $SINGLEMDS "lctl get_param -n \ + osp.*OST0000*MDT0000.max_create_count") + for idx in $(seq $MDSCOUNT); do + do_facet mds$idx "lctl set_param -n \ + osp.*OST0000*MDT000?.max_create_count=0" + done + + $SETSTRIPE -i 0 $DIR/$tdir/$tfile || error "setstripe failed" + local index=$($GETSTRIPE -i $DIR/$tdir/$tfile) + [ $index -ne 0 ] || error "$tfile stripe index is 0" + + unlinkmany $DIR/$tdir/$tfile. 
1000 + + for idx in $(seq $MDSCOUNT); do + do_facet mds$idx "lctl set_param -n \ + osp.*OST0000*MDT000?.max_create_count=$max_count" + do_facet mds$idx "lctl set_param -n \ + osp.*OST0000*MDT000?.create_count=$count" + done + + local new_iused + for i in $(seq 120); do + new_iused=$($LFS df -i | grep OST0000 | awk '{ print $3 }') + [ $((old_iused - new_iused)) -gt 800 ] && break + sleep 1 + done + + echo "waited $i sec, old Iused $old_iused, new Iused $new_iused" + [ $((old_iused - new_iused)) -gt 800 ] || + error "objs not destroyed after unlink" +} +run_test 311 "disable OSP precreate, and unlink should destroy objs" + +zfs_oid_to_objid() +{ + local ost=$1 + local objid=$2 + + local vdevdir=$(dirname $(facet_vdevice $ost)) + local cmd="$ZDB -e -p $vdevdir -dddd $(facet_device $ost)" + local zfs_zapid=$(do_facet $ost $cmd | + grep -w "/O/0/d$((objid%32))" -C 5 | + awk '/Object/{getline; print $1}') + local zfs_objid=$(do_facet $ost $cmd $zfs_zapid | + awk "/$objid = /"'{printf $3}') + + echo $zfs_objid +} + +zfs_object_blksz() { + local ost=$1 + local objid=$2 + + local vdevdir=$(dirname $(facet_vdevice $ost)) + local cmd="$ZDB -e -p $vdevdir -dddd $(facet_device $ost)" + local blksz=$(do_facet $ost $cmd $objid | + awk '/dblk/{getline; printf $4}') + + case "${blksz: -1}" in + k|K) blksz=$((${blksz:0:$((${#blksz} - 1))}*1024)) ;; + m|M) blksz=$((${blksz:0:$((${#blksz} - 1))}*1024*1024)) ;; + *) ;; + esac + + echo $blksz +} + +test_312() { # LU-4856 + [ $(facet_fstype ost1) = "zfs" ] || + { skip "the test only applies to zfs" && return; } + + local max_blksz=$(do_facet ost1 \ + $ZFS get -p recordsize $(facet_device ost1) | + awk '!/VALUE/{print $3}') + + # to make life a little bit easier + $LFS mkdir -c 1 -i 0 $DIR/$tdir + $LFS setstripe -c 1 -i 0 $DIR/$tdir + + local tf=$DIR/$tdir/$tfile + touch $tf + local oid=$($LFS getstripe $tf | awk '/obdidx/{getline; print $2}') + + # Get ZFS object id + local zfs_objid=$(zfs_oid_to_objid ost1 $oid) + + # block size change 
by sequential over write + local blksz + for ((bs=4096; bs <= max_blksz; bs <<= 2)); do + dd if=/dev/zero of=$tf bs=$bs count=1 oflag=sync conv=notrunc + + blksz=$(zfs_object_blksz ost1 $zfs_objid) + [ $blksz -eq $bs ] || error "blksz error: $blksz, expected: $bs" + done + rm -f $tf + + # block size change by sequential append write + dd if=/dev/zero of=$tf bs=4K count=1 oflag=sync conv=notrunc + oid=$($LFS getstripe $tf | awk '/obdidx/{getline; print $2}') + zfs_objid=$(zfs_oid_to_objid ost1 $oid) + + for ((count = 1; count < $((max_blksz / 4096)); count *= 2)); do + dd if=/dev/zero of=$tf bs=4K count=$count seek=$count \ + oflag=sync conv=notrunc + + blksz=$(zfs_object_blksz ost1 $zfs_objid) + blksz=$((blksz / 8192)) # in 2*4K unit + [ $blksz -eq $count ] || + error "blksz error(in 8k): $blksz, expected: $count" + done + rm -f $tf + + # random write + touch $tf + oid=$($LFS getstripe $tf | awk '/obdidx/{getline; print $2}') + zfs_objid=$(zfs_oid_to_objid ost1 $oid) + + dd if=/dev/zero of=$tf bs=8K count=1 oflag=sync conv=notrunc + blksz=$(zfs_object_blksz ost1 $zfs_objid) + [ $blksz -eq 8192 ] || error "blksz error: $blksz, expected: 8k" + + dd if=/dev/zero of=$tf bs=64K count=1 oflag=sync conv=notrunc seek=128 + blksz=$(zfs_object_blksz ost1 $zfs_objid) + [ $blksz -eq 65536 ] || error "blksz error: $blksz, expected: 64k" + + dd if=/dev/zero of=$tf bs=1M count=1 oflag=sync conv=notrunc + blksz=$(zfs_object_blksz ost1 $zfs_objid) + [ $blksz -eq 65536 ] || error "rewrite error: $blksz, expected: 64k" +} +run_test 312 "make sure ZFS adjusts its block size by write pattern" + +test_399() { # LU-7655 for OST fake write + # turn off debug for performance testing + local saved_debug=$($LCTL get_param -n debug) + $LCTL set_param debug=0 + + $SETSTRIPE -c 1 -i 0 $DIR/$tfile + + # get ost1 size - lustre-OST0000 + local ost1_avail_size=$($LFS df | awk /${ost1_svc}/'{ print $4 }') + local blocks=$((ost1_avail_size/2/1024)) # half avail space by megabytes + [ $blocks -gt 1000 
] && blocks=1000 # 1G in maximum + + local start_time=$(date +%s.%N) + dd if=/dev/zero of=$DIR/$tfile bs=1M count=$blocks oflag=sync || + error "real dd writing error" + local duration=$(bc <<< "$(date +%s.%N) - $start_time") + rm -f $DIR/$tfile + + # define OBD_FAIL_OST_FAKE_WRITE 0x238 + do_facet ost1 $LCTL set_param fail_loc=0x238 + + local start_time=$(date +%s.%N) + dd if=/dev/zero of=$DIR/$tfile bs=1M count=$blocks oflag=sync || + error "fake dd writing error" + local duration_fake=$(bc <<< "$(date +%s.%N) - $start_time") + + # verify file size + cancel_lru_locks osc + $CHECKSTAT -t file -s $((blocks * 1024 * 1024)) $DIR/$tfile || + error "$tfile size not $blocks MB" + + do_facet ost1 $LCTL set_param fail_loc=0 + + echo "fake write $duration_fake vs. normal write $duration in seconds" + [ $(bc <<< "$duration_fake < $duration") -eq 1 ] || + error_not_in_vm "fake write is slower" + + $LCTL set_param -n debug="$saved_debug" + rm -f $DIR/$tfile +} +run_test 399 "fake write should not be slower than normal write" + test_400a() { # LU-1606, was conf-sanity test_74 local extra_flags='' local out=$TMP/$tfile @@ -14258,6 +15464,7 @@ test_400a() { # LU-1606, was conf-sanity test_74 $CC -Wall -Werror $extra_flags -llustreapi -o $out $prog || error "client api broken" done + rm -f $out } run_test 400a "Lustre client api program can compile and link" @@ -14290,21 +15497,104 @@ test_400b() { # LU-1606, LU-5011 $CC -Wall -Werror -include $header -c -x c /dev/null -o $out || error "cannot compile '$header'" done + rm -f $out } run_test 400b "packaged headers can be compiled" -test_401() { #LU-7437 +test_401a() { #LU-7437 + local printf_arg=$(find -printf 2>&1 | grep "unrecognized:") + [ -n "$printf_arg" ] && skip_env "find does not support -printf" && + return #count the number of parameters by "list_param -R" local params=$($LCTL list_param -R '*' 2>/dev/null | wc -l) #count the number of parameters by listing proc files - local procs=$(find -L $proc_dirs -mindepth 1 
2>/dev/null | wc -l) + local procs=$(find -L $proc_dirs -mindepth 1 -printf '%P\n' 2>/dev/null| + sort -u | wc -l) + + [ $params -eq $procs ] || + error "found $params parameters vs. $procs proc files" + + # test the list_param -D option only returns directories + params=$($LCTL list_param -R -D '*' 2>/dev/null | wc -l) + #count the number of parameters by listing proc directories + procs=$(find -L $proc_dirs -mindepth 1 -type d -printf '%P\n' 2>/dev/null | + sort -u | wc -l) [ $params -eq $procs ] || error "found $params parameters vs. $procs proc files" } -run_test 401 "Verify if 'lctl list_param -R' can list parameters recursively" +run_test 401a "Verify if 'lctl list_param -R' can list parameters recursively" + +test_401b() { + local save=$($LCTL get_param -n jobid_var) + local tmp=testing + + $LCTL set_param foo=bar jobid_var=$tmp bar=baz && + error "no error returned when setting bad parameters" + + local jobid_new=$($LCTL get_param -n foe jobid_var baz) + [[ "$jobid_new" == "$tmp" ]] || error "jobid tmp $jobid_new != $tmp" + + $LCTL set_param -n fog=bam jobid_var=$save bat=fog + local jobid_old=$($LCTL get_param -n foe jobid_var bag) + [[ "$jobid_old" == "$save" ]] || error "jobid new $jobid_old != $save" +} +run_test 401b "Verify 'lctl {get,set}_param' continue after error" + +test_401c() { + local jobid_var_old=$($LCTL get_param -n jobid_var) + local jobid_var_new + + $LCTL set_param jobid_var= && + error "no error returned for 'set_param a='" + + jobid_var_new=$($LCTL get_param -n jobid_var) + [[ "$jobid_var_old" == "$jobid_var_new" ]] || + error "jobid_var was changed by setting without value" + + $LCTL set_param jobid_var && + error "no error returned for 'set_param a'" + + jobid_var_new=$($LCTL get_param -n jobid_var) + [[ "$jobid_var_old" == "$jobid_var_new" ]] || + error "jobid_var was changed by setting without value" +} +run_test 401c "Verify 'lctl set_param' without value fails in either format." 

# Verify that 'lctl set_param' accepts a value that itself contains '=',
# in both the "name=value" and the "name value" argument formats.
# jobid_var is used as the scratch parameter and is set back to its
# original value after each format is checked.
test_401d() {
	local jobid_var_old=$($LCTL get_param -n jobid_var)
	local jobid_var_new
	local new_value="foo=bar"

	$LCTL set_param jobid_var="$new_value" ||
		error "'set_param a=b' did not accept a value containing '='"

	jobid_var_new=$($LCTL get_param -n jobid_var)
	[[ "$jobid_var_new" == "$new_value" ]] ||
		error "'set_param a=b' failed on a value containing '='"

	# Reset the jobid_var to test the other format
	$LCTL set_param jobid_var="$jobid_var_old"
	jobid_var_new=$($LCTL get_param -n jobid_var)
	[[ "$jobid_var_new" == "$jobid_var_old" ]] ||
		error "failed to reset jobid_var"

	$LCTL set_param jobid_var "$new_value" ||
		error "'set_param a b' did not accept a value containing '='"

	jobid_var_new=$($LCTL get_param -n jobid_var)
	[[ "$jobid_var_new" == "$new_value" ]] ||
		error "'set_param a b' failed on a value containing '='"

	$LCTL set_param jobid_var "$jobid_var_old"
	jobid_var_new=$($LCTL get_param -n jobid_var)
	[[ "$jobid_var_new" == "$jobid_var_old" ]] ||
		error "failed to reset jobid_var"
}
run_test 401d "Verify 'lctl set_param' accepts values containing '='"

test_402() {
	remote_mds_nodsh && skip "remote MDS with nodsh" && return
	$LFS setdirstripe -i 0 $DIR/$tdir || error "setdirstripe -i 0 failed"
#define OBD_FAIL_MDS_FLD_LOOKUP 0x15c
	do_facet mds1 "lctl set_param fail_loc=0x8000015c"
	# @@ -14313,6 +15603,195 @@ test_402() {
	# NOTE(review): the lines of test_402 between the two diff hunks are
	# not part of this excerpt; only the visible lines are reproduced.
}
run_test 402 "Return ENOENT to lod_generate_and_set_lovea"

# Check that the link count reported by stat does not drop to zero when
# the inode is reached through a second hard link while the first stat
# is still in flight.
test_403() {
	local file1=$DIR/$tfile.1
	local file2=$DIR/$tfile.2
	# scratch file holding the stat output; deliberately not named
	# "tfile" so the framework's $tfile is not shadowed
	local out=$TMP/$tfile
	local stat_pid
	local nlink

	rm -f $file1 $file2 $out

	touch $file1
	ln $file1 $file2

	# 30 sec OBD_TIMEOUT in ll_getattr()
	# right before populating st_nlink
	$LCTL set_param fail_loc=0x80001409
	stat -c %h $file1 > $out &
	stat_pid=$!

	# create an alias, drop all locks and reclaim the dentry
	< $file2
	cancel_lru_locks mdc
	cancel_lru_locks osc
	sysctl -w vm.drop_caches=2

	# wait only for the backgrounded stat, not for unrelated jobs
	wait $stat_pid

	nlink=$(cat $out)
	[ "$nlink" -gt 0 ] || error "wrong nlink count: $nlink"

	rm -f $out $file1 $file2
}
run_test 403 "i_nlink should not drop to zero due to aliasing"

# For every OSP device listed by 'lctl dl' on $SINGLEMDS, deactivate it
# and expect state IN, then activate it again and expect state UP.
test_404() { # LU-6601
	remote_mds_nodsh && skip "remote MDS with nodsh" && return

	local mosps=$(do_facet $SINGLEMDS $LCTL dl |
		awk '/osp .*-osc-MDT/ { print $4}')
	local osp
	local stat

	for osp in $mosps; do
		echo "Deactivate: " $osp
		do_facet $SINGLEMDS $LCTL --device %$osp deactivate
		# column 2 of 'lctl dl' is the device state
		stat=$(do_facet $SINGLEMDS $LCTL dl |
			awk -vp=$osp '$4 == p { print $2 }')
		[ "$stat" = IN ] || {
			do_facet $SINGLEMDS $LCTL dl | grep -w $osp
			error "deactivate error"
		}

		echo "Activate: " $osp
		do_facet $SINGLEMDS $LCTL --device %$osp activate
		stat=$(do_facet $SINGLEMDS $LCTL dl |
			awk -vp=$osp '$4 == p { print $2 }')
		[ "$stat" = UP ] || {
			do_facet $SINGLEMDS $LCTL dl | grep -w $osp
			error "activate error"
		}
	done
}
run_test 404 "validate manual {de}activated works properly for OSPs"

# Run swap_lock_test against a fresh test directory. Skipped on MDS
# versions older than 2.6.92 and when check_swap_layouts_support
# returns success.
test_405() {
	[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.6.92) ] &&
		skip "Layout swap lock is not supported" && return

	check_swap_layouts_support && return 0

	test_mkdir -p $DIR/$tdir
	swap_lock_test -d $DIR/$tdir ||
		error "One layout swap locked test failed"
}
run_test 405 "Various layout swap lock tests"

# Check how files in a striped directory pick up striping from the
# directory default and from the filesystem ($MOUNT) default, then put
# the filesystem default back and remove the temporary pool.
test_406() {
	[ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return
	[ $OSTCOUNT -lt 2 ] && skip "needs >= 2 OSTs" && return
	[ -n "$FILESET" ] && skip "SKIP due to FILESET set" && return
	[ $PARALLEL == "yes" ] && skip "skip parallel run" && return
	[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.8.50) ] &&
		skip "Need MDS version at least 2.8.50" && return

	# remember the filesystem defaults so they can be restored
	local def_stripenr=$($GETSTRIPE -c $MOUNT)
	local def_stripe_size=$($GETSTRIPE -S $MOUNT)
	local def_stripe_offset=$($GETSTRIPE -i $MOUNT)
	local def_pool=$($GETSTRIPE -p $MOUNT)

	local test_pool=$TESTNAME
	local i
	local f
	local count
	local offset
	local size
	local pool

	pool_add $test_pool || error "pool_add failed"
	pool_add_targets $test_pool 0 $(($OSTCOUNT - 1)) 1 ||
		error "pool_add_targets failed"

	# parent set default stripe count only, child will stripe from both
	# parent and fs default
	$SETSTRIPE -c 1 -i 1 -S $((def_stripe_size * 2)) -p $test_pool $MOUNT ||
		error "setstripe $MOUNT failed"
	$LFS mkdir -c $MDSCOUNT $DIR/$tdir || error "mkdir $tdir failed"
	$SETSTRIPE -c $OSTCOUNT $DIR/$tdir || error "setstripe $tdir failed"
	for i in $(seq 10); do
		f=$DIR/$tdir/$tfile.$i
		touch $f || error "touch failed"
		count=$($GETSTRIPE -c $f)
		[ "$count" -eq $OSTCOUNT ] ||
			error "$f stripe count $count != $OSTCOUNT"
		offset=$($GETSTRIPE -i $f)
		[ "$offset" -eq 1 ] || error "$f stripe offset $offset != 1"
		size=$($GETSTRIPE -S $f)
		[ "$size" -eq $((def_stripe_size * 2)) ] ||
			error "$f stripe size $size != $((def_stripe_size * 2))"
		pool=$($GETSTRIPE -p $f)
		[ "$pool" == "$test_pool" ] ||
			error "$f pool $pool != $test_pool"
	done

	# change fs default striping, delete parent default striping, now child
	# will stripe from new fs default striping only
	$SETSTRIPE -c 1 -S $def_stripe_size -i 0 $MOUNT ||
		error "change $MOUNT default stripe failed"
	$SETSTRIPE -c 0 $DIR/$tdir || error "delete $tdir default stripe failed"
	for i in $(seq 11 20); do
		f=$DIR/$tdir/$tfile.$i
		touch $f || error "touch $f failed"
		count=$($GETSTRIPE -c $f)
		[ "$count" -eq 1 ] || error "$f stripe count $count != 1"
		offset=$($GETSTRIPE -i $f)
		[ "$offset" -eq 0 ] || error "$f stripe offset $offset != 0"
		size=$($GETSTRIPE -S $f)
		[ "$size" -eq $def_stripe_size ] ||
			error "$f stripe size $size != $def_stripe_size"
		pool=$($GETSTRIPE -p $f)
		[ -z "$pool" ] || error "$f pool $pool is set"
	done

	unlinkmany $DIR/$tdir/$tfile. 1 20

	# restore FS default striping
	if [ -z "$def_pool" ]; then
		$SETSTRIPE -c $def_stripenr -S $def_stripe_size \
			-i $def_stripe_offset $MOUNT ||
			error "restore default striping failed"
	else
		$SETSTRIPE -c $def_stripenr -S $def_stripe_size -p $def_pool \
			-i $def_stripe_offset $MOUNT ||
			error "restore default striping with $def_pool failed"
	fi

	f=$DIR/$tdir/$tfile
	pool_remove_all_targets $test_pool $f
	pool_remove $test_pool $f
}
run_test 406 "DNE support fs default striping"

# With fail_loc 0x2019 set on every MDT, a striped mkdir and a rename
# between directories on different MDTs are both expected to fail.
test_407() {
	[ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" && return

	[[ $(lustre_version_code $SINGLEMDS) -lt $(version_code 2.8.55) ]] &&
		skip "Need MDS version at least 2.8.55" && return

	local idx

	$LFS mkdir -i 0 -c 1 $DIR/$tdir.0 ||
		error "$LFS mkdir -i 0 -c 1 $tdir.0 failed"
	$LFS mkdir -i 1 -c 1 $DIR/$tdir.1 ||
		error "$LFS mkdir -i 1 -c 1 $tdir.1 failed"
	touch $DIR/$tdir.0/$tfile.0 || error "touch $tdir.0/$tfile.0 failed"

	#define OBD_FAIL_DT_TXN_STOP 0x2019
	for idx in $(seq $MDSCOUNT); do
		do_facet mds$idx "lctl set_param fail_loc=0x2019"
	done
	$LFS mkdir -c 2 $DIR/$tdir && error "$LFS mkdir -c 2 $tdir should fail"
	mv $DIR/$tdir.0/$tfile.0 $DIR/$tdir.1/$tfile.1 &&
		error "mv $tdir.0/$tfile.0 $tdir.1/$tfile.1 should fail"

	# disarm the fail_loc again so it does not stay set on the MDTs
	# once this test has finished
	for idx in $(seq $MDSCOUNT); do
		do_facet mds$idx "lctl set_param fail_loc=0"
	done
	true
}
run_test 407 "transaction fail should cause operation fail"

# Force a partial-page write to fail, then create and remove a batch of
# files and drop caches; the test passes if drop_caches returns.
test_408() {
	dd if=/dev/zero of=$DIR/$tfile bs=4096 count=1 oflag=direct ||
		error "dd to $DIR/$tfile failed"

	#define OBD_FAIL_OSC_BRW_PREP_REQ2 0x40a
	$LCTL set_param fail_loc=0x8000040a
	# let ll_prepare_partial_page() fail
	dd if=/dev/zero of=$DIR/$tfile bs=2048 count=1 conv=notrunc || true

	rm -f $DIR/$tfile

	# create at least 100 unused inodes so that
	# shrink_icache_memory(0) should not return 0
	touch $DIR/$tfile-{0..100}
	rm -f $DIR/$tfile-{0..100}
	sync

	echo 2 > /proc/sys/vm/drop_caches
}
run_test 408 "drop_caches should not hang due to page leaks"

#
# tests that do cleanup/setup should be run at the end
#