X-Git-Url: https://git.whamcloud.com/?a=blobdiff_plain;f=lustre%2Ftests%2Fconf-sanity.sh;h=e3a56c7cd7305970306ededc46765543483c05eb;hb=276c22ae3869c1f775cded248d53b9c2a829c801;hp=7795fafd0cf92279864ef1b0d6bb9ef5bc21a954;hpb=9b4b2523d9a432ca10ee48cc0276d324e893801b;p=fs%2Flustre-release.git diff --git a/lustre/tests/conf-sanity.sh b/lustre/tests/conf-sanity.sh index 7795faf..e3a56c7 100644 --- a/lustre/tests/conf-sanity.sh +++ b/lustre/tests/conf-sanity.sh @@ -15,14 +15,12 @@ init_logging ALWAYS_EXCEPT="$CONF_SANITY_EXCEPT 32newtarball" # bug number for skipped test: LU-11915 -ALWAYS_EXCEPT="$ALWAYS_EXCEPT 110 115" +ALWAYS_EXCEPT="$ALWAYS_EXCEPT 110" # UPDATE THE COMMENT ABOVE WITH BUG NUMBERS WHEN CHANGING ALWAYS_EXCEPT! if $SHARED_KEY; then # bug number for skipped tests: LU-9795 (all below) - ALWAYS_EXCEPT="$ALWAYS_EXCEPT 0 31 32a 32d 35a" - ALWAYS_EXCEPT="$ALWAYS_EXCEPT 53a 53b 54b 76a 76b" - ALWAYS_EXCEPT="$ALWAYS_EXCEPT 76c 76d 78 103" + ALWAYS_EXCEPT="$ALWAYS_EXCEPT 84 86 103" fi if ! combined_mgs_mds; then @@ -532,6 +530,9 @@ test_5h() { run_test 5h "start mdt failure at mdt_fs_setup()" test_5i() { + (( $MDS1_VERSION >= $(version_code 2.12.54) )) || + skip "Need MDS version at least 2.12.54" + setup stop mds1 @@ -595,6 +596,27 @@ test_9() { } run_test 9 "test ptldebug and subsystem for mkfs" +test_10a() { + setup + + if ! combined_mgs_mds; then + files=$(do_facet mgs "find /{proc/fs,sys/fs,sys/kernel/debug}/lustre -type l -exec test ! -e {} \; -print") + [ -z $files ] || echo "MGS $files is a broken symlink" + fi + + files=$(do_facet mds1 "find /{proc/fs,sys/fs,sys/kernel/debug}/lustre -type l -exec test ! -e {} \; -print") + [ -z $files ] || echo "MDS $files is a broken symlink" + + files=$(do_facet ost1 "find /{proc/fs,sys/fs,sys/kernel/debug}/lustre -type l -exec test ! -e {} \; -print") + [ -z $files ] || echo "OSS $files is a broken symlink" + + files=$(do_facet client "find /{proc/fs,sys/fs,sys/kernel/debug}/lustre -type l -exec test ! -e {} \; -print") + [ -z $files ] || echo "clients $files is a broken symlink" + + cleanup || error "cleanup failed with rc $?" +} +run_test 10a "find lctl param broken symlinks" + # # Test 16 was to "verify that lustre will correct the mode of OBJECTS". # But with new MDS stack we don't care about the mode of local objects @@ -1884,8 +1906,9 @@ t32_test() { mkfsoptions="--mkfsoptions=\\\"-J size=8\\\"" fi - add $SINGLEMDS $(mkfs_opts mds2 $fs2mdsdev $fsname) --reformat \ - $mkfsoptions $fs2mdsdev $fs2mdsvdev > /dev/null || { + add $SINGLEMDS $(mds2failover_HOST="" \ + mkfs_opts mds2 $fs2mdsdev $fsname) --reformat \ + $mkfsoptions $fs2mdsdev $fs2mdsvdev > /dev/null || { error_noexit "Mkfs new MDT failed" return 1 } @@ -2077,11 +2100,10 @@ t32_test() { shall_cleanup_lustre=true $r $LCTL set_param debug="$PTLDEBUG" - # Leave re-enabling this to a separate patch for LU-11558 - # t32_verify_quota $SINGLEMDS $fsname $tmp/mnt/lustre || { - # error_noexit "verify quota failed" - # return 1 - #} + t32_verify_quota $SINGLEMDS $fsname $tmp/mnt/lustre || { + error_noexit "verify quota failed" + return 1 + } if $r test -f $tmp/list; then # @@ -3266,7 +3288,7 @@ test_43a() { echo "222" > $DIR/$tfile-rootfile || error "write 2 failed" chmod go-rw $DIR/$tfile-rootfile || error "chmod 2 faield" - mkdir $DIR/$tdir-rootdir || error "mkdir failed" + mkdir_on_mdt0 $DIR/$tdir-rootdir || error "mkdir failed" chmod go-rwx $DIR/$tdir-rootdir || error "chmod 3 failed" touch $DIR/$tdir-rootdir/tfile-1 || error "touch failed" @@ -3934,7 +3956,7 @@ test_50i() { start_ost2 || error "Unable to start OST2" mount_client $MOUNT || error "client start failed" - mkdir $DIR/$tdir || error "mkdir $DIR/$tdir failed" + mkdir_on_mdt0 $DIR/$tdir || error "mkdir $DIR/$tdir failed" if [[ $PERM_CMD == *"set_param -P"* ]]; then $PERM_CMD mdc.${FSNAME}-MDT0001-mdc-*.active=0 && @@ -5013,8 +5035,9 @@ test_69() { if [ $num_create -gt 0 ]; then # Check the number of inodes available on OST0 local files=0 - local ifree=$($LFS df -i $MOUNT | awk '/OST0000/ { print $4 }') - log "On OST0, $ifree inodes available. Want $num_create." + local ifree=$($LFS df -i $MOUNT | + awk '/OST0000/ { print $4 }'; exit ${PIPESTATUS[0]}) + log "On OST0, $ifree inodes available. Want $num_create. rc=$?" $LFS setstripe -i 0 $DIR/$tdir || error "$LFS setstripe -i 0 $DIR/$tdir failed" @@ -5050,8 +5073,9 @@ test_69() { local idx=$($LFS getstripe -i $DIR/$tdir/$tfile-last) [ $idx -ne 0 ] && error "$DIR/$tdir/$tfile-last on $idx not 0" || true - local iused=$($LFS df -i $MOUNT | awk '/OST0000/ { print $3 }') - log "On OST0, $iused used inodes" + local iused=$($LFS df -i $MOUNT | + awk '/OST0000/ { print $3 }'; exit ${PIPESTATUS[0]}) + log "On OST0, $iused used inodes rc=$?" [ $iused -ge $((ost_max_pre/2 + 1000)) ] && error "OST replacement created too many inodes; $iused" cleanup || error "cleanup failed with $?" @@ -5998,7 +6022,8 @@ test_82a() { # LU-4665 mount_client $MOUNT || error "mount client $MOUNT failed" wait_osts_up - $LFS df $MOUNT || error "$LFS df $MOUNT failed" + $LFS df $MOUNT + check_lfs_df_ret_val $? || error "$LFS df $MOUNT failed" mkdir $DIR/$tdir || error "mkdir $DIR/$tdir failed" stack_trap "do_nodes $(comma_list $(mdts_nodes)) \ @@ -6113,7 +6138,8 @@ test_82b() { # LU-4665 mount_client $MOUNT || error "mount client $MOUNT failed" wait_osts_up - $LFS df $MOUNT || error "$LFS df $MOUNT failed" + $LFS df $MOUNT + check_lfs_df_ret_val $? || error "$LFS df $MOUNT failed" mkdir $DIR/$tdir || error "mkdir $DIR/$tdir failed" # Create a new pool and add OSTs into it. @@ -6466,12 +6492,15 @@ test_89() { # LU-7131 stopall - [ "$mds1_FSTYPE" == zfs ] && import_zpool mds1 + if [[ "$mds1_FSTYPE" == zfs ]]; then + import_zpool mds1 || return ${PIPESTATUS[0]} + fi + # Check that parameters are added correctly echo "tunefs --param $key=$val1" - do_facet mds "$TUNEFS --param $key=$val1 $mdsdev >/dev/null" || + do_facet mds1 "$TUNEFS --param $key=$val1 $mdsdev >/dev/null" || error "tunefs --param $key=$val1 failed" - params=$(do_facet mds $TUNEFS --dryrun $mdsdev) || + params=$(do_facet mds1 $TUNEFS --dryrun $mdsdev) || error "tunefs --dryrun failed" params=${params##*Parameters:} params=${params%%exiting*} @@ -6480,9 +6509,9 @@ test_89() { # LU-7131 # Check that parameters replace existing instances when added echo "tunefs --param $key=$val2" - do_facet mds "$TUNEFS --param $key=$val2 $mdsdev >/dev/null" || + do_facet mds1 "$TUNEFS --param $key=$val2 $mdsdev >/dev/null" || error "tunefs --param $key=$val2 failed" - params=$(do_facet mds $TUNEFS --dryrun $mdsdev) || + params=$(do_facet mds1 $TUNEFS --dryrun $mdsdev) || error "tunefs --dryrun failed" params=${params##*Parameters:} params=${params%%exiting*} @@ -6493,9 +6522,9 @@ test_89() { # LU-7131 # Check that a parameter is erased properly echo "tunefs --erase-param $key" - do_facet mds "$TUNEFS --erase-param $key $mdsdev >/dev/null" || + do_facet mds1 "$TUNEFS --erase-param $key $mdsdev >/dev/null" || error "tunefs --erase-param $key failed" - params=$(do_facet mds $TUNEFS --dryrun $mdsdev) || + params=$(do_facet mds1 $TUNEFS --dryrun $mdsdev) || error "tunefs --dryrun failed" params=${params##*Parameters:} params=${params%%exiting*} @@ -6503,22 +6532,25 @@ test_89() { # LU-7131 error "on-disk parameter not erased correctly via tunefs" # Check that all the parameters are erased + do_facet mds1 "$TUNEFS --param $key=$val1 $mdsdev >/dev/null" || + error "tunefs --param $key=$val1 failed" echo "tunefs --erase-params" - do_facet mds "$TUNEFS --erase-params $mdsdev >/dev/null" || + do_facet mds1 "$TUNEFS --erase-params $mdsdev >/dev/null" || error "tunefs --erase-params failed" - params=$(do_facet mds $TUNEFS --dryrun $mdsdev) || + params=$(do_facet mds1 $TUNEFS --dryrun $mdsdev) || error "tunefs --dryrun failed" params=${params##*Parameters:} params=${params%%exiting*} - [ -z $params ] || - error "all on-disk parameters not erased correctly via tunefs" + params=$(echo $params | tr ' ' '\n') + [ -z "$params" ] || + error "all on-disk parameters not erased correctly via tunefs $params" # Check the order of options --erase-params and --param echo "tunefs --param $key=$val1 --erase-params" - do_facet mds \ + do_facet mds1 \ "$TUNEFS --param $key=$val1 --erase-params $mdsdev >/dev/null"|| error "tunefs --param $key=$val1 --erase-params failed" - params=$(do_facet mds $TUNEFS --dryrun $mdsdev) || + params=$(do_facet mds1 $TUNEFS --dryrun $mdsdev) || error "tunefs --dryrun failed" params=${params##*Parameters:} params=${params%%exiting*} @@ -6871,7 +6903,7 @@ check_uuid_on_ost() { check_uuid_on_mdt() { local nid=$1 - do_facet $SINGLEMDS "$LCTL get_param mdt.${FSNAME}*.exports.'$nid'.uuid" + do_facet $SINGLEMDS "$LCTL get_param mdt.${mds1_svc}*.exports.'$nid'.uuid" } test_91() { @@ -6915,6 +6947,7 @@ test_91() { echo "evict $nid" do_facet $SINGLEMDS \ "$LCTL set_param -n mdt.${mds1_svc}.evict_client nid:$nid" + sleep 1 # eviction above is async, give it some time to proceed found=$(check_uuid_on_mdt $nid | grep $uuid) [ -n "$found" ] && error "found $uuid $nid on MDT" @@ -6937,63 +6970,33 @@ generate_ldev_conf() { local ldevconfpath=$1 local fstype= local fsldevformat="" - touch $ldevconfpath + rm -f $ldevconfpath - fstype=$(facet_fstype mgs) - if [ "$fstype" == zfs ]; then - fsldevformat="$fstype:" - else + local facets="mgs,$(get_facets OST),$(get_facets MDS)" + for facet in ${facets//,/ }; do fsldevformat="" - fi - - printf "%s\t-\t%s-MGS0000\t%s%s\n" \ - $mgs_HOST \ - $FSNAME \ - $fsldevformat \ - $(mgsdevname) > $ldevconfpath - - local mdsfo_host=$mdsfailover_HOST; - if [ -z "$mdsfo_host" ]; then - mdsfo_host="-" - fi - - for num in $(seq $MDSCOUNT); do - fstype=$(facet_fstype mds$num) - if [ "$fstype" == zfs ]; then - fsldevformat="$fstype:" - else - fsldevformat="" - fi - - printf "%s\t%s\t%s-MDT%04d\t%s%s\n" \ - $mds_HOST \ - $mdsfo_host \ - $FSNAME \ - $num \ - $fsldevformat \ - $(mdsdevname $num) >> $ldevconfpath - done - - local ostfo_host=$ostfailover_HOST; - if [ -z "$ostfo_host" ]; then - ostfo_host="-" - fi - - for num in $(seq $OSTCOUNT); do - fstype=$(facet_fstype ost$num) - if [ "$fstype" == zfs ]; then - fsldevformat="$fstype:" - else - fsldevformat="" + fstype=$(facet_fstype $facet) + [ "$fstype" = zfs ] && fsldevformat="$fstype:" + local host=$(facet_host $facet) + local fo="-" + local varfo=${facet}failover_HOST + if [ $facet == mgs ] && combined_mgs_mds; then + varfo=mds1failover_HOST fi - - printf "%s\t%s\t%s-OST%04d\t%s%s\n" \ - $ost_HOST \ - $ostfo_host \ + [ -n "${!varfo}" ] && fo=${!varfo} + local type=$(echo $facet | tr -d "[:digit:]" | \ + tr "[:lower:]" "[:upper:]" | sed s/MDS/MDT/ ) + local num=1 + [ ${facet} == mgs ] || + num=$(facet_number $facet) + printf "%s\t%s\t%s-%s%04x\t%s%s\n" \ + ${host} \ + ${fo} \ $FSNAME \ - $num \ + $type \ + $(( num - 1 )) \ $fsldevformat \ - $(ostdevname $num) >> $ldevconfpath + $(facet_device $facet) >> $ldevconfpath done echo "----- $ldevconfpath -----" @@ -7015,8 +7018,8 @@ generate_nids() { } compare_ldev_output() { - ldev_output=$1 - expected_output=$2 + local ldev_output=$1 + local expected_output=$2 sort $expected_output -o $expected_output sort $ldev_output -o $ldev_output @@ -7047,30 +7050,27 @@ test_92() { generate_nids $NIDSPATH # echo the mgs nid and compare it to environment variable MGSNID - # also, ldev.conf and nids is a server side thing, use the OSS - # hostname - local output - output=$($LDEV -c $LDEVCONFPATH -H $ost_HOST -n $NIDSPATH echo %m) - - echo "-- START OF LDEV OUTPUT --" - echo -e "$output" - echo "--- END OF LDEV OUTPUT ---" - - # ldev failed, error - if [ $? -ne 0 ]; then - rm $LDEVCONFPATH $NIDSPATH - error "ldev failed to execute!" - fi - - # need to process multiple lines because of combined MGS and MDS - echo -e $output | awk '{ print $2 }' | while read -r line ; do - if [ "$line" != "$MGSNID" ]; then - rm $LDEVCONFPATH $NIDSPATH - error "ldev failed mgs nid '$line', expected '$MGSNID'" - fi + local facets="$(get_facets OST),$(get_facets MDS),mgs" + for facet in ${facets//,/ }; do + local host=$(facet_host $facet) + local output=$($LDEV -c $LDEVCONFPATH -H $host -n $NIDSPATH echo %m) + + echo "-- START OF LDEV OUTPUT --" + echo -e "$output" + echo "--- END OF LDEV OUTPUT ---" + + [ -z "$output" ] && + error "ldev failed to execute!" + + # need to process multiple lines because of + # several targets on host + echo -e $output | awk '{ print $2 }' | while read -r line ; do + [ "$line" = "$MGSNID" ] || + error "ldev failed mgs nid '$line', \ + expected '$MGSNID'" + done done - - rm $LDEVCONFPATH $NIDSPATH + rm -f $LDEVCONFPATH $NIDSPATH } run_test 92 "ldev returns MGS NID correctly in command substitution" @@ -7129,11 +7129,11 @@ test_94() { printf "%s-MGS0000\n" $FSNAME > $EXPECTED_OUTPUT for num in $(seq $MDSCOUNT); do - printf "%s-MDT%04d\n" $FSNAME $num >> $EXPECTED_OUTPUT + printf "%s-MDT%04x\n" $FSNAME $((num - 1)) >> $EXPECTED_OUTPUT done for num in $(seq $OSTCOUNT); do - printf "%s-OST%04d\n" $FSNAME $num >> $EXPECTED_OUTPUT + printf "%s-OST%04x\n" $FSNAME $((num - 1)) >> $EXPECTED_OUTPUT done compare_ldev_output $LDEV_OUTPUT $EXPECTED_OUTPUT @@ -7261,19 +7261,13 @@ test_96() { echo "$mgs_HOST-$(facet_fstype mgs)" > $EXPECTED_OUTPUT - if [ "$mgs_HOST" == "$mds_HOST" ]; then - for num in $(seq $MDSCOUNT); do - echo "$mds_HOST-$(facet_fstype mds$num)" \ - >> $EXPECTED_OUTPUT - done - fi - - if [ "$mgs_HOST" == "$ost_HOST" ]; then - for num in $(seq $OSTCOUNT); do - echo "$ost_HOST-$(facet_fstype ost$num)" \ + local facets="$(get_facets OST),$(get_facets MDS)" + for facet in ${facets//,/ }; do + local host=$(facet_host $facet) + [ "$mgs_HOST" == "$host" ] && + echo "$host-$(facet_fstype $facet)" \ >> $EXPECTED_OUTPUT - done - fi + done compare_ldev_output $LDEV_OUTPUT $EXPECTED_OUTPUT @@ -7309,7 +7303,7 @@ test_97() { fi for num in $(seq $MDSCOUNT); do - printf "%s-MDT%04d\n" $FSNAME $num >> $EXPECTED_OUTPUT + printf "%s-MDT%04x\n" $FSNAME $((num - 1)) >> $EXPECTED_OUTPUT done compare_ldev_output $LDEV_OUTPUT $EXPECTED_OUTPUT @@ -7329,7 +7323,7 @@ test_97() { rm $EXPECTED_OUTPUT for num in $(seq $OSTCOUNT); do - printf "%s-OST%04d\n" $FSNAME $num >> $EXPECTED_OUTPUT + printf "%s-OST%04x\n" $FSNAME $((num - 1)) >> $EXPECTED_OUTPUT done compare_ldev_output $LDEV_OUTPUT $EXPECTED_OUTPUT @@ -7437,7 +7431,7 @@ test_100() { } run_test 100 "check lshowmount lists MGS, MDT, OST and 0@lo" -test_101() { +test_101a() { local createmany_pid local dev=$FSNAME-OST0000-osc-MDT0000 setup @@ -7464,7 +7458,29 @@ test_101() { unlinkmany $DIR1/$tdir/$tfile-%d 50000 cleanup } -run_test 101 "Race MDT->OST reconnection with create" +run_test 101a "Race MDT->OST reconnection with create" + +test_101b () { + local dev=$FSNAME-OST0000-osc-MDT0000 + local dir=$DIR1/$tdir + setup + + mkdir $dir + $LFS setstripe -c 1 -i 0 $dir + do_facet $SINGLEMDS "$LCTL --device $dev deactivate;" +#define OBD_FAIL_OSP_CON_EVENT_DELAY 0x2107 + do_facet mds1 "$LCTL set_param fail_loc=0x80002107 fail_val=20" + do_facet $SINGLEMDS "$LCTL --device $dev activate;" + stop_ost + sleep 25 + start_ost + + wait_osc_import_state client ost1 FULL + touch $dir/$tfile || error "Can't create file" + + cleanup +} +run_test 101b "Race events DISCONNECT and ACTIVE in osp" test_102() { [[ "$MDS1_VERSION" -gt $(version_code 2.9.53) ]] || @@ -8003,7 +8019,6 @@ test_108b() { } run_test 108b "migrate from ZFS to ldiskfs" - # # set number of permanent parameters # @@ -8428,6 +8443,8 @@ test_112() { (( $val == 1 )) || error "obdfilter.$FSNAME-OST0001*.no_precreate=$val" mount_client $MOUNT || error "mount client failed" + wait_osc_import_state mds1 ost1 FULL + wait_osc_import_state client ost1 FULL wait_osc_import_state client ost2 FULL $LFS setstripe -i 0 $DIR/$tfile.0 || @@ -8439,6 +8456,8 @@ test_112() { sleep_maxage $LFS setstripe -i 1 $DIR/$tfile.2 || error "failed to create $tfile.2 on ost1 facet" + # files not cleaned with ONLY_REPEAT because of client unmount below + rm -f $DIR/$tfile.[012] stop_ost2 || error "stop ost2 facet failed" cleanup } @@ -8463,20 +8482,21 @@ test_115() { echo "$dbfs_ver" | egrep -w "1.44.3.wc1|1.44.5.wc1|1.45.2.wc1" && skip_env "This version of debugfs doesn't show inode number" - is_dm_flakey_dev $SINGLEMDS $(mdsdevname 1) && - skip "This test can not be executed on flakey dev" - IMAGESIZE=$((3072 << 30)) # 3072 GiB stopall + local saved_flakey=${FLAKEY} + stack_trap "FLAKEY=$saved_flakey" EXIT + FLAKEY=false + echo "client1: " lctl dl mount | grep lustre echo "mds1: " - do_facet mds1 "hostname; ifconfig; lctl dl; mount" + do_facet mds1 "hostname; lctl dl; mount" echo "ost1: " - do_facet ost1 "hostname; ifconfig; lctl dl; mount" + do_facet ost1 "hostname; lctl dl; mount" # We need MDT size 3072GB, because it is smallest # partition that can store 2B inodes do_facet $SINGLEMDS "mkdir -p $TMP/$tdir" @@ -8503,21 +8523,23 @@ test_115() { mkdir -p $DIR/$tdir || error "mkdir $DIR/$tdir fail" goal="/sys/fs/ldiskfs/$(basename $mdsdev)/inode_goal" -echo goal: $goal + echo goal: $goal # 2147483648 is 0x80000000 do_facet $SINGLEMDS "echo 2147483648 >> $goal; grep . $goal" touch $DIR/$tdir/$tfile - # attrs from 1 to 15 go to block, 16th - to inode - for i in {1..16}; do + # attrs from 1 to 16 go to block, 17th - to inode + for i in {1..17}; do local nm="trusted.ea$i" setfattr -n $nm -v $(printf "xattr%0250d" $i) $DIR/$tdir/$tfile done + do_facet $SINGLEMDS $DEBUGFS -c -R "stat ROOT/$tdir/$tfile" $mdsdev + # inode <2147483649> trusted.ea16 (255) local inode_num=$(do_facet $SINGLEMDS \ "$DEBUGFS -c -R 'stat ROOT/$tdir/$tfile' $mdsdev" | - awk '/ea16/ { print $2 }' | + awk '/ea17/ { print $2 }' | sed -e 's/>//' -e 's//dev/null + # mount after writeconf will make "add osp" added to mdt0 config: + # 53 (224)marker 60 (flags=0x01, v2.5.1.0) lustre-MDT0001 'add osp' + # 54 (080)add_uuid nid=... 0: 1:... + # 55 (144)attach 0:lustre-MDT0001-osp-MDT0000 1:osp 2:... + # 56 (144)setup 0:lustre-MDT0001-osp-MDT0000 1:... 2:... + # 57 (136)modify_mdc_tgts add 0:lustre-MDT0000-mdtlov 1:... 2:1 3:1 + # duplicate modify_mdc_tgts caused crashes + + debug_size_save + # using larger debug_mb size to avoid lctl dk log truncation + size_mb=$((DEBUG_SIZE_SAVED * 4)) + for i in {1..3}; do + stop_mdt 2 + # though config processing stops after failed attach and setup + # it will proceed after the failed command after each writeconf + # this is the original scenario of the issue + do_facet mds2 "$TUNEFS --writeconf $(mdsdevname 2)" &>/dev/null + do_facet mds1 "$LCTL set_param debug_mb=$size_mb" + start_mdt 2 + + wait_update_facet_cond mds1 \ + "$LCTL dk | grep -c Processed.log.$FSNAME-MDT0000" \ + ">" 1 300 + done + debug_size_restore + + [[ -z "$had_config" ]] && do_facet mds1 lctl set_param debug=-config + + reformat +} +run_test 119 "writeconf on slave mdt shouldn't duplicate mdc/osp and crash" + test_120() { # LU-11130 [ "$MDSCOUNT" -lt 2 ] && skip "mdt count < 2" [ "$mds1_FSTYPE" != ldiskfs ] && @@ -8602,7 +8671,19 @@ test_120() { # LU-11130 } run_test 120 "cross-target rename should not create bad symlinks" -test_122() { +test_121(){ + stopall + start_mgsmds || error "MGS MDS Start failed" + fail mgs + stop_mds || error "Stopping MDSes failed" + #failback + start_mds + fail mgs + stop_mds || error "Stopping MDSes failed" +} +run_test 121 "failover MGS" + +test_122a() { [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" [[ "$OST1_VERSION" -ge $(version_code 2.11.53) ]] || skip "Need OST version at least 2.11.53" @@ -8621,7 +8702,70 @@ test_122() { cleanup } -run_test 122 "Check OST sequence update" +run_test 122a "Check OST sequence update" + +test_122b() { + [[ "$OST1_VERSION" -ge $(version_code 2.11.53) ]] || + skip "Need OST version at least 2.11.53" + local err + + reformat + LOAD_MODULES_REMOTE=true load_modules +#define OBD_FAIL_OFD_SET_OID 0x1e0 + do_facet ost1 $LCTL set_param fail_loc=0x00001e0 + + stack_trap cleanup EXIT + setup_noconfig + do_facet ost1 $LCTL set_param obdfilter.*.precreate_batch=256 + $LFS mkdir -i0 -c1 $DIR/$tdir || error "failed to create directory" + $LFS setstripe -i0 -c1 $DIR/$tdir || error "failed to setstripe" + do_facet ost1 $LCTL set_param fail_loc=0 + # overflow IDIF 32bit and create > OST_MAX_PRECREATE*5 + # so a new wrong sequence would differ from an original with error + #define OST_MAX_PRECREATE 20000 + local ost_max_precreate=20100 + local num_create=$(( ost_max_precreate * 5 )) + + # Check the number of inodes available on OST0 + local files=0 + local ifree=$($LFS df -i $MOUNT | + awk '/OST0000/ { print $4 }'; exit ${PIPESTATUS[0]}) + + log "On OST0, $ifree inodes available. Want $num_create. rc=$?" + + if [ $ifree -lt 10000 ]; then + files=$(( ifree - 50 )) + else + files=10000 + fi + + local j=$((num_create / files + 1)) + + for i in $(seq 1 $j); do + createmany -o $DIR/$tdir/$tfile-$i- $files || + error "createmany fail create $files files: $?" + unlinkmany $DIR/$tdir/$tfile-$i- $files || + error "unlinkmany failed unlink $files files" + done + sync + touch $DIR/$tdir/$tfile + do_facet ost1 sync + #we need a write req during recovery for ofd_seq_load + replay_barrier ost1 + dd if=/dev/urandom of=$DIR/$tdir/$tfile bs=1024k count=1 oflag=sync || + error "failed to write file" + + # OBD_FAIL_OST_CREATE_NET 0x204 + do_facet ost1 $LCTL set_param fail_loc=0x80000204 + fail ost1 + createmany -o $DIR/$tdir/file_ 100 + sync + + err=$(do_facet ost1 dmesg | tac | sed "/Recovery over/,$ d" | + grep "OST replaced or reformatted") + [ -z "$err" ] || error $err +} +run_test 122b "Check OST sequence wouldn't change when IDIF 32bit overflows" test_123aa() { remote_mgs_nodsh && skip "remote MGS with nodsh" @@ -8652,11 +8796,15 @@ test_123ab() { local yaml local orig_val + local mgs_arg="" + + [[ $MGS_VERSION -gt $(version_code 2.13.54) ]] || + mgs_arg="--device MGS" orig_val=$(do_facet mgs $LCTL get_param jobid_name) do_facet mgs $LCTL set_param -P jobid_name="TESTNAME" - yaml=$(do_facet mgs $LCTL --device MGS llog_print params | + yaml=$(do_facet mgs $LCTL $mgs_arg llog_print params | grep jobid_name | tail -n 1) local param=$(awk '{ print $10 }' <<< "$yaml") @@ -8675,12 +8823,16 @@ test_123ac() { # LU-11566 local start=10 local end=50 + local mgs_arg="" + + [[ $MGS_VERSION -gt $(version_code 2.13.54) ]] || + mgs_arg="--device MGS" [ -d $MOUNT/.lustre ] || setup # - { index: 10, event: add_uuid, nid: 192.168.20.1@tcp(0x20000c0a81401, # node: 192.168.20.1@tcp } - do_facet mgs $LCTL --device MGS \ + do_facet mgs $LCTL $mgs_arg \ llog_print --start $start --end $end $FSNAME-client | tr -d , | while read DASH BRACE INDEX idx EVENT BLAH BLAH BLAH; do (( idx >= start )) || error "llog_print index $idx < $start" @@ -8716,30 +8868,43 @@ test_123ad() { # LU-11566 run_test 123ad "llog_print shows all records" test_123ae() { # LU-11566 + local max + local mgs_arg="" + local log + local id + local orig + local new + local rpcs + remote_mgs_nodsh && skip "remote MGS with nodsh" [ -d $MOUNT/.lustre ] || setupall - local max=$($LCTL get_param -n osc.*-OST0000-*.max_dirty_mb | head -1) + max=$($LCTL get_param -n osc.*-OST0000-*.max_dirty_mb | head -1) + pgs=$($LCTL get_param -n osc.*-OST0000-*.max_pages_per_rpc | head -1) + [[ $MGS_VERSION -gt $(version_code 2.13.54) ]] || + mgs_arg="--device MGS" if do_facet mgs "$LCTL help llog_cancel" 2>&1| grep -q -- --log_id; then # save one set_param -P record in case none exist - do_facet mgs $LCTL set_param -P osc.*.max_dirty_mb=$max - local log=params - local orig=$(do_facet mgs $LCTL --device MGS llog_print $log | - tail -1 | awk '{ print $4 }' | tr -d , ) + do_facet mgs $LCTL set_param -P osc.*.max_pages_per_rpc=$pgs + stack_trap "do_facet mgs $LCTL set_param -P -d \ + osc.*.max_pages_per_rpc" + + log=params + orig=$(do_facet mgs $LCTL $mgs_arg llog_print $log | + tail -1 | awk '{ print $4 }' | tr -d , ) do_facet mgs $LCTL set_param -P osc.*.max_dirty_mb=$max - do_facet mgs $LCTL --device MGS llog_print $log | tail -1 | + do_facet mgs $LCTL $mgs_arg llog_print $log | tail -1 | grep "parameter: osc.*.max_dirty_mb" || error "new set_param -P wasn't stored in params log" # - { index: 71, event: set_param, device: general, # param: osc.*.max_dirty_mb, value: 256 } - local id=$(do_facet mgs $LCTL --device MGS llog_print $log | - tail -1 | awk '{ print $4 }' | tr -d , ) - - do_facet mgs $LCTL --device MGS llog_cancel $log --log_idx=$id - local new=$(do_facet mgs $LCTL --device MGS llog_print $log | + id=$(do_facet mgs $LCTL $mgs_arg llog_print $log | + tail -1 | awk '{ print $4 }' | tr -d , ) + do_facet mgs $LCTL $mgs_arg llog_cancel $log --log_idx=$id + local new=$(do_facet mgs $LCTL $mgs_arg llog_print $log | tail -1 | awk '{ print $4 }' | tr -d , ) (( new == orig )) || error "new llog_cancel now $new, not at $orig records" @@ -8748,18 +8913,25 @@ test_123ae() { # LU-11566 # test old positional parameters for a while still if [ "$MGS_VERSION" -le $(version_code 3.1.53) ]; then log=$FSNAME-client + + do_facet mgs $LCTL conf_param \ + $FSNAME-OST0000.osc.max_pages_per_rpc=$pgs + stack_trap "do_facet mgs $LCTL conf_param -d \ + $FSNAME-OST0000.osc.max_pages_per_rpc" + orig=$(do_facet mgs $LCTL --device MGS llog_print $log | tail -1 | awk '{ print $4 }' | tr -d , ) do_facet mgs $LCTL conf_param $FSNAME-OST0000.osc.max_dirty_mb=$max do_facet mgs $LCTL --device MGS llog_print $log | tail -1 | grep "parameter: osc.max_dirty_mb" || error "old conf_param wasn't stored in params log" - + do_facet mgs $LCTL --device MGS llog_print $log # - { index: 71, event: conf_param, device: testfs-OST0000-osc, # param: osc.max_dirty_mb=256 } id=$(do_facet mgs $LCTL --device MGS llog_print $log | tail -1 | awk '{ print $4 }' | tr -d , ) do_facet mgs $LCTL --device MGS llog_cancel $log $id + do_facet mgs $LCTL --device MGS llog_print $log new=$(do_facet mgs $LCTL --device MGS llog_print $log | tail -1 | awk '{ print $4 }' | tr -d , ) (( new == orig )) || @@ -8817,6 +8989,36 @@ test_123af() { #LU-13609 } run_test 123af "llog_catlist can show all config files correctly" +test_123ag() { # LU-15142 + local rec + local orig_val + + remote_mgs_nodsh && skip "remote MGS with nodsh" + (( $MGS_VERSION >= $(version_code 2.14.55) )) || + skip "Need server version least 2.14.55" + + [ -d $MOUNT/.lustre ] || setup + + orig_val=$(do_facet mgs $LCTL get_param jobid_name) + stack_trap "do_facet mgs $LCTL set_param -P jobid_name=$orig_val" + + do_facet mgs $LCTL set_param -P jobid_name="TESTNAME1" + do_facet mgs $LCTL set_param -P -d jobid_name + rec=$(do_facet mgs $LCTL --device MGS llog_print params | + grep -c jobid_name) + (( rec == 0 )) || error "parameter was not deleted, check #1" + do_facet mgs $LCTL set_param -P jobid_name="TESTNAME1" + rec=$(do_facet mgs $LCTL --device MGS llog_print params | + grep -c jobid_name) + (( rec == 1)) || error "parameter is not set" + # usage with ordinary set_param format works too + do_facet mgs $LCTL set_param -P -d jobid_name="ANY" + rec=$(do_facet mgs $LCTL --device MGS llog_print params | + grep -c jobid_name) + (( rec == 0 )) || error "parameter was not deleted, check #2" +} +run_test 123ag "llog_print skips values deleted by set_param -P -d" + test_123F() { remote_mgs_nodsh && skip "remote MGS with nodsh" @@ -8839,10 +9041,7 @@ test_123F() { echo "Writeconf" writeconf_all echo "Remounting" - mountmgs - mountmds - mountoss - mountcli + setup_noconfig # Reapply the config from before echo "Setting configuration parameters" @@ -8865,6 +9064,12 @@ test_124() [ -z $mds2failover_HOST ] && skip "needs MDT failover setup" setup + do_facet mgs $LCTL --device MGS llog_print $FSNAME-client | + grep 1.2.3.4@tcp && error "Should not be fake nid" + do_facet mgs $LCTL conf_param $FSNAME-MDT0001.failover.node=1.2.3.4@tcp\ + || error "Set params error" + do_facet mgs $LCTL --device MGS llog_print $FSNAME-client | + grep 1.2.3.4@tcp || error "Fake nid should be added" cleanup load_modules @@ -9003,7 +9208,7 @@ test_125() echo "Before: ${facet} ${device} ${pre_max_sectors} ${max_hw_sectors}" - do_facet ${facet} "libtool execute l_tunedisk ${device}" + do_facet ${facet} "l_tunedisk ${device}" # Value after l_tunedisk local post_max_sectors=$(get_max_sectors_kb ${facet} ${device}) @@ -9079,6 +9284,119 @@ test_127() { } run_test 127 "direct io overwrite on full ost" +test_128() +{ + combined_mgs_mds && skip "need separate mgs device" + [ "$ost2_FSTYPE" == zfs ] && import_zpool ost2 + + format_ost 2 + # Try to apply nolocallogs to the virgin OST. Should fail. + do_facet ost2 "$TUNEFS --nolocallogs $(ostdevname 2)" && + error "nolocallogs should not be allowed on the virgin target" + + setupall + stopall + + [ "$ost1_FSTYPE" == zfs ] && import_zpool ost1 + # Start OST without MGS (local configs) + do_facet ost1 "$TUNEFS --dryrun $(ostdevname 1)" + start_ost || error "unable to start OST1" + stop_ost || error "Unable to stop OST1" + + [ "$ost1_FSTYPE" == zfs ] && import_zpool ost1 + # Do not allow reading local configs, should fail + do_facet ost1 "$TUNEFS --nolocallogs $(ostdevname 1)" || + error "Can not set nolocallogs" + start_ost && error "OST1 started, but should fail" + + # Connect to MGS successfully, reset nolocallogs flag + [ "$ost1_FSTYPE" == zfs ] && import_zpool ost1 + start_mgs || error "unable to start MGS" + start_ost || error "unable to start OST1" + + do_facet ost1 "$TUNEFS --dryrun $(ostdevname 1)" | grep "nolocallogs" && + error "nolocallogs expected to be reset" + + stop_ost || error "Unable to stop OST1" +} +run_test 128 "Force using remote logs with --nolocallogs" + +test_129() +{ + stopall + start_mds || error "MDS start failed" + format_ost 1 + start ost1 $(ostdevname 1) $OST_MOUNT_OPTS && + error "start ost1 should fail" || true + start ost1 $(ostdevname 1) $OST_MOUNT_OPTS && + error "second start ost1 should fail" || true + do_facet ost1 "$TUNEFS --writeconf $(ostdevname 1)" + start ost1 $(ostdevname 1) $OST_MOUNT_OPTS || + error "start ost1 failed" + stop ost1 + stop_mds +} +run_test 129 "attempt to connect an OST with the same index should fail" + +test_130() +{ + [ $MDSCOUNT -lt 2 ] && skip "needs >= 2 MDTs" + setupall + stop_mdt 2 || error "mdt2 stop failed" + do_facet mds2 "$TUNEFS --writeconf $(mdsdevname 2)" + start_mdt 2 || error "mdt2 start failed" + do_facet mds2 "$LCTL dl" | grep MDT0001-osp-MDT0001 && + error "Illegal OSP device created" || true +} +run_test 130 "re-register an MDT after writeconf" + +test_131() { + [ "$mds1_FSTYPE" == "ldiskfs" ] || skip "ldiskfs only test" + do_facet mds1 $DEBUGFS -R features $(mdsdevname 1) | + grep -q project || skip "skip project quota not supported" + + local projid + + setupall + test_mkdir -c $MDSCOUNT -p $DIR/$tdir + $LFS project -p 1000 $DIR/$tdir || error "set dir project id failed" + createmany -o $DIR/$tdir/f 512 + for ((i = 0; i < 512; ++i)); do + $LFS project -p $i $DIR/$tdir/f${i} || + error "set f${i} project id failed" + done + + test_mkdir -c $MDSCOUNT -p $DIR/$tdir.inherit + $LFS project -p 1001 -s $DIR/$tdir.inherit + createmany -o $DIR/$tdir.inherit/f 128 + (( $($LFS project $DIR/$tdir.inherit/f* | + awk '$1 == 1001 { print }' | wc -l) == 128 )) || + error "files did not inherit projid 1001" + + stopall + + for i in $(seq $MDSCOUNT); do + mds_backup_restore mds$i || + error "Backup/restore on mds$i failed" + done + + setupall + + projid=($($LFS project -d $DIR/$tdir)) + [ ${projid[0]} == "1000" ] || + error "projid expected 1000 not ${projid[0]}" + for ((i = 0; i < 512; ++i)); do + projid=($($LFS project $DIR/$tdir/f${i})) + [ ${projid[0]} == "$i" ] || + error "projid expected $i not ${projid[0]}" + done + + (( $($LFS project $DIR/$tdir.inherit/f* | + awk '$1 == 1001 { print }' | wc -l) == 128 )) || + error "restore did not copy projid 1001" +} +run_test 131 "MDT backup restore with project ID" + if ! combined_mgs_mds ; then stop mgs fi