From 1c2cd16eeb4d8647eb48d634c16c446a32e094df Mon Sep 17 00:00:00 2001 From: eeb Date: Sat, 2 Oct 2004 14:13:30 +0000 Subject: [PATCH] * Debugged sgpdd-survey multi-device support on Bull server --- lustre-iokit/sgpdd-survey/sgpdd-survey | 130 +++++++++++++++++++-------------- 1 file changed, 77 insertions(+), 53 deletions(-) diff --git a/lustre-iokit/sgpdd-survey/sgpdd-survey b/lustre-iokit/sgpdd-survey/sgpdd-survey index e42c84c..8f7cd1f 100755 --- a/lustre-iokit/sgpdd-survey/sgpdd-survey +++ b/lustre-iokit/sgpdd-survey/sgpdd-survey @@ -3,17 +3,17 @@ ###################################################################### # customize per survey -# the SG device to measure -dev=/dev/sg6 +# the SCSI devices to measure +scsidevs="/dev/sde /dev/sdh" # result file prefix # NB ensure the path exists if it includes subdirs rslt=/tmp/sg_dd_rslt # what to do (read or write) -action=write +actions="write read" -# total size (MBytes) +# total size per device (MBytes) # NB bigger than device cache is good size=8192 @@ -21,35 +21,41 @@ size=8192 rszlo=1024 rszhi=1024 -# Concurrent regions +# Concurrent regions per device crglo=1 -crghi=4 +crghi=128 -# total numbers of threads to share between concurrent regions +# threads to share between concurrent regions per device # NB survey skips over #thr < #regions thrlo=1 -thrhi=1024 +thrhi=128 ##################################################################### # disk block size (Bytes) bs=512 -if [ $action = read ]; then - f1="if=$dev" - f2="of=/dev/null" - skip=skip -else - f1="if=/dev/zero" - f2="of=$dev" - skip=seek -fi +# max # threads per individual sgp_dd instance +SG_MAX_QUEUE=16 + +i=0 +devs=() +for d in $scsidevs; do + devs[$i]=`sg_map | awk "{if ($ 2 == \"$d\") print $ 1}"` + if [ -z "$devs[$i]" ]; then + echo "Can't find SG device for $d" + exit 1 + fi + i=$((i+1)) +done +ndevs=${#devs[@]} start=`date +%F@%R` rsltf=${rslt}_${start}.summary echo -n > $rsltf workf=${rslt}_${start}.detail echo -n > $workf +tmpf=${rslt}_${start}.tmp print_summary () { if [ "$1" = "-n" ]; then @@ -64,7 +70,7 @@ print_summary () { for ((rsz=$rszlo;rsz<=$rszhi;rsz*=2)); do for ((crg=$crglo;crg<=$crghi;crg*=2)); do for ((thr=$thrlo;thr<=$thrhi;thr*=2)); do - if ((thr < crg)); then + if ((thr < crg || thr/crg > SG_MAX_QUEUE)); then continue fi # compute parameters @@ -75,48 +81,66 @@ for ((rsz=$rszlo;rsz<=$rszhi;rsz*=2)); do actual_rsz=$((bpt*bs/1024)) actual_size=$((bs*count*crg/1024)) str=`printf 'total_size %8dK rsz %4d crg %5d thr %3d ' \ - $actual_size $actual_rsz $crg $thr` + $((actual_size*ndevs)) $actual_rsz $((crg*ndevs)) $((thr*ndevs))` echo "==============> $str" >> $workf print_summary -n "$str" freemem=`awk < /proc/meminfo '/^MemTotal:/ {printf "%d\n", $2}'` - if (((actual_rsz * thr /crg + 64) * crg > freemem)); then + if (((actual_rsz*thr/crg + 64)*crg*ndevs > freemem)); then print_summary "ENOMEM" continue fi - # start test - t0=`date +%s.%N` - for ((i=0;i ${rslt}_tmp${i} \ - $f1 $f2 ${skip}=$((1024+i*blocks)) \ - thr=$((thr/crg)) count=$count bs=$bs bpt=$bpt time=1& - done - wait - t1=`date +%s.%N` - # collect all results in 1 file - rfile=${rslt}_thr${thr}_crg${crg}_rsz${rsz} - echo > $rfile - ok=0 - for ((i=0;i /dev/null 2>&1; then - ok=$((ok + 1)) + for action in $actions; do + print_summary -n "$action " + echo "=====> $action" >> $workf + # start test + t0=`date +%s.%N` + for ((i=0;i ${tmpf}_${i}_${j} \ + $inf $outf ${skip}=$((1024+j*blocks)) \ + thr=$((thr/crg)) count=$count bs=$bs bpt=$bpt time=1& + done + done + wait + t1=`date +%s.%N` + # collect all results in 1 file + echo > $tmpf + ok=0 + for ((i=0;i /dev/null 2>&1; then + ok=$((ok + 1)) + fi + cat ${rtmp} >> $tmpf + cat ${rtmp} >> $workf + rm ${rtmp} + done + done + if ((ok != ndevs*crg)); then + print_summary -n "$((ndevs*crg - ok)) failed " + else + # compute MB/sec from elapsed + bw=`awk "BEGIN {printf \"%7.2f MB/s\", $actual_size / (( $t1 - $t0 ) * 1024); exit}"` + # compute MB/sec from nregions*slowest + check=`awk < $tmpf \ + '/time to transfer data/ {mb=$8/1.048576; if (n == 0 || mb < min) min = mb; n++}\ + END {printf "%3d x %6.2f = %7.2f MB/s", n, min, min * n}'` + print_summary -n "$bw $check " fi - cat ${rslt}_tmp${i} >> $rfile - cat ${rslt}_tmp${i} >> $workf - rm ${rslt}_tmp${i} + rm $tmpf done - if [ $ok -ne $crg ]; then - print_summary `printf "failed %d" $((crg - ok))` - else - # compute MB/sec from elapsed - bw=`awk "BEGIN {printf \"%6.2f MB/s\", $actual_size / (( $t1 - $t0 ) * 1024); exit}"` - # compute MB/sec from nregions*slowest - check=`awk < $rfile \ - '/time to transfer data/ {mb=$8/1.048576; if (n == 0 || mb < min) min = mb; n++}\ - END {printf "%3d x %6.2f = %6.2f MB/s", n, min, min * n}'` - print_summary "$bw $check" - fi - rm $rfile + print_summary "" done done -done +done \ No newline at end of file -- 1.8.3.1