# Locate the Lustre tree: unless LUSTRE is already set, use the parent of the
# directory containing this script.
5 LUSTRE=${LUSTRE:-$(cd $(dirname $0)/..; echo $PWD)}
# Load the shared test framework from the Lustre tree.
6 . $LUSTRE/tests/test-framework.sh
# Source the configuration file; when CONFIG is unset or empty it is assigned
# $LUSTRE/tests/cfg/$NAME.sh first (":=" both defaults and assigns).
8 . ${CONFIG:=$LUSTRE/tests/cfg/$NAME.sh}
# Exclusion list: two fixed test names plus whatever PARALLEL_SCALE_EXCEPT
# adds (presumably consumed by the test framework - confirm).
12 ALWAYS_EXCEPT="parallel_grouplock statahead $PARALLEL_SCALE_EXCEPT"
# Per-benchmark tunables. Each "${var:-default}" keeps a caller-supplied value
# and otherwise falls back to the default shown. The '[ "$SLOW" = "no" ] && ...'
# lines then overwrite the value unconditionally when SLOW=no, even if the
# caller supplied one.

# compilebench
17 cbench_DIR=${cbench_DIR:-""}
18 cbench_IDIRS=${cbench_IDIRS:-4}
19 cbench_RUNS=${cbench_RUNS:-4} # FIXME: the wiki page requires 30 runs; do we really need 30?
# SLOW=no branch for compilebench (its body is not visible in this excerpt).
21 if [ "$SLOW" = "no" ]; then
# metabench: binary path is looked up with which(1); empty when not installed.
29 METABENCH=${METABENCH:-$(which metabench 2> /dev/null || true)}
30 mbench_NFILES=${mbench_NFILES:-30400}
31 [ "$SLOW" = "no" ] && mbench_NFILES=10000
# Machine file handed to mpi_run by the MPI-based tests; named after this script.
32 MACHINEFILE=${MACHINEFILE:-$TMP/$(basename $0 .sh).machines}
34 mbench_THREADS=${mbench_THREADS:-4}
# simul (note: uses the assigning ":=" form; the effect is the same here
# because the result is assigned to SIMUL anyway).
39 SIMUL=${SIMUL:=$(which simul 2> /dev/null || true)}
41 simul_THREADS=${simul_THREADS:-2}
42 simul_REP=${simul_REP:-20}
43 [ "$SLOW" = "no" ] && simul_REP=2
# connectathon
48 cnt_DIR=${cnt_DIR:-""}
49 cnt_NRUN=${cnt_NRUN:-10}
50 [ "$SLOW" = "no" ] && cnt_NRUN=2
# cascading_rw
55 CASC_RW=${CASC_RW:-$(which cascading_rw 2> /dev/null || true)}
57 casc_THREADS=${casc_THREADS:-2}
58 casc_REP=${casc_REP:-300}
59 [ "$SLOW" = "no" ] && casc_REP=10
# IOR
64 IOR=${IOR:-$(which IOR 2> /dev/null || true)}
66 ior_THREADS=${ior_THREADS:-2}
67 ior_blockSize=${ior_blockSize:-6} # block size per task in GB (passed to IOR as "-b <N>g")
68 ior_DURATION=${ior_DURATION:-30} # maximum run time in minutes (passed to IOR as "-T")
69 [ "$SLOW" = "no" ] && ior_DURATION=5
72 # write_append_truncate
75 write_THREADS=${write_THREADS:-8}
76 write_REP=${write_REP:-10000}
77 [ "$SLOW" = "no" ] && write_REP=100
# write_disjoint
82 WRITE_DISJOINT=${WRITE_DISJOINT:-$(which write_disjoint 2> /dev/null || true)}
84 wdisjoint_THREADS=${wdisjoint_THREADS:-4}
85 wdisjoint_REP=${wdisjoint_REP:-10000}
86 [ "$SLOW" = "no" ] && wdisjoint_REP=100
# parallel_grouplock: MINTASKS is the MPI task count used for every subtest.
92 PARALLEL_GROUPLOCK=${PARALLEL_GROUPLOCK:-$(which parallel_grouplock 2> /dev/null || true)}
93 parallel_grouplock_MINTASKS=${parallel_grouplock_MINTASKS:-5}
# Bring the filesystem under test up before any test runs.
96 check_and_setup_lustre
# MPI_USER_UID / MPI_USER_GID are not assigned anywhere in the visible lines;
# presumably get_mpiuser_id sets them from $MPI_USER - confirm.
98 get_mpiuser_id $MPI_USER
# Command prefix used to run programs as the MPI user, unless overridden.
99 MPI_RUNAS=${MPI_RUNAS:-"runas -u $MPI_USER_UID -g $MPI_USER_GID"}
# $GSS_KRB5 is executed as a command here, so it must expand to something
# like "true" or "false"; the ticket refresh runs only when it succeeds.
100 $GSS_KRB5 && refresh_krb5_tgt $MPI_USER_UID $MPI_USER_GID $MPI_RUNAS
# The next two lines are the interior of a helper whose header is not visible
# in this excerpt (presumably print_opts, which the tests call with variable
# names). "${!var}" is indirect expansion: it prints the value of the variable
# whose name is stored in $var.
109 echo "${var}=${!var}"
# Dump the machine file when it exists.
111 [ -e $MACHINEFILE ] && cat $MACHINEFILE
115 # 5 min * cbench_RUNS
119 # compile dir kernel-1 680MB
120 # required space: 680MB * cbench_IDIRS (about 2.7 GB with the default of 4 dirs)
# test_compilebench: run compilebench against a directory under $DIR.
# Skips (skip_env) when cbench_DIR is empty, when $cbench_DIR/compilebench does
# not exist, or when free space cannot hold even one initial directory.
# Fails through error() when $rc is non-zero ($rc is set on a line not shown).
122 test_compilebench() {
123 print_opts cbench_DIR cbench_IDIRS cbench_RUNS
125 [ x$cbench_DIR = x ] &&
126 { skip_env "compilebench not found" && return; }
128 [ -e $cbench_DIR/compilebench ] || \
129 { skip_env "No compilebench build" && return; }
# Fourth column of the last "df -P" line for $DIR (available space); the
# comparison below treats it as KB (680 * 1024 per initial directory).
131 local space=$(df -P $DIR | tail -n 1 | awk '{ print $4 }')
# Not enough room for the requested number of initial dirs: shrink
# cbench_IDIRS to what fits, and skip when not even one fits.
# Note that this overwrites the global cbench_IDIRS.
132 if [ $space -le $((680 * 1024 * cbench_IDIRS)) ]; then
133 cbench_IDIRS=$(( space / 680 / 1024))
134 [ $cbench_IDIRS = 0 ] && \
135 skip_env "Need free space atleast 680 Mb, have $space" && return
137 log free space=$space, reducing initial dirs to $cbench_IDIRS
140 # t-f _base needs to be modified to set tdir properly
141 # for new "test_foo" function names
142 # local testdir=$DIR/$tdir
143 local testdir=$DIR/d0.compilebench
# The command is relative ("./compilebench"), so it is presumably run from
# $cbench_DIR on a line not shown here - confirm.
148 local cmd="./compilebench -D $testdir -i $cbench_IDIRS -r $cbench_RUNS --makej"
157 [ $rc = 0 ] || error "compilebench failed: $rc"
# Register the test with the framework.
160 run_test compilebench "compilebench"
# test_metabench (body excerpt): run metabench under MPI across the clients.
# Skips (skip_env) when $METABENCH is empty. Uses $CLIENTS, or this host when
# $CLIENTS is empty. Fails through error() when the machine file cannot be
# generated or when $rc is non-zero ($rc is set on a line not shown here).
163 [ x$METABENCH = x ] &&
164 { skip_env "metabench not found" && return; }
166 local clients=$CLIENTS
167 [ -z $clients ] && clients=$(hostname)
# Declared local, as in the other MPI tests, so the node count does not leak
# into the global scope. The comma-separated client list is turned into
# separate words for get_node_count.
169 local num_clients=$(get_node_count ${clients//,/ })
172 # Need space estimation here.
174 generate_machine_file $clients $MACHINEFILE || \
175 error "can not generate machinefile $MACHINEFILE"
177 print_opts METABENCH clients mbench_NFILES mbench_THREADS
179 local testdir=$DIR/d0.metabench
181 # mpi_run uses mpiuser
184 # -C Run the file creation tests.
185 # -S Run the file stat tests.
186 # -c nfile Number of files to be used in each test.
187 # -k Cleanup. Remove the test directories.
188 local cmd="$METABENCH -w $testdir -c $mbench_NFILES -C -S -k"
# Total MPI task count = number of client nodes * threads per client.
190 mpi_run -np $((num_clients * $mbench_THREADS)) -machinefile ${MACHINEFILE} $cmd
192 if [ $rc != 0 ] ; then
193 error "metabench failed! $rc"
# Register the test with the framework.
197 run_test metabench "metabench"
# test_simul (body excerpt): run simul under MPI across the clients.
# Skipped in NFSCLIENT mode and (skip_env) when simul is not found. Fails
# through error() when the machine file cannot be generated or when $rc is
# non-zero ($rc is set on a line not shown here).
200 if [ "$NFSCLIENT" ]; then
201 skip "skipped for NFSCLIENT mode"
206 { skip_env "simul not found" && return; }
# Fall back to the local host when no client list is configured.
208 local clients=$CLIENTS
209 [ -z $clients ] && clients=$(hostname)
# The comma-separated list is split into words for get_node_count.
211 local num_clients=$(get_node_count ${clients//,/ })
214 # TODO: a free-space estimate is needed here.
216 generate_machine_file $clients $MACHINEFILE || \
217 error "can not generate machinefile $MACHINEFILE"
219 print_opts SIMUL clients simul_REP simul_THREADS
221 local testdir=$DIR/d0.simul
223 # mpi_run uses mpiuser
226 # -n # : repeat each test # times
227 # -N # : repeat the entire set of tests # times
# simul_REP is used for both the per-test (-n) and whole-set (-N) repeat counts.
229 local cmd="$SIMUL -d $testdir -n $simul_REP -N $simul_REP"
# Total MPI task count = number of client nodes * threads per client.
232 mpi_run -np $((num_clients * $simul_THREADS)) -machinefile ${MACHINEFILE} $cmd
235 if [ $rc != 0 ] ; then
236 error "simul failed! $rc"
# Register the test with the framework.
240 run_test simul "simul"
# test_connectathon: run the connectathon "runtests" script against a
# directory under $DIR. Skips (skip_env) when the connectathon directory or
# its runtests script is missing. Fails through error() when $rc is non-zero
# ($rc is set on a line not shown here).
242 test_connectathon() {
243 print_opts cnt_DIR cnt_NRUN
246 { skip_env "connectathon dir not found" && return; }
248 [ -e $cnt_DIR/runtests ] || \
249 { skip_env "No connectathon runtests found" && return; }
251 local testdir=$DIR/d0.connectathon
257 # -f a quick functionality test
258 # -a run basic, general, special, and lock tests
259 # -N numpasses - will be passed to the runtests script. This argument
260 # is optional. It specifies the number of times to run
# The command is relative ("./runtests"), so it is presumably run from
# $cnt_DIR on a line not shown here - confirm.
263 local cmd="./runtests -N $cnt_NRUN -a -f $testdir"
272 [ $rc = 0 ] || error "connectathon failed: $rc"
# Register the test with the framework.
275 run_test connectathon "connectathon"
# test_ior (body excerpt): run IOR under MPI across the clients.
# Skips (skip_env) when IOR is not found or when free space is too small for
# even a 1 GB block per task. Fails through error() when the machine file
# cannot be generated, when striping cannot be set, or when $rc is non-zero
# ($rc is set on a line not shown here).
279 { skip_env "IOR not found" && return; }
# Fall back to the local host when no client list is configured.
281 local clients=$CLIENTS
282 [ -z $clients ] && clients=$(hostname)
284 local num_clients=$(get_node_count ${clients//,/ })
# Fourth column of the last "df -P" line for $DIR (available space); the
# arithmetic below treats it as KB (GB * 1024 * 1024).
286 local space=$(df -P $DIR | tail -n 1 | awk '{ print $4 }')
287 echo "+ $ior_blockSize * 1024 * 1024 * $num_clients * $ior_THREADS "
# Only half of the free space may be used. When the requested total does not
# fit, shrink the per-task block size so that it does; skip when the result
# rounds down to 0. Note that this overwrites the global ior_blockSize.
288 if [ $((space / 2)) -le $(( ior_blockSize * 1024 * 1024 * num_clients * ior_THREADS)) ]; then
# Print the formula that is actually evaluated on the next line (space / 2).
289 echo "+ $space / 2 / 1024 / 1024 / $num_clients / $ior_THREADS"
290 ior_blockSize=$(( space /2 /1024 /1024 / num_clients / ior_THREADS ))
291 [ $ior_blockSize = 0 ] && \
292 skip_env "Need free space more than ($num_clients * $ior_THREADS )Gb: $((num_clients*ior_THREADS *1024 *1024*2)), have $space" && return
294 echo "free space=$space, Need: $num_clients x $ior_THREADS x $ior_blockSize Gb (blockSize reduced to $ior_blockSize Gb)"
297 generate_machine_file $clients $MACHINEFILE || \
298 error "can not generate machinefile $MACHINEFILE"
300 print_opts IOR ior_THREADS ior_DURATION MACHINEFILE
302 local testdir=$DIR/d0.ior
304 # mpi_run uses mpiuser
# Stripe the test directory with "-c -1": through the NFS server in NFSCLIENT
# mode, directly with $LFS otherwise (the "else" line is not shown here).
306 if [ "$NFSCLIENT" ]; then
307 setstripe_nfsserver $testdir -c -1 ||
308 { error "setstripe on nfsserver failed" && return 1; }
310 $LFS setstripe $testdir -c -1 ||
311 { error "setstripe failed" && return 2; }
314 # -b N blockSize -- contiguous bytes to write per task (e.g.: 8, 4k, 2m, 1g)"
316 # -t N transferSize -- size of transfer in bytes (e.g.: 8, 4k, 2m, 1g)"
317 # -w writeFile -- write file"
318 # -r readFile -- read existing file"
319 # -T maxTimeDuration -- max time in minutes to run tests"
320 # -k keepFile -- keep testFile(s) on program exit
321 local cmd="$IOR -a POSIX -b ${ior_blockSize}g -o $testdir/iorData -t 2m -v -w -r -T $ior_DURATION -k"
# Total MPI task count = number of client nodes * threads per client.
324 mpi_run -np $((num_clients * $ior_THREADS)) -machinefile ${MACHINEFILE} $cmd
327 if [ $rc != 0 ] ; then
328 error "ior failed! $rc"
# test_cascading_rw: run cascading_rw under MPI across the clients.
# Skipped in NFSCLIENT mode and (skip_env) when cascading_rw is not found.
# Fails through error() when the machine file cannot be generated or when $rc
# is non-zero ($rc is set on a line not shown here).
334 test_cascading_rw() {
335 if [ "$NFSCLIENT" ]; then
336 skip "skipped for NFSCLIENT mode"
341 { skip_env "cascading_rw not found" && return; }
# Fall back to the local host when no client list is configured.
343 local clients=$CLIENTS
344 [ -z $clients ] && clients=$(hostname)
# Declared local, as in the other MPI tests, so the node count does not leak
# into the global scope.
346 local num_clients=$(get_node_count ${clients//,/ })
349 # Need space estimation here.
351 generate_machine_file $clients $MACHINEFILE || \
352 error "can not generate machinefile $MACHINEFILE"
354 print_opts CASC_RW clients casc_THREADS casc_REP MACHINEFILE
356 local testdir=$DIR/d0.cascading_rw
358 # mpi_run uses mpiuser
362 # -n: repeat test # times
364 local cmd="$CASC_RW -g -d $testdir -n $casc_REP"
# Total MPI task count = number of client nodes * threads per client.
367 mpi_run -np $((num_clients * $casc_THREADS)) -machinefile ${MACHINEFILE} $cmd
370 if [ $rc != 0 ] ; then
371 error "cascading_rw failed! $rc"
# Register the test with the framework.
375 run_test cascading_rw "cascading_rw"
# test_write_append_truncate: run write_append_truncate under MPI across the
# clients, all tasks operating on one shared file. Skipped in NFSCLIENT mode
# and (skip_env) when the binary is not on PATH. Fails through error() when
# the machine file cannot be generated or when $rc is non-zero ($rc is set on
# a line not shown here).
377 test_write_append_truncate() {
378 if [ "$NFSCLIENT" ]; then
379 skip "skipped for NFSCLIENT mode"
383 # the binary is expected in the lustre/tests directory
384 if ! which write_append_truncate > /dev/null 2>&1 ; then
385 skip_env "write_append_truncate not found"
# Fall back to the local host when no client list is configured.
389 local clients=$CLIENTS
390 [ -z $clients ] && clients=$(hostname)
392 local num_clients=$(get_node_count ${clients//,/ })
395 # TODO: a free-space estimate is needed here.
397 generate_machine_file $clients $MACHINEFILE || \
398 error "can not generate machinefile $MACHINEFILE"
400 local testdir=$DIR/d0.write_append_truncate
401 local file=$testdir/f0.wat
403 print_opts clients write_REP write_THREADS MACHINEFILE
406 # mpi_run uses mpiuser
# Unlike the other tests, the program is invoked by bare name (resolved via
# PATH), matching the which(1) check above.
409 local cmd="write_append_truncate -n $write_REP $file"
# Total MPI task count = number of client nodes * threads per client.
412 mpi_run -np $((num_clients * $write_THREADS)) -machinefile ${MACHINEFILE} $cmd
415 if [ $rc != 0 ] ; then
416 error "write_append_truncate failed! $rc"
# Register the test with the framework.
421 run_test write_append_truncate "write_append_truncate"
# test_write_disjoint: run write_disjoint under MPI across the clients.
# Skipped in NFSCLIENT mode and (skip_env) when $WRITE_DISJOINT is empty.
# Fails through error() when the machine file cannot be generated or when $rc
# is non-zero ($rc is set on a line not shown here).
423 test_write_disjoint() {
424 if [ "$NFSCLIENT" ]; then
425 skip "skipped for NFSCLIENT mode"
429 [ x$WRITE_DISJOINT = x ] &&
430 { skip_env "write_disjoint not found" && return; }
# Fall back to the local host when no client list is configured.
432 local clients=$CLIENTS
433 [ -z $clients ] && clients=$(hostname)
435 local num_clients=$(get_node_count ${clients//,/ })
438 # TODO: a free-space estimate is needed here.
440 generate_machine_file $clients $MACHINEFILE || \
441 error "can not generate machinefile $MACHINEFILE"
443 print_opts WRITE_DISJOINT clients wdisjoint_THREADS wdisjoint_REP MACHINEFILE
444 local testdir=$DIR/d0.write_disjoint
446 # mpi_run uses mpiuser
# -f names the target file and -n carries the repeat count (wdisjoint_REP).
449 local cmd="$WRITE_DISJOINT -f $testdir/file -n $wdisjoint_REP"
# Total MPI task count = number of client nodes * threads per client.
452 mpi_run -np $((num_clients * $wdisjoint_THREADS)) -machinefile ${MACHINEFILE} $cmd
455 if [ $rc != 0 ] ; then
456 error "write_disjoint failed! $rc"
# Register the test with the framework.
460 run_test write_disjoint "write_disjoint"
# test_parallel_grouplock: run the parallel_grouplock subtests under MPI, one
# mpi_run per subtest, and fail at the end if any subtest failed.
# Skips when $PARALLEL_GROUPLOCK is empty. $rc, $subtest and the initial
# $status are set on lines not shown here.
462 test_parallel_grouplock() {
# NOTE(review): this uses skip, whereas the other missing-binary checks in
# this file use skip_env - confirm whether the difference is intended.
463 [ x$PARALLEL_GROUPLOCK = x ] &&
464 { skip "PARALLEL_GROUPLOCK not found" && return; }
# Fall back to the local host when no client list is configured.
466 local clients=$CLIENTS
467 [ -z $clients ] && clients=$(hostname)
# num_clients is not referenced by any visible line of this test; the task
# count below comes from parallel_grouplock_MINTASKS instead.
469 local num_clients=$(get_node_count ${clients//,/ })
471 generate_machine_file $clients $MACHINEFILE || \
472 error "can not generate machinefile $MACHINEFILE"
474 print_opts clients parallel_grouplock_MINTASKS MACHINEFILE
476 local testdir=$DIR/d0.parallel_grouplock
478 # mpi_run uses mpiuser
# Set llite max_rw_chunk to 0 on every client before running the subtests.
481 do_nodes $clients "lctl set_param llite.*.max_rw_chunk=0" ||
482 error "set_param max_rw_chunk=0 failed "
# Twelve iterations; $subtest is presumably derived from $i on a line not
# shown here - confirm.
487 for i in $(seq 12); do
489 local cmd="$PARALLEL_GROUPLOCK -g -v -d $testdir $subtest"
492 mpi_run -np $parallel_grouplock_MINTASKS -machinefile ${MACHINEFILE} $cmd
# A failing subtest is reported with error_noexit so the loop continues.
494 if [ $rc != 0 ] ; then
495 error_noexit "parallel_grouplock subtests $subtest failed! $rc"
497 echo "parallel_grouplock subtests $subtest PASS"
# Accumulate the exit codes; any non-zero rc makes the final status non-zero.
499 let status=$((status + rc))
500 # clear the debug log so that one log is collected per subtest
501 do_nodes $(comma_list $(nodes_list)) lctl clear
503 [ $status -eq 0 ] || error "parallel_grouplock status: $status"
# Register the test with the framework.
506 run_test parallel_grouplock "parallel_grouplock"
# statahead tunables: mount-point count and number of files to create.
508 statahead_NUMMNTPTS=${statahead_NUMMNTPTS:-5}
509 statahead_NUMFILES=${statahead_NUMFILES:-500000}
# cleanup_statahead: unmount the extra client mount points used by the
# statahead test. It is called with the client list, the mount-point root and
# the mount-point count; the lines assigning clients, mntpt_root and
# num_mntpts from those arguments are not visible in this excerpt.
511 cleanup_statahead () {
# "seq 0 $num_mntpts" yields num_mntpts + 1 values (0..num_mntpts); the mount
# loop in the statahead test uses the same range.
518 for i in $(seq 0 $num_mntpts);do
519 zconf_umount_clients $clients ${mntpt_root}$i ||
520 error_exit "Failed to umount lustre on ${mntpt_root}$i"
# test_statahead (body excerpt): create many files in one directory, mount the
# filesystem on several extra mount points on every client, drop the mdc
# locks, then list the directory through each mount point. Fails through
# error() when file creation reports a non-zero $rc ($rc is set on a line not
# shown here) and through error_exit when a mount fails.
528 local dir=d0.statahead
529 # FIXME has to use DIR
530 local testdir=$DIR/$dir
534 local num_files=$statahead_NUMFILES
# Compare the available inode count with the requested file count (the body
# of this branch is not visible in this excerpt).
536 local IFree=$(inodes_available)
537 if [ $IFree -lt $num_files ]; then
543 log "createmany -o $testdir/f-%d $num_files"
# Use the literal "f-%d" pattern that the log line above reports. The earlier
# "$f-%d" expanded an undefined variable, so the files were named "-%d".
544 createmany -o $testdir/f-%d $num_files
547 if [ $rc != 0 ] ; then
548 error "createmany failed to create $rc"
552 local num_mntpts=$statahead_NUMMNTPTS
553 local mntpt_root=$TMP/mntpt/lustre
# Mount options: MNTOPTSTATAHEAD when set, otherwise MOUNTOPT.
554 mntopts=${MNTOPTSTATAHEAD:-$MOUNTOPT}
# Fall back to the local host when no client list is configured.
556 local clients=$CLIENTS
557 [ -z $clients ] && clients=$(hostname)
559 echo "Mounting $num_mntpts lustre clients starts on $clients"
# The trap string is double-quoted, so the three values are expanded now,
# when the trap is installed, not when it fires.
560 trap "cleanup_statahead $clients $mntpt_root $num_mntpts" EXIT ERR
# "seq 0 $num_mntpts" yields num_mntpts + 1 mount points (suffixes
# 0..num_mntpts); cleanup_statahead unmounts the same range.
561 for i in $(seq 0 $num_mntpts);do
562 zconf_mount_clients $clients ${mntpt_root}$i $mntopts ||
563 error_exit "Failed to mount lustre on ${mntpt_root}$i on $clients"
# Drop the mdc locks on every client before listing.
566 do_rpc_nodes $clients cancel_lru_locks mdc
568 do_rpc_nodes $clients do_ls $mntpt_root $num_mntpts $dir
570 cleanup_statahead $clients $mntpt_root $num_mntpts
# Register the test with the framework.
573 run_test statahead "statahead test, multiple clients"
# End of suite: print a banner containing this script's base name, then tear
# the filesystem down.
575 equals_msg `basename $0`: test complete, cleaning up
576 check_and_cleanup_lustre
# When the suite log exists, print it and exit 1 if it contains "FAIL".
# In every other case the trailing "|| true" leaves the script with status 0.
577 [ -f "$TESTSUITELOG" ] && cat $TESTSUITELOG && grep -q FAIL $TESTSUITELOG && exit 1 || true