#
# Test harness helpers: run-directory setup, command-line option parsing and
# the functions used to run a test command, report the result in TAP form and
# write per-test counts.
#
# NOTE(review): this file has no shebang and reads several variables it never
# assigns (runfiles, exec, petsc_dir, executable, label, timeoutfactor,
# testlogtapfile, testlogerrfile, filter, filter_output, mpiexec, args), so it
# is presumably sourced by a per-test script that defines them first -- confirm
# against the generator of those scripts.
#

scriptname=$(basename "$0")
rundir=${scriptname%.sh}
TIMEOUT=60

# Always work from the directory that holds the calling script.  The original
# guard (test "$PWD"!=...) lacked spaces around != and was therefore always
# true; the unconditional form keeps that behavior and guarantees that
# abspath_scriptdir is set for the compile step below.
cd "$(dirname "$0")" || exit 1
abspath_scriptdir=$PWD

# Remove stale outputs from a previous run of the same test
if test -d "${rundir}" && test -n "${rundir}"; then
  rm -f "${rundir}"/*.tmp "${rundir}"/*.err "${rundir}"/*.out
fi
mkdir -p "${rundir}"
if test -n "${runfiles}"; then
  # runfiles is a whitespace-separated list, hence the unquoted expansion
  for runfile in ${runfiles}; do
    subdir=$(dirname "${runfile}")
    mkdir -p "${rundir}/${subdir}"
    cp -r "${runfile}" "${rundir}/${subdir}"
  done
fi
cd "${rundir}"

#
# Method to print out general and script specific options
#
# Arguments: $1 - optional exit status
# Outputs:   usage text on stderr, followed by whatever extrausage prints if
#            a function of that name is defined
# Exits the shell; never returns.
#
print_usage() {

cat >&2 <<EOF
Usage: $0 [options]

OPTIONS
  -a <args> ......... Override default arguments
  -c ................ Cleanup (remove generated files)
  -C ................ Compile
  -d ................ Launch in debugger
  -e <args> ......... Add extra arguments to default
  -f ................ force attempt to run test that would otherwise be skipped
  -h ................ help: print this message
  -n <integer> ...... Override the number of processors to use
  -j ................ Pass -j to petscdiff (just use diff)
  -J <arg> .......... Pass -J to petscdiff (just use diff with arg)
  -m ................ Update results using petscdiff
  -M ................ Update alt files using petscdiff
  -o <arg> .......... Output format: 'interactive', 'err_only'
  -p ................ Print command:  Print first command and exit
  -t <integer> ...... Override the default timeout (default=$TIMEOUT sec)
  -U ................ run cUda-memcheck
  -V ................ run Valgrind
  -v ................ Verbose: Print commands
EOF

  if declare -f extrausage > /dev/null; then extrausage; fi
  # $1 is intentionally unquoted: when no status is given this is a bare
  # "exit", which reuses the status of the previous command.
  exit $1
}
###
##  Arguments for overriding things
#
output_fmt="interactive"
verbose=false
cleanup=false
compile=false
debugger=false
printcmd=false
mpiexec_function=false
force=false
diff_flags=""
while getopts "a:cCde:fhjJ:mMn:o:pt:UvV" arg
do
  case $arg in
    a ) args="$OPTARG"       ;;
    c ) cleanup=true         ;;
    C ) compile=true         ;;
    d ) debugger=true        ;;
    e ) extra_args="$OPTARG" ;;
    f ) force=true           ;;
    h ) print_usage; exit    ;;
    n ) nsize="$OPTARG"      ;;
    j ) diff_flags=$diff_flags" -j"      ;;
    J ) diff_flags=$diff_flags" -J $OPTARG" ;;
    m ) diff_flags=$diff_flags" -m"      ;;
    M ) diff_flags=$diff_flags" -M"      ;;
    o ) output_fmt=$OPTARG   ;;
    p ) printcmd=true        ;;
    t ) TIMEOUT=$OPTARG      ;;
    U ) mpiexec="petsc_mpiexec_cudamemcheck $mpiexec"
        mpiexec_function=true
        ;;
    V ) mpiexec="petsc_mpiexec_valgrind $mpiexec"
        mpiexec_function=true
        ;;
    v ) verbose=true         ;;
    *)  # To take care of any extra args
      # NOTE(review): with this optstring getopts reports an unknown option
      # by setting arg to "?", so the eval below ends up running "?=found"
      # as a command -- confirm whether this arm is still wanted.
      if test -n "$OPTARG"; then
        eval $arg=\"$OPTARG\"
      else
        eval $arg=found
      fi
      ;;
  esac
done
shift $(( $OPTIND - 1 ))

# Individual tests can extend the default
export MPIEXEC_TIMEOUT=$((TIMEOUT*timeoutfactor))
STARTTIME=$(date +%s)

if test -n "$extra_args"; then
  args="$args $extra_args"
fi
if $debugger; then
  args="-start_in_debugger $args"
fi
if test -n "$filter"; then
  diff_flags=$diff_flags" -F \$'$filter'"
fi
if test -n "$filter_output"; then
  diff_flags=$diff_flags" -f \$'$filter_output'"
fi


# Init
success=0; failed=0; failures=""; rmfiles=""
total=0
todo=-1; skip=-1
job_level=0

if $compile; then
  curexec=$(basename "${exec}")
  fullexec=${abspath_scriptdir}/${curexec}
  # Make target = executable path with the leading ${petsc_dir}/ removed
  maketarget=$(echo "${fullexec}" | sed "s#${petsc_dir}/*##")
  (cd "$petsc_dir" && make -f gmakefile.test "${maketarget}")
fi

###
##   Rest of code is functions
#

#
# Emit one TAP result line: "<notornot> ok <label>[ # <comment>]".
#
# Globals:   testlogtapfile (appended to), testlogerrfile (appended to in
#            err_only mode), output_fmt (read);
#            notornot, test_label, comment, tap_message (written)
# Arguments: $1 - "not" for a failure, empty for a success
#            $2 - test label
#            $3 - optional comment
# Outputs:   the line on stdout, except that in err_only mode successes are
#            only written to the TAP log
#
function petsc_report_tapoutput() {
  notornot=$1
  test_label=$2
  comment=$3
  if test -n "$comment"; then
    comment=" # ${comment}"
  fi

  tap_message="${notornot} ok ${test_label}${comment}"

  # Log messages.  The message is passed as data, never as the printf format:
  # labels and (in verbose mode) whole command lines may contain % or
  # backslashes.
  printf '%s\n' "${tap_message}" >> "${testlogtapfile}"

  if test "${output_fmt}" == "err_only"; then
     if test -n "${notornot}"; then
        # testlogerrfile stays unquoted so that an unset value degrades to a
        # plain pass-through instead of a tee error
        printf '%s\n' "${tap_message}" | tee -a ${testlogerrfile}
     fi
  else
     printf '%s\n' "${tap_message}"
  fi
}

#
# Print the command in a form that can be run from PETSC_DIR, then exit.
#
# Globals:   petsc_dir, mpiexec_function (read); cmd, basedir, modcmd (written)
# Arguments: $1 - full command line including redirections
# Exits the shell; never returns.
#
function printcmd() {
  # Print command that can be run from PETSC_DIR
  cmd="$1"
  basedir=$(dirname ${PWD} | sed "s#${petsc_dir}/##")
  # Replace the first ".." with the directory relative to petsc_dir, drop the
  # redirections, and double every % because the result is used as a printf
  # format below (the original doubled only the first one).
  modcmd=$(echo ${cmd} | sed -e "s#\.\.#${basedir}#" | sed 's#>.*##' | sed 's#%#%%#g')
  if $mpiexec_function; then
     # Have to expand valgrind/cudamemcheck
     modcmd=$(eval "$modcmd")
  fi
  printf "${modcmd}\n"
  exit
}

#
# Run one test command, classify the outcome and report it.
#
# Globals:   printcmd, verbose, MPIEXEC_TIMEOUT, testlogerrfile (read);
#            rmfiles, success, failed, failures, total (updated);
#            tlabel, error, cmd, cmd_res, timed_out, comment (written)
# Arguments: $1 - basic command
#            $2 - stdout file
#            $3 - stderr file
#            $4 - label for reporting
#            $5 - optional; when non-empty stderr is merged into stdout and
#                 the exit status of the command is ignored
# Outputs:   TAP line on stdout; for non-timeout failures also the captured
#            output, each line prefixed with "#<TAB>"
# Returns:   the (possibly adjusted) exit status of the command
#
function petsc_testrun() {
  rmfiles="${rmfiles} $2 $3"
  tlabel=$4
  error=$5
  # Start every run with a clean timeout flag.  Without this, one timed-out
  # run made every later failure in the same script report "Exceeded timeout
  # limit" and hid its error output.
  timed_out=""
  cmd="$1 > $2 2> $3"
  if test -n "$error"; then
    cmd="$1 1> $2 2>&1"
  fi
  # Keep a copy of the exact command as a runnable script
  echo "$cmd" > "${tlabel}.sh"; chmod 755 "${tlabel}.sh"
  if $printcmd; then
     printcmd "$cmd"
  fi

  eval "{ time -p $cmd ; } 2>> timing.out"
  cmd_res=$?
  # If testing the error output then we don't test the error code itself
  if test -n "$error"; then
     cmd_res=0
  fi
  # If it is a lack of GPU resources or MPI failure (Intel) then try once more
  # See: src/sys/error/err.c
  # Error #134 added to handle problems with the Radeon card for hip testing
  case "$cmd_res" in
    96|97|98|134)
      printf '# retrying %s\n' "${tlabel}" | tee -a ${testlogerrfile}
      sleep 3
      eval "{ time -p $cmd ; } 2>> timing.out"
      cmd_res=$?
      ;;
  esac
  # Make sure both files exist for the grep/awk calls below
  touch "$2" "$3"
  # It appears current MPICH and Open MPI just shut down the job execution and do not return an error code to the executable
  # ETIMEDOUT=110 was used by Open MPI 3.0.  MPICH used 255
  # Earlier Open MPI versions returned 1 and the error string
  if [[ $cmd_res -eq 110 || $cmd_res -eq 255 ]] || \
     grep -F -q -s 'APPLICATION TIMED OUT' "$2" "$3" || \
     grep -F -q -s MPIEXEC_TIMEOUT "$2" "$3" || \
     grep -F -q -s 'APPLICATION TERMINATED WITH THE EXIT STRING: job ending due to timeout' "$2" "$3" || \
     grep -q -s "Timeout after [0-9]* seconds. Terminating job" "$2" "$3"; then
    timed_out=1
    # If timed out, then ensure non-zero error code
    if [[ $cmd_res -eq 0 ]]; then
      cmd_res=1
    fi
  fi

  # Report errors
  comment=""
  if [[ $cmd_res -eq 0 ]]; then
     if "${verbose}"; then
       comment="${cmd}"
     fi
     petsc_report_tapoutput "" "$tlabel" "$comment"
     success=$((success+1))
  else
     if [ -n "$timed_out" ]; then
       comment="Exceeded timeout limit of $MPIEXEC_TIMEOUT s"
     else
       comment="Error code: ${cmd_res}"
     fi
     petsc_report_tapoutput "not" "$tlabel" "$comment"

     # Report errors in detail
     if [ -z "$timed_out" ]; then
       # We've had tests fail but stderr->stdout, as well as having
       # mpi_abort go to stderr which throws this test off.  Show both
       # with stdout first
       awk '{print "#\t" $0}' < "$2" | tee -a ${testlogerrfile}
       # if statement is for diff tests
       if test "$2" != "$3"; then
         awk '{print "#\t" $0}' < "$3" | tee -a ${testlogerrfile}
       fi
     fi
     failed=$((failed+1))
     failures="$failures $tlabel"
  fi
  total=$((success+failed))
  return $cmd_res
}

#
# Write the counts file for this test and optionally clean up.
#
# Globals:   label, total, success, failed, failures, todo, skip, cleanup,
#            rmfiles (read); logfile, logdir, ENDTIME, timing (written)
# Arguments: $1 - directory under which counts/<label>.counts is written
# Outputs:   "Cleaning up" on stdout when cleanup is enabled
#
function petsc_testend() {
  logfile=$1/counts/${label}.counts
  logdir=$(dirname "$logfile")
  if ! test -d "$logdir"; then
    mkdir -p "$logdir"
  fi
  if ! test -e "$logfile"; then
    touch "$logfile"
  fi
  printf 'total %s\n' "$total" > "$logfile"
  printf 'success %s\n' "$success" >> "$logfile"
  printf 'failed %s\n' "$failed" >> "$logfile"
  printf 'failures %s\n' "$failures" >> "$logfile"
  if test ${todo} -gt 0; then
    printf 'todo %s\n' "$todo" >> "$logfile"
  fi
  if test ${skip} -gt 0; then
    printf 'skip %s\n' "$skip" >> "$logfile"
  fi
  ENDTIME=$(date +%s)
  # Two numbers taken from the user/sys lines that "time -p" appended to
  # timing.out: the running maximum as tracked by the awk comparison, and the
  # sum of all entries.
  timing=$(touch timing.out && grep -E '(user|sys)' timing.out | awk '{if( sum1 == "" || $2 > sum1 ) { sum1=sprintf("%.2f",$2) } ; sum2 += sprintf("%.2f",$2)} END {printf "%.2f %.2f\n",sum1,sum2}')
  printf 'time %s\n' "$timing" >> "$logfile"
  if $cleanup; then
    echo "Cleaning up"
    # rmfiles is a whitespace-separated list, hence unquoted
    /bin/rm -f $rmfiles
  fi
}

#
# mpiexec wrapper that inserts the CUDA memory checker in front of the test
# executable.
#
# Globals:   PETSC_CUDAMEMCHECK_COMMAND, PETSC_CUDAMEMCHECK_ARGS, executable,
#            printcmd (read); memcheck_cmd, memcheck_args, pre_args, re
#            (written)
# Arguments: the full mpiexec command line
# Outputs:   with printcmd enabled, the rewritten command line; otherwise the
#            output of the command minus the checker's banner and
#            zero-error/zero-leak summary lines
#
function petsc_mpiexec_cudamemcheck() {
  # loops over the argument list to find the call to the test executable and insert the
  # cuda memcheck command before it.
  # first check if compute-sanitizer exists, since cuda-memcheck is deprecated from CUDA
  # 11-ish onwards
  if command -v compute-sanitizer &> /dev/null; then
    memcheck_cmd="${PETSC_CUDAMEMCHECK_COMMAND:-compute-sanitizer}"
    declare -a default_args_to_check=('--target-processes all' '--track-stream-ordered-races all')
  else
    memcheck_cmd="${PETSC_CUDAMEMCHECK_COMMAND:-cuda-memcheck}"
    declare -a default_args_to_check=('--flush-to-disk yes')
  fi
  if [[ -z ${PETSC_CUDAMEMCHECK_ARGS} ]]; then
    # if user has not set the memcheck args themselves loop over the predefined default
    # arguments and check if they can be used
    memcheck_args='--leak-check full --report-api-errors no '
    for option in "${default_args_to_check[@]}"; do
      # Unquoted on purpose: each string holds several words
      ${memcheck_cmd} ${memcheck_args} ${option} &> /dev/null
      if [ $? -eq 0 ]; then
        memcheck_args+="${option} "
      fi
    done
  else
    memcheck_args="${PETSC_CUDAMEMCHECK_ARGS}"
  fi
  pre_args=()
  # regex to detect where the test lives in the command line. This
  # marks the end of the options to mpiexec, and hence where we should insert the
  # cuda-memcheck command
  re="${executable}"
  for i in "$@"; do
    # first occurrence of the presence of petsc_arch is the executable,
    # except when we install MPI ourselves
    if [[ $i =~ ${re} ]]; then
      # found it, put cuda memcheck command in
      pre_args+=("${memcheck_cmd} ${memcheck_args}")
      break
    fi
    pre_args+=("$i")
    # consume the argument so that "$@" ends up starting at the executable
    shift
  done
  # run command, but filter out
  #  ===== CUDA-MEMCHECK or ==== COMPUTE-SANITIZER
  # and
  #  ===== ERROR SUMMARY: 0 errors
  #
  # ${pre_args[@]} is unquoted on purpose: the checker command and its
  # arguments were stored as a single element and must be split into words.
  if ${printcmd}; then
    echo ${pre_args[@]} "$@"
  else
    ${pre_args[@]} "$@" \
      | grep -v 'CUDA-MEMCHECK' \
      | grep -v 'COMPUTE-SANITIZER' \
      | grep -v 'LEAK SUMMARY: 0 bytes leaked in 0 allocations' \
      | grep -v 'ERROR SUMMARY: 0 errors' || [[ $? == 1 ]]
  fi
  # last or is needed to suppress grep exiting with error code 1 if it doesn't find a
  # match
}

#
# mpiexec wrapper that inserts valgrind in front of the test executable.
#
# Globals:   PETSC_DIR, executable, printcmd (read);
#            valgrind_cmd, pre_args, re (written)
# Arguments: the full mpiexec command line
# Outputs:   with printcmd enabled, the rewritten command line; otherwise the
#            output of the command
#
function petsc_mpiexec_valgrind() {
  valgrind_cmd="valgrind -q --tool=memcheck --leak-check=yes --num-callers=20 --track-origins=yes --keep-debuginfo=yes --suppressions=${PETSC_DIR}/share/petsc/suppressions/valgrind --error-exitcode=10"
  pre_args=()
  re="${executable}"
  for i in "$@"; do
    # The first argument matching the executable marks the end of the
    # launcher options
    if [[ $i =~ ${re} ]]; then
      pre_args+=("${valgrind_cmd}")
      break
    fi
    pre_args+=("$i")
    shift
  done
  # ${pre_args[@]} is unquoted on purpose: valgrind_cmd is one element that
  # must be split into words
  if ${printcmd}; then
    echo ${pre_args[@]} "$@"
  else
    ${pre_args[@]} "$@"
  fi
}
export LC_ALL=C