scriptname=`basename $0` rundir=${scriptname%.sh} TIMEOUT=60 if test "$PWD"!=`dirname $0`; then cd `dirname $0` abspath_scriptdir=$PWD fi if test -d "${rundir}" && test -n "${rundir}"; then rm -f ${rundir}/*.tmp ${rundir}/*.err ${rundir}/*.out fi mkdir -p ${rundir} if test -n "${runfiles}"; then for runfile in ${runfiles}; do subdir=`dirname ${runfile}` mkdir -p ${rundir}/${subdir} cp -r ${runfile} ${rundir}/${subdir} done fi cd ${rundir} # # Method to print out general and script specific options # print_usage() { cat >&2 < ......... Override default arguments -c ................ Cleanup (remove generated files) -C ................ Compile -d ................ Launch in debugger -e ......... Add extra arguments to default -f ................ force attempt to run test that would otherwise be skipped -h ................ help: print this message -n ...... Override the number of processors to use -j ................ Pass -j to petscdiff (just use diff) -J .......... Pass -J to petscdiff (just use diff with arg) -m ................ Update results using petscdiff -M ................ Update alt files using petscdiff -o .......... Output format: 'interactive', 'err_only' -p ................ Print command: Print first command and exit -t ................ Override the default timeout (default=$TIMEOUT sec) -U ................ run cUda-memcheck -V ................ run Valgrind -v ................ Verbose: Print commands EOF if declare -f extrausage > /dev/null; then extrausage; fi exit $1 } ### ## Arguments for overriding things # output_fmt="interactive" verbose=false cleanup=false compile=false debugger=false printcmd=false mpiexec_function=false force=false diff_flags="" while getopts "a:cCde:fhjJ:mMn:o:pt:UvV" arg do case $arg in a ) args="$OPTARG" ;; c ) cleanup=true ;; C ) compile=true ;; d ) debugger=true ;; e ) extra_args="$OPTARG" ;; f ) force=true ;; h ) print_usage; exit ;; n ) nsize="$OPTARG" ;; j ) diff_flags=$diff_flags" -j" ;; J ) diff_flags=$diff_flags" -J $OPTARG" ;; m ) diff_flags=$diff_flags" -m" ;; M ) diff_flags=$diff_flags" -M" ;; o ) output_fmt=$OPTARG ;; p ) printcmd=true ;; t ) TIMEOUT=$OPTARG ;; U ) mpiexec="petsc_mpiexec_cudamemcheck $mpiexec" mpiexec_function=true ;; V ) mpiexec="petsc_mpiexec_valgrind $mpiexec" mpiexec_function=true ;; v ) verbose=true ;; *) # To take care of any extra args if test -n "$OPTARG"; then eval $arg=\"$OPTARG\" else eval $arg=found fi ;; esac done shift $(( $OPTIND - 1 )) # Individual tests can extend the default export MPIEXEC_TIMEOUT=$((TIMEOUT*timeoutfactor)) STARTTIME=`date +%s` if test -n "$extra_args"; then args="$args $extra_args" fi if $debugger; then args="-start_in_debugger $args" fi if test -n "$filter"; then diff_flags=$diff_flags" -F \$'$filter'" fi if test -n "$filter_output"; then diff_flags=$diff_flags" -f \$'$filter_output'" fi # Init success=0; failed=0; failures=""; rmfiles="" total=0 todo=-1; skip=-1 job_level=0 if $compile; then curexec=`basename ${exec}` fullexec=${abspath_scriptdir}/${curexec} maketarget=`echo ${fullexec} | sed "s#${petsc_dir}/*##"` (cd $petsc_dir && make -f gmakefile.test ${maketarget}) fi ### ## Rest of code is functions # function petsc_report_tapoutput() { notornot=$1 test_label=$2 comment=$3 if test -n "$comment"; then comment=" # ${comment}" fi tap_message="${notornot} ok ${test_label}${comment}" # Log messages printf "${tap_message}\n" >> ${testlogtapfile} if test ${output_fmt} == "err_only"; then if test -n "${notornot}"; then printf "${tap_message}\n" | tee -a ${testlogerrfile} fi else printf "${tap_message}\n" fi } function printcmd() { # Print command that can be run from PETSC_DIR cmd="$1" basedir=`dirname ${PWD} | sed "s#${petsc_dir}/##"` modcmd=`echo ${cmd} | sed -e "s#\.\.#${basedir}#" | sed s#\>.*## | sed s#\%#\%\%#` if $mpiexec_function; then # Have to expand valgrind/cudamemcheck modcmd=`eval "$modcmd"` fi printf "${modcmd}\n" exit } function petsc_testrun() { # First arg = Basic command # Second arg = stdout file # Third arg = stderr file # Fourth arg = label for reporting rmfiles="${rmfiles} $2 $3" tlabel=$4 error=$5 cmd="$1 > $2 2> $3" if test -n "$error"; then cmd="$1 1> $2 2>&1" fi echo "$cmd" > ${tlabel}.sh; chmod 755 ${tlabel}.sh if $printcmd; then printcmd "$cmd" fi eval "{ time -p $cmd ; } 2>> timing.out" cmd_res=$? # If testing the error output then we don't test the error code itself if test -n "$error"; then cmd_res=0 fi # If it is a lack of GPU resources or MPI failure (Intel) then try once more # See: src/sys/error/err.c # Error #134 added to handle problems with the Radeon card for hip testing if [ $cmd_res -eq 96 -o $cmd_res -eq 97 -o $cmd_res -eq 98 -o $cmd_res -eq 134 ]; then printf "# retrying ${tlabel}\n" | tee -a ${testlogerrfile} sleep 3 eval "{ time -p $cmd ; } 2>> timing.out" cmd_res=$? fi touch "$2" "$3" # It appears current MPICH and Open MPI just shut down the job execution and do not return an error code to the executable # ETIMEDOUT=110 was used by Open MPI 3.0. MPICH used 255 # Earlier Open MPI versions returned 1 and the error string if [ $cmd_res -eq 110 -o $cmd_res -eq 255 ] || \ grep -F -q -s 'APPLICATION TIMED OUT' "$2" "$3" || \ grep -F -q -s MPIEXEC_TIMEOUT "$2" "$3" || \ grep -F -q -s 'APPLICATION TERMINATED WITH THE EXIT STRING: job ending due to timeout' "$2" "$3" || \ grep -q -s "Timeout after [0-9]* seconds. Terminating job" "$2" "$3"; then timed_out=1 # If timed out, then ensure non-zero error code if [ $cmd_res -eq 0 ]; then cmd_res=1 fi fi # Report errors comment="" if test $cmd_res == 0; then if "${verbose}"; then comment="${cmd}" fi petsc_report_tapoutput "" "$tlabel" "$comment" let success=$success+1 else if [ -n "$timed_out" ]; then comment="Exceeded timeout limit of $MPIEXEC_TIMEOUT s" else comment="Error code: ${cmd_res}" fi petsc_report_tapoutput "not" "$tlabel" "$comment" # Report errors in detail if [ -z "$timed_out" ]; then # We've had tests fail but stderr->stdout, as well as having # mpi_abort go to stderr which throws this test off. Show both # with stdout first awk '{print "#\t" $0}' < $2 | tee -a ${testlogerrfile} # if statement is for diff tests if test "$2" != "$3"; then awk '{print "#\t" $0}' < $3 | tee -a ${testlogerrfile} fi fi let failed=$failed+1 failures="$failures $tlabel" fi let total=$success+$failed return $cmd_res } function petsc_testend() { logfile=$1/counts/${label}.counts logdir=`dirname $logfile` if ! test -d "$logdir"; then mkdir -p $logdir fi if ! test -e "$logfile"; then touch $logfile fi printf "total $total\n" > $logfile printf "success $success\n" >> $logfile printf "failed $failed\n" >> $logfile printf "failures $failures\n" >> $logfile if test ${todo} -gt 0; then printf "todo $todo\n" >> $logfile fi if test ${skip} -gt 0; then printf "skip $skip\n" >> $logfile fi ENDTIME=`date +%s` timing=`touch timing.out && grep -E '(user|sys)' timing.out | awk '{if( sum1 == "" || $2 > sum1 ) { sum1=sprintf("%.2f",$2) } ; sum2 += sprintf("%.2f",$2)} END {printf "%.2f %.2f\n",sum1,sum2}'` printf "time $timing\n" >> $logfile if $cleanup; then echo "Cleaning up" /bin/rm -f $rmfiles fi } function petsc_mpiexec_cudamemcheck() { # loops over the argument list to find the call to the test executable and insert the # cuda memcheck command before it. # first check if compute-sanitizer exists, since cuda-memcheck is deprecated from CUDA # 11-ish onwards if command -v compute-sanitizer &> /dev/null; then memcheck_cmd="${PETSC_CUDAMEMCHECK_COMMAND:-compute-sanitizer}" declare -a default_args_to_check=('--target-processes all' '--track-stream-ordered-races all') else memcheck_cmd="${PETSC_CUDAMEMCHECK_COMMAND:-cuda-memcheck}" declare -a default_args_to_check=('--flush-to-disk yes') fi if [[ -z ${PETSC_CUDAMEMCHECK_ARGS} ]]; then # if user has not set the memcheck args themselves loop over the predefined default # arguments and check if they can be used memcheck_args='--leak-check full --report-api-errors no ' for option in "${default_args_to_check[@]}"; do ${memcheck_cmd} ${memcheck_args} ${option} &> /dev/null if [ $? -eq 0 ]; then memcheck_args+="${option} " fi done else memcheck_args="${PETSC_CUDAMEMCHECK_ARGS}" fi pre_args=() # regex to detect where the test lives in the command line. This # marks the end of the options to mpiexec, and hence where we should insert the # cuda-memcheck command re="${executable}" for i in "$@"; do # first occurrence of the presence of petsc_arch is the executable, # except when we install MPI ourselves if [[ $i =~ ${re} ]]; then # found it, put cuda memcheck command in pre_args+=("${memcheck_cmd} ${memcheck_args}") break fi pre_args+=("$i") shift done # run command, but filter out # ===== CUDA-MEMCHECK or ==== COMPUTE-SANITIZER # and # ===== ERROR SUMMARY: 0 errors if ${printcmd}; then echo ${pre_args[@]} "$@" else ${pre_args[@]} "$@" \ | grep -v 'CUDA-MEMCHECK' \ | grep -v 'COMPUTE-SANITIZER' \ | grep -v 'LEAK SUMMARY: 0 bytes leaked in 0 allocations' \ | grep -v 'ERROR SUMMARY: 0 errors' || [[ $? == 1 ]] fi # last or is needed to suppress grep exiting with error code 1 if it doesn't find a # match } function petsc_mpiexec_valgrind() { valgrind_cmd="valgrind -q --tool=memcheck --leak-check=yes --num-callers=20 --track-origins=yes --keep-debuginfo=yes --suppressions=${PETSC_DIR}/share/petsc/suppressions/valgrind --error-exitcode=10" pre_args=() re="${executable}" for i in "$@"; do if [[ $i =~ ${re} ]]; then pre_args+=("${valgrind_cmd}") break fi pre_args+=("$i") shift done if ${printcmd}; then echo ${pre_args[@]} "$@" else ${pre_args[@]} "$@" fi } export LC_ALL=C