diff --git a/src/common.cu b/src/common.cu index b7c3e0c0a8..99b1d59cdd 100644 --- a/src/common.cu +++ b/src/common.cu @@ -13,6 +13,7 @@ #include #include #include "cuda.h" +#include <errno.h> /* program_invocation_short_name */ #include "../verifiable/verifiable.h" @@ -1011,6 +1012,7 @@ testResult_t run() { #endif is_main_thread = is_main_proc = (proc == 0) ? 1 : 0; + PRINT("# Collective test starting: %s\n", program_invocation_short_name); PRINT("# nThread %d nGpus %d minBytes %ld maxBytes %ld step: %ld(%s) warmup iters: %d iters: %d agg iters: %d validation: %d graph: %d\n", nThreads, nGpus, minBytes, maxBytes, (stepFactor > 1)?stepFactor:stepBytes, (stepFactor > 1)?"factor":"bytes", @@ -1268,6 +1270,7 @@ testResult_t run() { PRINT("# Out of bounds values : %d %s\n", errors[0], errors[0] ? "FAILED" : "OK"); PRINT("# Avg bus bandwidth : %g %s\n", bw[0], check_avg_bw == -1 ? "" : (bw[0] < check_avg_bw*(0.9) ? "FAILED" : "OK")); PRINT("#\n"); + PRINT("# Collective test concluded: %s\n", program_invocation_short_name); #ifdef MPI_SUPPORT MPI_Comm_free(&mpi_comm); MPI_Finalize();