It might be better to benchmark MPI codes without synchronization because of overhead of timing individual steps

2020-03-31 12:37:54 +02:00
parent 742dcc2697
commit 9b6d927cf1
1 changed files with 15 additions and 1 deletions
--- a/samples/benchmark/main.cc
+++ b/samples/benchmark/main.cc
@@ -96,6 +96,20 @@ main(void)
    // Benchmark
    Timer t;
    const AcReal dt             = FLT_EPSILON;
+
+	acGridSynchronizeStream(STREAM_ALL);
+	timer_reset(&t);
+	acGridSynchronizeStream(STREAM_ALL);
+
+	const size_t num_iters = 50;
+	for (size_t i = 0; i < num_iters; ++i)
+		acGridIntegrate(STREAM_DEFAULT, dt);
+
+	acGridSynchronizeStream(STREAM_ALL);
+	if (!pid)
+		timer_diff_print(t);
+	acGridSynchronizeStream(STREAM_ALL);
+	/*
    const size_t num_iters      = 100;
    const double nth_percentile = 0.90;

@@ -135,7 +149,7 @@ main(void)
        fprintf(fp, "%d, %g\n", nprocs, results[nth_percentile * num_iters]);

        fclose(fp);
-    }
+    }*/

    acGridQuit();
    MPI_Finalize();