#include "bench/bench.hpp"

#include <mpi.h>

#include <cstddef>
#include <vector>

/// Benchmark body: performs an in-place MPI_Allreduce (MPI_SUM) over a
/// fixed 1000-element byte buffer on MPI_COMM_WORLD, once per iteration of
/// the loop over `state`.
///
/// After the loop, reports `sz * world_size` to the harness via
/// `set_bytes_processed`.
///
/// @param state  Benchmark state object supplied by the bench harness; it
///               drives the iteration loop and receives the byte count.
void allreduce(bench::State &state) {
  const int size = bench::world_size();
  const std::size_t sz = 1000;

  // Zero-initialised and owned by the vector, so the reduction never reads
  // indeterminate bytes and the storage is released on every exit path.
  std::vector<unsigned char> data(sz);

  for (auto _ : state) {
    // MPI_SUM is not defined for MPI_BYTE (only the bitwise operations are),
    // so the buffer is reduced as MPI_UNSIGNED_CHAR, which has the same
    // one-byte element size. MPI_IN_PLACE makes `data` both input and output.
    MPI_Allreduce(MPI_IN_PLACE, data.data(), static_cast<int>(sz),
                  MPI_UNSIGNED_CHAR, MPI_SUM, MPI_COMM_WORLD);
  }

  state.set_bytes_processed(sz * size);
}

/// Entry point: initialises the bench harness with the command-line
/// arguments, registers the `allreduce` benchmark, runs all registered
/// benchmarks and finalises the harness.
int main(int argc, char **argv) {
  bench::init(argc, argv);

  // NOTE(review): timing_max_rank() presumably makes the reported time the
  // maximum across ranks; confirm against bench/bench.hpp.
  bench::register_bench("allreduce", allreduce)->timing_max_rank();

  bench::run_benchmarks();
  bench::finalize();
}