Files
frontier-gpu-bandwidth/results/implicit_managed_GPURdHost_coarse.json
2023-10-10 13:23:18 -04:00

3195 lines
113 KiB
JSON

{
"context": {
"date": "2023-10-09T18:18:41-04:00",
"host_name": "frontier08444",
"executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope",
"num_cpus": 128,
"mhz_per_cpu": 1796,
"cpu_scaling_enabled": false,
"caches": [
{
"type": "Data",
"level": 1,
"size": 32768,
"num_sharing": 2
},
{
"type": "Instruction",
"level": 1,
"size": 32768,
"num_sharing": 2
},
{
"type": "Unified",
"level": 2,
"size": 524288,
"num_sharing": 2
},
{
"type": "Unified",
"level": 3,
"size": 33554432,
"num_sharing": 16
}
],
"load_avg": [2.44,2.61,4.37],
"library_build_type": "release"
},
"benchmarks": [
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 378,
"real_time": 1.8648067624968779e+06,
"cpu_time": 2.0648406243386250e+06,
"time_unit": "ns",
"bytes": 4.0960000000000000e+03,
"bytes_per_second": 2.1964742312043486e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 378,
"real_time": 1.8610708470097200e+06,
"cpu_time": 2.0649065132275133e+06,
"time_unit": "ns",
"bytes": 4.0960000000000000e+03,
"bytes_per_second": 2.2008834357817476e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 378,
"real_time": 1.8693731853904119e+06,
"cpu_time": 2.0691600449735466e+06,
"time_unit": "ns",
"bytes": 4.0960000000000000e+03,
"bytes_per_second": 2.1911087802110338e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 378,
"real_time": 1.8649951499937933e+06,
"cpu_time": 2.0646817010582001e+06,
"time_unit": "ns",
"bytes": 4.0960000000000000e+03,
"bytes_per_second": 2.1962523602346266e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 378,
"real_time": 1.8606357440129465e+06,
"cpu_time": 2.0647274232804223e+06,
"time_unit": "ns",
"bytes": 4.0960000000000000e+03,
"bytes_per_second": 2.2013981044811639e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8641763377807499e+06,
"cpu_time": 2.0656632613756615e+06,
"time_unit": "ns",
"bytes": 4.0960000000000000e+03,
"bytes_per_second": 2.1972233823825843e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_median",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8648067624968779e+06,
"cpu_time": 2.0648406243386250e+06,
"time_unit": "ns",
"bytes": 4.0960000000000000e+03,
"bytes_per_second": 2.1964742312043486e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.5445377342974380e+03,
"cpu_time": 1.9567925655588140e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 4.1748283407590170e+03,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.9013961621876993e-03,
"cpu_time": 9.4729504181415155e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.9000472934308547e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 378,
"real_time": 1.8644300473853331e+06,
"cpu_time": 2.0652232222222232e+06,
"time_unit": "ns",
"bytes": 8.1920000000000000e+03,
"bytes_per_second": 4.3938360741870785e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 378,
"real_time": 1.8596973342321464e+06,
"cpu_time": 2.0654901507936483e+06,
"time_unit": "ns",
"bytes": 8.1920000000000000e+03,
"bytes_per_second": 4.4050178753320677e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 378,
"real_time": 1.8637756724726709e+06,
"cpu_time": 2.0651562407407425e+06,
"time_unit": "ns",
"bytes": 8.1920000000000000e+03,
"bytes_per_second": 4.3953787577512879e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 378,
"real_time": 1.8601180756820005e+06,
"cpu_time": 2.0655041957671945e+06,
"time_unit": "ns",
"bytes": 8.1920000000000000e+03,
"bytes_per_second": 4.4040215011600563e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 378,
"real_time": 1.8597879068924128e+06,
"cpu_time": 2.0653520820105844e+06,
"time_unit": "ns",
"bytes": 8.1920000000000000e+03,
"bytes_per_second": 4.4048033486185586e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8615618073329129e+06,
"cpu_time": 2.0653451783068788e+06,
"time_unit": "ns",
"bytes": 8.1920000000000000e+03,
"bytes_per_second": 4.4006115114098107e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_median",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8601180756820005e+06,
"cpu_time": 2.0653520820105844e+06,
"time_unit": "ns",
"bytes": 8.1920000000000000e+03,
"bytes_per_second": 4.4040215011600563e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.3364151840360987e+03,
"cpu_time": 1.5566143114844516e+02,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 5.5205034343749221e+03,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 1,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.2550833256423086e-03,
"cpu_time": 7.5368240032425347e-05,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.2544855232190981e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 378,
"real_time": 1.8661257546761865e+06,
"cpu_time": 2.0682437222222215e+06,
"time_unit": "ns",
"bytes": 1.6384000000000000e+04,
"bytes_per_second": 8.7796869846228454e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 378,
"real_time": 1.8607013398121116e+06,
"cpu_time": 2.0675510740740723e+06,
"time_unit": "ns",
"bytes": 1.6384000000000000e+04,
"bytes_per_second": 8.8052819920333959e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 378,
"real_time": 1.8644182408352015e+06,
"cpu_time": 2.0674443941798911e+06,
"time_unit": "ns",
"bytes": 1.6384000000000000e+04,
"bytes_per_second": 8.7877277968812808e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 378,
"real_time": 1.8602370170892708e+06,
"cpu_time": 2.0676698439153426e+06,
"time_unit": "ns",
"bytes": 1.6384000000000000e+04,
"bytes_per_second": 8.8074798262192365e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 378,
"real_time": 1.8649194043107510e+06,
"cpu_time": 2.0673281957671980e+06,
"time_unit": "ns",
"bytes": 1.6384000000000000e+04,
"bytes_per_second": 8.7853662534308322e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8632803513447042e+06,
"cpu_time": 2.0676474460317451e+06,
"time_unit": "ns",
"bytes": 1.6384000000000000e+04,
"bytes_per_second": 8.7931085706375185e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_median",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8644182408352015e+06,
"cpu_time": 2.0675510740740721e+06,
"time_unit": "ns",
"bytes": 1.6384000000000000e+04,
"bytes_per_second": 8.7877277968812808e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.6453161960311218e+03,
"cpu_time": 3.5654077604780406e+02,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.2487597332891444e+04,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 2,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.4197091672876992e-03,
"cpu_time": 1.7243789637932789e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.4201573007514984e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 373,
"real_time": 1.8673966829986472e+06,
"cpu_time": 2.0710252091152796e+06,
"time_unit": "ns",
"bytes": 3.2768000000000000e+04,
"bytes_per_second": 1.7547423264874533e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 373,
"real_time": 1.8629985489489587e+06,
"cpu_time": 2.0714415656836429e+06,
"time_unit": "ns",
"bytes": 3.2768000000000000e+04,
"bytes_per_second": 1.7588848911603611e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 373,
"real_time": 1.8668703551473778e+06,
"cpu_time": 2.0712717050938394e+06,
"time_unit": "ns",
"bytes": 3.2768000000000000e+04,
"bytes_per_second": 1.7552370420180127e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 373,
"real_time": 1.8629668453583762e+06,
"cpu_time": 2.0713296139410157e+06,
"time_unit": "ns",
"bytes": 3.2768000000000000e+04,
"bytes_per_second": 1.7589148235054322e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 373,
"real_time": 1.8669835951671770e+06,
"cpu_time": 2.0712617372654155e+06,
"time_unit": "ns",
"bytes": 3.2768000000000000e+04,
"bytes_per_second": 1.7551305798734579e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8654432055241074e+06,
"cpu_time": 2.0712659662198387e+06,
"time_unit": "ns",
"bytes": 3.2768000000000000e+04,
"bytes_per_second": 1.7565819326089438e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_median",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8668703551473778e+06,
"cpu_time": 2.0712717050938394e+06,
"time_unit": "ns",
"bytes": 3.2768000000000000e+04,
"bytes_per_second": 1.7552370420180127e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.2546804640957052e+03,
"cpu_time": 1.5239833262983336e+02,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 2.1239882392859428e+04,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 3,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.2086567189067753e-03,
"cpu_time": 7.3577384611773328e-05,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.2091597891658334e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 374,
"real_time": 1.8696007620922059e+06,
"cpu_time": 2.0773643101604285e+06,
"time_unit": "ns",
"bytes": 6.5536000000000000e+04,
"bytes_per_second": 3.5053473088372581e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 374,
"real_time": 1.8651429145490467e+06,
"cpu_time": 2.0778865427807472e+06,
"time_unit": "ns",
"bytes": 6.5536000000000000e+04,
"bytes_per_second": 3.5137253820490889e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 374,
"real_time": 1.8698107834841886e+06,
"cpu_time": 2.0776337700534768e+06,
"time_unit": "ns",
"bytes": 6.5536000000000000e+04,
"bytes_per_second": 3.5049535802698068e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 374,
"real_time": 1.8655955613465335e+06,
"cpu_time": 2.0781554732620346e+06,
"time_unit": "ns",
"bytes": 6.5536000000000000e+04,
"bytes_per_second": 3.5128728518574513e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 374,
"real_time": 1.8700520591022831e+06,
"cpu_time": 2.0779550160427734e+06,
"time_unit": "ns",
"bytes": 6.5536000000000000e+04,
"bytes_per_second": 3.5045013683448203e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8680404161148514e+06,
"cpu_time": 2.0777990224598921e+06,
"time_unit": "ns",
"bytes": 6.5536000000000000e+04,
"bytes_per_second": 3.5082800982716851e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_median",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8696007620922059e+06,
"cpu_time": 2.0778865427807469e+06,
"time_unit": "ns",
"bytes": 6.5536000000000000e+04,
"bytes_per_second": 3.5053473088372581e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.4488986229735824e+03,
"cpu_time": 3.0632259272775588e+02,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 4.6013660108303709e+04,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 4,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.3109452032450128e-03,
"cpu_time": 1.4742647841132521e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.3115731589097412e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 377,
"real_time": 1.8790329355899051e+06,
"cpu_time": 2.0951603368700265e+06,
"time_unit": "ns",
"bytes": 1.3107200000000000e+05,
"bytes_per_second": 6.9755030642318755e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 377,
"real_time": 1.8700660362395651e+06,
"cpu_time": 2.0905375809018551e+06,
"time_unit": "ns",
"bytes": 1.3107200000000000e+05,
"bytes_per_second": 7.0089503504147366e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 377,
"real_time": 1.8762738437889593e+06,
"cpu_time": 2.0935442015915138e+06,
"time_unit": "ns",
"bytes": 1.3107200000000000e+05,
"bytes_per_second": 6.9857606571603835e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 377,
"real_time": 1.8711393336294247e+06,
"cpu_time": 2.0881779602122032e+06,
"time_unit": "ns",
"bytes": 1.3107200000000000e+05,
"bytes_per_second": 7.0049299720380172e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 377,
"real_time": 1.8759181648347680e+06,
"cpu_time": 2.0929391962864741e+06,
"time_unit": "ns",
"bytes": 1.3107200000000000e+05,
"bytes_per_second": 6.9870851755169660e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8744860628165249e+06,
"cpu_time": 2.0920718551724148e+06,
"time_unit": "ns",
"bytes": 1.3107200000000000e+05,
"bytes_per_second": 6.9924458438723966e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_median",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8759181648347680e+06,
"cpu_time": 2.0929391962864741e+06,
"time_unit": "ns",
"bytes": 1.3107200000000000e+05,
"bytes_per_second": 6.9870851755169660e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.7635873911800290e+03,
"cpu_time": 2.7374814741047749e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.4042243951733640e+05,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 5,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 2.0077969454331498e-03,
"cpu_time": 1.3085026058434160e-03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 2.0082020319169302e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 376,
"real_time": 1.8707361730853433e+06,
"cpu_time": 2.1079484680851074e+06,
"time_unit": "ns",
"bytes": 2.6214400000000000e+05,
"bytes_per_second": 1.4012879195448205e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 376,
"real_time": 1.8775200830745273e+06,
"cpu_time": 2.1113341223404217e+06,
"time_unit": "ns",
"bytes": 2.6214400000000000e+05,
"bytes_per_second": 1.3962247454137847e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 376,
"real_time": 1.8767804861628509e+06,
"cpu_time": 2.1109846648936118e+06,
"time_unit": "ns",
"bytes": 2.6214400000000000e+05,
"bytes_per_second": 1.3967749661334309e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 376,
"real_time": 1.8779481467410075e+06,
"cpu_time": 2.1113266888297824e+06,
"time_unit": "ns",
"bytes": 2.6214400000000000e+05,
"bytes_per_second": 1.3959064868480256e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 376,
"real_time": 1.8802115801589296e+06,
"cpu_time": 2.1133979148936248e+06,
"time_unit": "ns",
"bytes": 2.6214400000000000e+05,
"bytes_per_second": 1.3942260688440266e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8766392938445318e+06,
"cpu_time": 2.1109983718085098e+06,
"time_unit": "ns",
"bytes": 2.6214400000000000e+05,
"bytes_per_second": 1.3968840373568174e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_median",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8775200830745273e+06,
"cpu_time": 2.1113266888297824e+06,
"time_unit": "ns",
"bytes": 2.6214400000000000e+05,
"bytes_per_second": 1.3962247454137847e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.5396640042457839e+03,
"cpu_time": 1.9545094082364278e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 2.6391827494510490e+05,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 6,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.8861717410778162e-03,
"cpu_time": 9.2586969006611954e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.8893356061573357e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 372,
"real_time": 1.8965987688442443e+06,
"cpu_time": 2.1628780591397770e+06,
"time_unit": "ns",
"bytes": 5.2428800000000000e+05,
"bytes_per_second": 2.7643590653572577e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 372,
"real_time": 1.8908004268630838e+06,
"cpu_time": 2.1575007983870828e+06,
"time_unit": "ns",
"bytes": 5.2428800000000000e+05,
"bytes_per_second": 2.7728362684464562e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 372,
"real_time": 1.8904735761386673e+06,
"cpu_time": 2.1574215107526937e+06,
"time_unit": "ns",
"bytes": 5.2428800000000000e+05,
"bytes_per_second": 2.7733156740062428e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 372,
"real_time": 1.8929359388865673e+06,
"cpu_time": 2.1602722338709603e+06,
"time_unit": "ns",
"bytes": 5.2428800000000000e+05,
"bytes_per_second": 2.7697080985655987e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 372,
"real_time": 1.8956099455501453e+06,
"cpu_time": 2.1621238225806425e+06,
"time_unit": "ns",
"bytes": 5.2428800000000000e+05,
"bytes_per_second": 2.7658010617149442e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8932837312565416e+06,
"cpu_time": 2.1600392849462312e+06,
"time_unit": "ns",
"bytes": 5.2428800000000000e+05,
"bytes_per_second": 2.7692040336181003e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_median",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8929359388865673e+06,
"cpu_time": 2.1602722338709603e+06,
"time_unit": "ns",
"bytes": 5.2428800000000000e+05,
"bytes_per_second": 2.7697080985655987e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.7652070074181111e+03,
"cpu_time": 2.5374621677357186e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 4.0437214671636326e+05,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 7,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.4605349223504329e-03,
"cpu_time": 1.1747296382152985e-03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.4602468500236557e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 368,
"real_time": 1.9129451950151555e+06,
"cpu_time": 2.2381212608695687e+06,
"time_unit": "ns",
"bytes": 1.0485760000000000e+06,
"bytes_per_second": 5.4814743398421955e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 368,
"real_time": 1.9080894975480116e+06,
"cpu_time": 2.2350753315217514e+06,
"time_unit": "ns",
"bytes": 1.0485760000000000e+06,
"bytes_per_second": 5.4954235707888520e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 368,
"real_time": 1.9133664918626889e+06,
"cpu_time": 2.2379742201087065e+06,
"time_unit": "ns",
"bytes": 1.0485760000000000e+06,
"bytes_per_second": 5.4802673949787664e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 368,
"real_time": 1.9068620646145933e+06,
"cpu_time": 2.2342474755434897e+06,
"time_unit": "ns",
"bytes": 1.0485760000000000e+06,
"bytes_per_second": 5.4989609340827370e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 368,
"real_time": 1.9144548041367671e+06,
"cpu_time": 2.2388767500000121e+06,
"time_unit": "ns",
"bytes": 1.0485760000000000e+06,
"bytes_per_second": 5.4771520212137151e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.9111436106354434e+06,
"cpu_time": 2.2368590076087057e+06,
"time_unit": "ns",
"bytes": 1.0485760000000000e+06,
"bytes_per_second": 5.4866556521812534e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_median",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.9129451950151552e+06,
"cpu_time": 2.2379742201087065e+06,
"time_unit": "ns",
"bytes": 1.0485760000000000e+06,
"bytes_per_second": 5.4814743398421955e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.4208972766209326e+03,
"cpu_time": 2.0560804143502164e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 9.8268915304891812e+05,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 8,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.7899739494111097e-03,
"cpu_time": 9.1918194546747550e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.7910530846933033e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 358,
"real_time": 1.9595538810358574e+06,
"cpu_time": 2.4178605027932944e+06,
"time_unit": "ns",
"bytes": 2.0971520000000000e+06,
"bytes_per_second": 1.0702191046114055e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 358,
"real_time": 1.9586479721211062e+06,
"cpu_time": 2.4180118743016850e+06,
"time_unit": "ns",
"bytes": 2.0971520000000000e+06,
"bytes_per_second": 1.0707140996495156e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 358,
"real_time": 1.9581921079310498e+06,
"cpu_time": 2.4169702849161969e+06,
"time_unit": "ns",
"bytes": 2.0971520000000000e+06,
"bytes_per_second": 1.0709633602883681e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 358,
"real_time": 1.9597590383267102e+06,
"cpu_time": 2.4184585502793407e+06,
"time_unit": "ns",
"bytes": 2.0971520000000000e+06,
"bytes_per_second": 1.0701070687703520e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 358,
"real_time": 1.9560512782896571e+06,
"cpu_time": 2.4133920949720680e+06,
"time_unit": "ns",
"bytes": 2.0971520000000000e+06,
"bytes_per_second": 1.0721354921910428e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.9584408555408760e+06,
"cpu_time": 2.4169386614525169e+06,
"time_unit": "ns",
"bytes": 2.0971520000000000e+06,
"bytes_per_second": 1.0708278251021369e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_median",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.9586479721211065e+06,
"cpu_time": 2.4178605027932944e+06,
"time_unit": "ns",
"bytes": 2.0971520000000000e+06,
"bytes_per_second": 1.0707140996495156e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.4825049492010874e+03,
"cpu_time": 2.0549192909473395e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 8.1106824719008699e+05,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 9,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 7.5698224176989697e-04,
"cpu_time": 8.5021573932388779e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 7.5742171446910832e-04,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 336,
"real_time": 2.0886270867777055e+06,
"cpu_time": 2.7940279970238050e+06,
"time_unit": "ns",
"bytes": 4.1943040000000000e+06,
"bytes_per_second": 2.0081631740546336e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 336,
"real_time": 2.0956166283992517e+06,
"cpu_time": 2.8003795238095312e+06,
"time_unit": "ns",
"bytes": 4.1943040000000000e+06,
"bytes_per_second": 2.0014653172531095e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 336,
"real_time": 2.0893180165633871e+06,
"cpu_time": 2.7943975624999949e+06,
"time_unit": "ns",
"bytes": 4.1943040000000000e+06,
"bytes_per_second": 2.0074990818769646e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 336,
"real_time": 2.0890575258471514e+06,
"cpu_time": 2.7932564940476129e+06,
"time_unit": "ns",
"bytes": 4.1943040000000000e+06,
"bytes_per_second": 2.0077494028313711e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 336,
"real_time": 2.0892365670685347e+06,
"cpu_time": 2.7945561309523741e+06,
"time_unit": "ns",
"bytes": 4.1943040000000000e+06,
"bytes_per_second": 2.0075773448121979e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.0903711649312060e+06,
"cpu_time": 2.7953235416666637e+06,
"time_unit": "ns",
"bytes": 4.1943040000000000e+06,
"bytes_per_second": 2.0064908641656556e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_median",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.0892365670685344e+06,
"cpu_time": 2.7943975624999953e+06,
"time_unit": "ns",
"bytes": 4.1943040000000000e+06,
"bytes_per_second": 2.0075773448121979e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.9444344550504084e+03,
"cpu_time": 2.8705589101259984e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 2.8210638441552506e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 10,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.4085701642116313e-03,
"cpu_time": 1.0269147264486160e-03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.4059689453549110e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 314,
"real_time": 2.2262953485771539e+06,
"cpu_time": 3.4548329394904450e+06,
"time_unit": "ns",
"bytes": 8.3886080000000000e+06,
"bytes_per_second": 3.7679672669492111e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 314,
"real_time": 2.2315106860356061e+06,
"cpu_time": 3.4576669777069935e+06,
"time_unit": "ns",
"bytes": 8.3886080000000000e+06,
"bytes_per_second": 3.7591610259786811e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 314,
"real_time": 2.2233449883616655e+06,
"cpu_time": 3.4526648312101783e+06,
"time_unit": "ns",
"bytes": 8.3886080000000000e+06,
"bytes_per_second": 3.7729673280174947e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 314,
"real_time": 2.2301369407481165e+06,
"cpu_time": 3.4567410382165671e+06,
"time_unit": "ns",
"bytes": 8.3886080000000000e+06,
"bytes_per_second": 3.7614766370292840e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 314,
"real_time": 2.2248323816972175e+06,
"cpu_time": 3.4547048025477692e+06,
"time_unit": "ns",
"bytes": 8.3886080000000000e+06,
"bytes_per_second": 3.7704449418345551e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.2272240690839519e+06,
"cpu_time": 3.4553221178343915e+06,
"time_unit": "ns",
"bytes": 8.3886080000000000e+06,
"bytes_per_second": 3.7664034399618454e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_median",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.2262953485771539e+06,
"cpu_time": 3.4548329394904450e+06,
"time_unit": "ns",
"bytes": 8.3886080000000000e+06,
"bytes_per_second": 3.7679672669492111e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.4817331819845081e+03,
"cpu_time": 1.9489259017035881e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 5.8862098602615250e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 11,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.5632612947724341e-03,
"cpu_time": 5.6403595243533161e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.5628197972124712e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 210,
"real_time": 3.3295433059157361e+06,
"cpu_time": 5.6089175809523864e+06,
"time_unit": "ns",
"bytes": 1.6777216000000000e+07,
"bytes_per_second": 5.0388940639970751e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 210,
"real_time": 3.3301346103793806e+06,
"cpu_time": 5.6104858523809751e+06,
"time_unit": "ns",
"bytes": 1.6777216000000000e+07,
"bytes_per_second": 5.0379993492481318e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 210,
"real_time": 3.3388836131918998e+06,
"cpu_time": 5.6174360714285923e+06,
"time_unit": "ns",
"bytes": 1.6777216000000000e+07,
"bytes_per_second": 5.0247980893114595e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 210,
"real_time": 3.3304111100733280e+06,
"cpu_time": 5.6087122380952379e+06,
"time_unit": "ns",
"bytes": 1.6777216000000000e+07,
"bytes_per_second": 5.0375810809827032e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 210,
"real_time": 3.3314077083819681e+06,
"cpu_time": 5.6085922047619047e+06,
"time_unit": "ns",
"bytes": 1.6777216000000000e+07,
"bytes_per_second": 5.0360740769698610e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.3320760695884628e+06,
"cpu_time": 5.6108287895238195e+06,
"time_unit": "ns",
"bytes": 1.6777216000000000e+07,
"bytes_per_second": 5.0350693321018467e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_median",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.3304111100733280e+06,
"cpu_time": 5.6089175809523864e+06,
"time_unit": "ns",
"bytes": 1.6777216000000000e+07,
"bytes_per_second": 5.0375810809827032e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 3.8647639797008828e+03,
"cpu_time": 3.7718894345740910e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 5.8316035034491159e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 12,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.1598666714047170e-03,
"cpu_time": 6.7225174320355698e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.1581972598210008e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 104,
"real_time": 6.6526710243824013e+06,
"cpu_time": 1.0952665192307701e+07,
"time_unit": "ns",
"bytes": 3.3554432000000000e+07,
"bytes_per_second": 5.0437533852224445e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 104,
"real_time": 6.6722296402216535e+06,
"cpu_time": 1.0970076971153922e+07,
"time_unit": "ns",
"bytes": 3.3554432000000000e+07,
"bytes_per_second": 5.0289683972695694e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 104,
"real_time": 6.6576325200283183e+06,
"cpu_time": 1.0960438711538408e+07,
"time_unit": "ns",
"bytes": 3.3554432000000000e+07,
"bytes_per_second": 5.0399946075511656e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 104,
"real_time": 6.6694835012850277e+06,
"cpu_time": 1.0967630932692228e+07,
"time_unit": "ns",
"bytes": 3.3554432000000000e+07,
"bytes_per_second": 5.0310390592517357e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 104,
"real_time": 6.6715926558782272e+06,
"cpu_time": 1.0977876605769219e+07,
"time_unit": "ns",
"bytes": 3.3554432000000000e+07,
"bytes_per_second": 5.0294485486064196e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 6.6647218683591262e+06,
"cpu_time": 1.0965737682692297e+07,
"time_unit": "ns",
"bytes": 3.3554432000000000e+07,
"bytes_per_second": 5.0346407995802670e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_median",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 6.6694835012850286e+06,
"cpu_time": 1.0967630932692230e+07,
"time_unit": "ns",
"bytes": 3.3554432000000000e+07,
"bytes_per_second": 5.0310390592517357e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 8.9684057659686623e+03,
"cpu_time": 9.6012547801365145e+03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 6.7788389201927492e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 13,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.3456534185689450e-03,
"cpu_time": 8.7556852607285993e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.3464394363065374e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 52,
"real_time": 1.3572544647523990e+07,
"cpu_time": 2.2267987884615462e+07,
"time_unit": "ns",
"bytes": 6.7108864000000000e+07,
"bytes_per_second": 4.9444570449243298e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 52,
"real_time": 1.3253713814684978e+07,
"cpu_time": 2.1369407249999847e+07,
"time_unit": "ns",
"bytes": 6.7108864000000000e+07,
"bytes_per_second": 5.0634007145713434e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 52,
"real_time": 1.3583027883074604e+07,
"cpu_time": 2.2290338423076969e+07,
"time_unit": "ns",
"bytes": 6.7108864000000000e+07,
"bytes_per_second": 4.9406409658940849e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 52,
"real_time": 1.3578680039455112e+07,
"cpu_time": 2.2278848615384616e+07,
"time_unit": "ns",
"bytes": 6.7108864000000000e+07,
"bytes_per_second": 4.9422229410372763e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 52,
"real_time": 1.3542058143334894e+07,
"cpu_time": 2.2242661134615269e+07,
"time_unit": "ns",
"bytes": 6.7108864000000000e+07,
"bytes_per_second": 4.9555882340550671e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.3506004905614719e+07,
"cpu_time": 2.2089848661538433e+07,
"time_unit": "ns",
"bytes": 6.7108864000000000e+07,
"bytes_per_second": 4.9692619800964203e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_median",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.3572544647523990e+07,
"cpu_time": 2.2267987884615462e+07,
"time_unit": "ns",
"bytes": 6.7108864000000000e+07,
"bytes_per_second": 4.9444570449243298e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.4194398710524556e+05,
"cpu_time": 4.0312472921602387e+05,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 5.2949574019689336e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 14,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.0509694620815413e-02,
"cpu_time": 1.8249320554102361e-02,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.0655420107003885e-02,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 27,
"real_time": 2.6283959961599775e+07,
"cpu_time": 4.2580222370370246e+07,
"time_unit": "ns",
"bytes": 1.3421772800000000e+08,
"bytes_per_second": 5.1064500248854752e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 27,
"real_time": 2.6292765857996766e+07,
"cpu_time": 4.2623691592592858e+07,
"time_unit": "ns",
"bytes": 1.3421772800000000e+08,
"bytes_per_second": 5.1047397875480108e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 27,
"real_time": 2.6265470380032506e+07,
"cpu_time": 4.2567152296295829e+07,
"time_unit": "ns",
"bytes": 1.3421772800000000e+08,
"bytes_per_second": 5.1100447110985222e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 27,
"real_time": 2.6286946609616280e+07,
"cpu_time": 4.2653314962963045e+07,
"time_unit": "ns",
"bytes": 1.3421772800000000e+08,
"bytes_per_second": 5.1058698445752745e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 27,
"real_time": 2.6110613235720880e+07,
"cpu_time": 4.1675103074074067e+07,
"time_unit": "ns",
"bytes": 1.3421772800000000e+08,
"bytes_per_second": 5.1403514267670326e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.6247951208993241e+07,
"cpu_time": 4.2419896859259203e+07,
"time_unit": "ns",
"bytes": 1.3421772800000000e+08,
"bytes_per_second": 5.1134911589748640e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_median",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 2.6283959961599775e+07,
"cpu_time": 4.2580222370370239e+07,
"time_unit": "ns",
"bytes": 1.3421772800000000e+08,
"bytes_per_second": 5.1064500248854752e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 7.7450410836494513e+04,
"cpu_time": 4.1776863219146163e+05,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.5145960625666501e+07,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 15,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 2.9507221428374934e-03,
"cpu_time": 9.8484122575199801e-03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 2.9619608511659017e-03,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 10,
"real_time": 5.1235353946685791e+07,
"cpu_time": 8.1178326299999520e+07,
"time_unit": "ns",
"bytes": 2.6843545600000000e+08,
"bytes_per_second": 5.2392622539375277e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 10,
"real_time": 5.1293835416436195e+07,
"cpu_time": 8.1084651799999103e+07,
"time_unit": "ns",
"bytes": 2.6843545600000000e+08,
"bytes_per_second": 5.2332888313121662e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 10,
"real_time": 4.7543637081980705e+07,
"cpu_time": 7.9450426600000411e+07,
"time_unit": "ns",
"bytes": 2.6843545600000000e+08,
"bytes_per_second": 5.6460858376722403e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 10,
"real_time": 5.1264522597193718e+07,
"cpu_time": 8.1066110899999440e+07,
"time_unit": "ns",
"bytes": 2.6843545600000000e+08,
"bytes_per_second": 5.2362812018987665e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 10,
"real_time": 5.1219387352466583e+07,
"cpu_time": 8.1066656000000134e+07,
"time_unit": "ns",
"bytes": 2.6843545600000000e+08,
"bytes_per_second": 5.2408954865617485e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 5.0511347278952599e+07,
"cpu_time": 8.0769234319999725e+07,
"time_unit": "ns",
"bytes": 2.6843545600000000e+08,
"bytes_per_second": 5.3191627222764902e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_median",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 5.1235353946685791e+07,
"cpu_time": 8.1066656000000134e+07,
"time_unit": "ns",
"bytes": 2.6843545600000000e+08,
"bytes_per_second": 5.2392622539375277e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.6592446292773630e+06,
"cpu_time": 7.3869709566962335e+05,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.8277871865779036e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 16,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 3.2848948180179464e-02,
"cpu_time": 9.1457731633678551e-03,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 3.4362310047842438e-02,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 8,
"real_time": 1.0126967169344425e+08,
"cpu_time": 1.5925211775000036e+08,
"time_unit": "ns",
"bytes": 5.3687091200000000e+08,
"bytes_per_second": 5.3013987605803070e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 8,
"real_time": 8.9620835147798061e+07,
"cpu_time": 1.5567606137500077e+08,
"time_unit": "ns",
"bytes": 5.3687091200000000e+08,
"bytes_per_second": 5.9904698624446001e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 8,
"real_time": 1.0153957735747099e+08,
"cpu_time": 1.5948143000000137e+08,
"time_unit": "ns",
"bytes": 5.3687091200000000e+08,
"bytes_per_second": 5.2873069395388670e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 8,
"real_time": 8.9733739383518696e+07,
"cpu_time": 1.5653525349999952e+08,
"time_unit": "ns",
"bytes": 5.3687091200000000e+08,
"bytes_per_second": 5.9829325701610794e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 8,
"real_time": 1.0150537919253111e+08,
"cpu_time": 1.5931481287499949e+08,
"time_unit": "ns",
"bytes": 5.3687091200000000e+08,
"bytes_per_second": 5.2890882854758463e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 9.6733840554952621e+07,
"cpu_time": 1.5805193510000032e+08,
"time_unit": "ns",
"bytes": 5.3687091200000000e+08,
"bytes_per_second": 5.5702392836401405e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_median",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.0126967169344425e+08,
"cpu_time": 1.5925211775000036e+08,
"time_unit": "ns",
"bytes": 5.3687091200000000e+08,
"bytes_per_second": 5.3013987605803070e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 6.4426840997056458e+06,
"cpu_time": 1.8044288133633323e+06,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 3.8022404909745514e+08,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 17,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 6.6602174200306688e-02,
"cpu_time": 1.1416682827841749e-02,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 6.8259913037161210e-02,
"dst_gpu": NaN,
"src_numa": NaN
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 0,
"threads": 1,
"iterations": 4,
"real_time": 1.8767516687512398e+08,
"cpu_time": 2.8531457724999851e+08,
"time_unit": "ns",
"bytes": 1.0737418240000000e+09,
"bytes_per_second": 5.7212781098228645e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 1,
"threads": 1,
"iterations": 4,
"real_time": 1.8765720352530479e+08,
"cpu_time": 2.8563844199999976e+08,
"time_unit": "ns",
"bytes": 1.0737418240000000e+09,
"bytes_per_second": 5.7218257750239277e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 2,
"threads": 1,
"iterations": 4,
"real_time": 1.8773095682263374e+08,
"cpu_time": 2.8582995374999952e+08,
"time_unit": "ns",
"bytes": 1.0737418240000000e+09,
"bytes_per_second": 5.7195778585119562e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 3,
"threads": 1,
"iterations": 4,
"real_time": 1.8751276284456253e+08,
"cpu_time": 2.8545517099999887e+08,
"time_unit": "ns",
"bytes": 1.0737418240000000e+09,
"bytes_per_second": 5.7262332851981449e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "iteration",
"repetitions": 5,
"repetition_index": 4,
"threads": 1,
"iterations": 4,
"real_time": 1.8726067990064621e+08,
"cpu_time": 2.8510142275000304e+08,
"time_unit": "ns",
"bytes": 1.0737418240000000e+09,
"bytes_per_second": 5.7339417146711674e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8756735399365425e+08,
"cpu_time": 2.8546791334999996e+08,
"time_unit": "ns",
"bytes": 1.0737418240000000e+09,
"bytes_per_second": 5.7245713486456118e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_median",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8765720352530479e+08,
"cpu_time": 2.8545517099999887e+08,
"time_unit": "ns",
"bytes": 1.0737418240000000e+09,
"bytes_per_second": 5.7218257750239277e+09,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 5,
"real_time": 1.8940144816571317e+05,
"cpu_time": 2.8202081426441885e+05,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 5.7854198794970792e+06,
"dst_gpu": 0.0000000000000000e+00,
"src_numa": 0.0000000000000000e+00
},
{
"name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 18,
"run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time",
"run_type": "aggregate",
"repetitions": 5,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 5,
"real_time": 1.0097783230024185e-03,
"cpu_time": 9.8792474066479495e-04,
"time_unit": "ns",
"bytes": 0.0000000000000000e+00,
"bytes_per_second": 1.0106293601993210e-03,
"dst_gpu": NaN,
"src_numa": NaN
}
]
}